diff --git "a/data/benchmarks/hfopenllm_v2.json" "b/data/benchmarks/hfopenllm_v2.json" new file mode 100644--- /dev/null +++ "b/data/benchmarks/hfopenllm_v2.json" @@ -0,0 +1,58452 @@ +{ + "models": [ + { + "model_id": "0-hero/Matter-0.2-7B-DPO", + "name": "Matter-0.2-7B-DPO", + "developer": "0-hero", + "scores": { + "IFEval": 0.3303, + "BBH": 0.3596, + "MATH Level 5": 0.0144, + "GPQA": 0.2592, + "MUSR": 0.3814, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "01-ai/Yi-1.5-34B", + "name": "Yi-1.5-34B", + "developer": "01-ai", + "scores": { + "IFEval": 0.2841, + "BBH": 0.5976, + "MATH Level 5": 0.1533, + "GPQA": 0.3658, + "MUSR": 0.4236, + "MMLU-PRO": 0.4666 + } + }, + { + "model_id": "01-ai/Yi-1.5-34B-32K", + "name": "Yi-1.5-34B-32K", + "developer": "01-ai", + "scores": { + "IFEval": 0.3119, + "BBH": 0.6016, + "MATH Level 5": 0.1541, + "GPQA": 0.3633, + "MUSR": 0.4398, + "MMLU-PRO": 0.4709 + } + }, + { + "model_id": "01-ai/Yi-1.5-34B-Chat", + "name": "Yi-1.5-34B-Chat", + "developer": "01-ai", + "scores": { + "IFEval": 0.6067, + "BBH": 0.6084, + "MATH Level 5": 0.2772, + "GPQA": 0.3649, + "MUSR": 0.4282, + "MMLU-PRO": 0.452 + } + }, + { + "model_id": "01-ai/Yi-1.5-34B-Chat-16K", + "name": "Yi-1.5-34B-Chat-16K", + "developer": "01-ai", + "scores": { + "IFEval": 0.4564, + "BBH": 0.61, + "MATH Level 5": 0.2137, + "GPQA": 0.3381, + "MUSR": 0.4398, + "MMLU-PRO": 0.4545 + } + }, + { + "model_id": "01-ai/Yi-1.5-6B", + "name": "Yi-1.5-6B", + "developer": "01-ai", + "scores": { + "IFEval": 0.2617, + "BBH": 0.4493, + "MATH Level 5": 0.0665, + "GPQA": 0.3138, + "MUSR": 0.4374, + "MMLU-PRO": 0.3144 + } + }, + { + "model_id": "01-ai/Yi-1.5-6B-Chat", + "name": "Yi-1.5-6B-Chat", + "developer": "01-ai", + "scores": { + "IFEval": 0.5145, + "BBH": 0.4571, + "MATH Level 5": 0.1624, + "GPQA": 0.302, + "MUSR": 0.4392, + "MMLU-PRO": 0.3193 + } + }, + { + "model_id": "01-ai/Yi-1.5-9B", + "name": "Yi-1.5-9B", + "developer": "01-ai", + "scores": { + "IFEval": 0.2936, + "BBH": 0.5143, + "MATH Level 5": 0.114, + "GPQA": 0.3792, + "MUSR": 0.4328, + "MMLU-PRO": 0.3916 + } + }, + { + "model_id": "01-ai/Yi-1.5-9B-32K", + "name": "Yi-1.5-9B-32K", + "developer": "01-ai", + "scores": { + "IFEval": 0.2303, + "BBH": 0.4963, + "MATH Level 5": 0.108, + "GPQA": 0.3591, + "MUSR": 0.4186, + "MMLU-PRO": 0.3765 + } + }, + { + "model_id": "01-ai/Yi-1.5-9B-Chat", + "name": "Yi-1.5-9B-Chat", + "developer": "01-ai", + "scores": { + "IFEval": 0.6046, + "BBH": 0.5559, + "MATH Level 5": 0.2258, + "GPQA": 0.3347, + "MUSR": 0.4259, + "MMLU-PRO": 0.3975 + } + }, + { + "model_id": "01-ai/Yi-1.5-9B-Chat-16K", + "name": "Yi-1.5-9B-Chat-16K", + "developer": "01-ai", + "scores": { + "IFEval": 0.4214, + "BBH": 0.5153, + "MATH Level 5": 0.1782, + "GPQA": 0.3087, + "MUSR": 0.4099, + "MMLU-PRO": 0.3994 + } + }, + { + "model_id": "01-ai/Yi-34B", + "name": "Yi-34B", + "developer": "01-ai", + "scores": { + "IFEval": 0.3046, + "BBH": 0.5457, + "MATH Level 5": 0.0514, + "GPQA": 0.3666, + "MUSR": 0.4119, + "MMLU-PRO": 0.4412 + } + }, + { + "model_id": "01-ai/Yi-34B-200K", + "name": "Yi-34B-200K", + "developer": "01-ai", + "scores": { + "IFEval": 0.1542, + "BBH": 0.5442, + "MATH Level 5": 0.0574, + "GPQA": 0.3565, + "MUSR": 0.3817, + "MMLU-PRO": 0.4535 + } + }, + { + "model_id": "01-ai/Yi-34B-Chat", + "name": "Yi-34B-Chat", + "developer": "01-ai", + "scores": { + "IFEval": 0.4699, + "BBH": 0.5561, + "MATH Level 5": 0.0627, + "GPQA": 0.3381, + "MUSR": 0.3978, + "MMLU-PRO": 0.4093 + } + }, + { + "model_id": "01-ai/Yi-6B", + "name": "Yi-6B", + "developer": "01-ai", + "scores": { + "IFEval": 0.2893, + "BBH": 0.4309, + "MATH Level 5": 0.0159, + "GPQA": 0.2693, + "MUSR": 0.3937, + "MMLU-PRO": 0.2991 + } + }, + { + "model_id": "01-ai/Yi-6B-200K", + "name": "Yi-6B-200K", + "developer": "01-ai", + "scores": { + "IFEval": 0.0843, + "BBH": 0.4289, + "MATH Level 5": 0.0181, + "GPQA": 0.2819, + "MUSR": 0.4587, + "MMLU-PRO": 0.2844 + } + }, + { + "model_id": "01-ai/Yi-6B-Chat", + "name": "Yi-6B-Chat", + "developer": "01-ai", + "scores": { + "IFEval": 0.3395, + "BBH": 0.4133, + "MATH Level 5": 0.0136, + "GPQA": 0.2945, + "MUSR": 0.3688, + "MMLU-PRO": 0.3061 + } + }, + { + "model_id": "01-ai/Yi-9B", + "name": "Yi-9B", + "developer": "01-ai", + "scores": { + "IFEval": 0.2709, + "BBH": 0.494, + "MATH Level 5": 0.0559, + "GPQA": 0.318, + "MUSR": 0.4054, + "MMLU-PRO": 0.3574 + } + }, + { + "model_id": "01-ai/Yi-9B-200K", + "name": "Yi-9B-200K", + "developer": "01-ai", + "scores": { + "IFEval": 0.2327, + "BBH": 0.4793, + "MATH Level 5": 0.0665, + "GPQA": 0.3154, + "MUSR": 0.4294, + "MMLU-PRO": 0.3622 + } + }, + { + "model_id": "01-ai/Yi-Coder-9B-Chat", + "name": "Yi-Coder-9B-Chat", + "developer": "01-ai", + "scores": { + "IFEval": 0.4817, + "BBH": 0.4814, + "MATH Level 5": 0.04, + "GPQA": 0.2475, + "MUSR": 0.3992, + "MMLU-PRO": 0.2425 + } + }, + { + "model_id": "1-800-LLMs/Qwen-2.5-14B-Hindi", + "name": "Qwen-2.5-14B-Hindi", + "developer": "1-800-LLMs", + "scores": { + "IFEval": 0.5826, + "BBH": 0.6524, + "MATH Level 5": 0.3331, + "GPQA": 0.3624, + "MUSR": 0.4489, + "MMLU-PRO": 0.5263 + } + }, + { + "model_id": "1-800-LLMs/Qwen-2.5-14B-Hindi-Custom-Instruct", + "name": "Qwen-2.5-14B-Hindi-Custom-Instruct", + "developer": "1-800-LLMs", + "scores": { + "IFEval": 0.3077, + "BBH": 0.6284, + "MATH Level 5": 0.3112, + "GPQA": 0.37, + "MUSR": 0.4491, + "MMLU-PRO": 0.5164 + } + }, + { + "model_id": "1024m/PHI-4-Hindi", + "name": "PHI-4-Hindi", + "developer": "1024m", + "scores": { + "IFEval": 0.0082, + "BBH": 0.671, + "MATH Level 5": 0.2334, + "GPQA": 0.3977, + "MUSR": 0.4914, + "MMLU-PRO": 0.5239 + } + }, + { + "model_id": "1024m/QWEN-14B-B100", + "name": "QWEN-14B-B100", + "developer": "1024m", + "scores": { + "IFEval": 0.7762, + "BBH": 0.6533, + "MATH Level 5": 0.5438, + "GPQA": 0.3507, + "MUSR": 0.41, + "MMLU-PRO": 0.5179 + } + }, + { + "model_id": "152334H/miqu-1-70b-sf", + "name": "miqu-1-70b-sf", + "developer": "152334H", + "scores": { + "IFEval": 0.5182, + "BBH": 0.6102, + "MATH Level 5": 0.1246, + "GPQA": 0.3507, + "MUSR": 0.4582, + "MMLU-PRO": 0.4228 + } + }, + { + "model_id": "1TuanPham/T-VisStar-7B-v0.1", + "name": "T-VisStar-7B-v0.1", + "developer": "1TuanPham", + "scores": { + "IFEval": 0.3607, + "BBH": 0.5052, + "MATH Level 5": 0.0574, + "GPQA": 0.2852, + "MUSR": 0.4375, + "MMLU-PRO": 0.3211 + } + }, + { + "model_id": "1TuanPham/T-VisStar-v0.1", + "name": "T-VisStar-v0.1", + "developer": "1TuanPham", + "scores": { + "IFEval": 0.3607, + "BBH": 0.5052, + "MATH Level 5": 0.0574, + "GPQA": 0.2852, + "MUSR": 0.4375, + "MMLU-PRO": 0.3211 + } + }, + { + "model_id": "3rd-Degree-Burn/L-3.1-Science-Writer-8B", + "name": "L-3.1-Science-Writer-8B", + "developer": "3rd-Degree-Burn", + "scores": { + "IFEval": 0.4263, + "BBH": 0.5041, + "MATH Level 5": 0.1035, + "GPQA": 0.2743, + "MUSR": 0.3959, + "MMLU-PRO": 0.3649 + } + }, + { + "model_id": "3rd-Degree-Burn/Llama-3.1-8B-Squareroot", + "name": "Llama-3.1-8B-Squareroot", + "developer": "3rd-Degree-Burn", + "scores": { + "IFEval": 0.2213, + "BBH": 0.3461, + "MATH Level 5": 0.2659, + "GPQA": 0.2567, + "MUSR": 0.3089, + "MMLU-PRO": 0.175 + } + }, + { + "model_id": "3rd-Degree-Burn/Llama-3.1-8B-Squareroot-v1", + "name": "Llama-3.1-8B-Squareroot-v1", + "developer": "3rd-Degree-Burn", + "scores": { + "IFEval": 0.2892, + "BBH": 0.3343, + "MATH Level 5": 0.0884, + "GPQA": 0.2559, + "MUSR": 0.3341, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "3rd-Degree-Burn/Llama-Squared-8B", + "name": "Llama-Squared-8B", + "developer": "3rd-Degree-Burn", + "scores": { + "IFEval": 0.2755, + "BBH": 0.4431, + "MATH Level 5": 0.0574, + "GPQA": 0.2718, + "MUSR": 0.3089, + "MMLU-PRO": 0.2366 + } + }, + { + "model_id": "4season/final_model_test_v2", + "name": "final_model_test_v2", + "developer": "4season", + "scores": { + "IFEval": 0.3191, + "BBH": 0.6342, + "MATH Level 5": 0.0838, + "GPQA": 0.3272, + "MUSR": 0.4314, + "MMLU-PRO": 0.3528 + } + }, + { + "model_id": "AALF/FuseChat-Llama-3.1-8B-Instruct-preview", + "name": "FuseChat-Llama-3.1-8B-Instruct-preview", + "developer": "AALF", + "scores": { + "IFEval": 0.719, + "BBH": 0.512, + "MATH Level 5": 0.2477, + "GPQA": 0.3054, + "MUSR": 0.382, + "MMLU-PRO": 0.3733 + } + }, + { + "model_id": "AALF/FuseChat-Llama-3.1-8B-SFT-preview", + "name": "FuseChat-Llama-3.1-8B-SFT-preview", + "developer": "AALF", + "scores": { + "IFEval": 0.7281, + "BBH": 0.524, + "MATH Level 5": 0.2251, + "GPQA": 0.3045, + "MUSR": 0.402, + "MMLU-PRO": 0.3743 + } + }, + { + "model_id": "AALF/gemma-2-27b-it-SimPO-37K", + "name": "gemma-2-27b-it-SimPO-37K", + "developer": "AALF", + "scores": { + "IFEval": 0.2407, + "BBH": 0.3911, + "MATH Level 5": 0.0128, + "GPQA": 0.2802, + "MUSR": 0.3488, + "MMLU-PRO": 0.1971 + } + }, + { + "model_id": "AALF/gemma-2-27b-it-SimPO-37K-100steps", + "name": "gemma-2-27b-it-SimPO-37K-100steps", + "developer": "AALF", + "scores": { + "IFEval": 0.2568, + "BBH": 0.3931, + "MATH Level 5": 0.0211, + "GPQA": 0.2886, + "MUSR": 0.3329, + "MMLU-PRO": 0.2125 + } + }, + { + "model_id": "AELLM/gemma-2-aeria-infinity-9b", + "name": "gemma-2-aeria-infinity-9b", + "developer": "AELLM", + "scores": { + "IFEval": 0.7594, + "BBH": 0.5983, + "MATH Level 5": 0.2145, + "GPQA": 0.3339, + "MUSR": 0.402, + "MMLU-PRO": 0.3862 + } + }, + { + "model_id": "AELLM/gemma-2-lyco-infinity-9b", + "name": "gemma-2-lyco-infinity-9b", + "developer": "AELLM", + "scores": { + "IFEval": 0.7316, + "BBH": 0.584, + "MATH Level 5": 0.1707, + "GPQA": 0.328, + "MUSR": 0.4006, + "MMLU-PRO": 0.3787 + } + }, + { + "model_id": "AGI-0/Art-v0-3B", + "name": "Art-v0-3B", + "developer": "AGI-0", + "scores": { + "IFEval": 0.3192, + "BBH": 0.3401, + "MATH Level 5": 0.2462, + "GPQA": 0.2592, + "MUSR": 0.3768, + "MMLU-PRO": 0.1179 + } + }, + { + "model_id": "AGI-0/Artificium-llama3.1-8B-001", + "name": "Artificium-llama3.1-8B-001", + "developer": "AGI-0", + "scores": { + "IFEval": 0.5248, + "BBH": 0.4256, + "MATH Level 5": 0.136, + "GPQA": 0.2659, + "MUSR": 0.3795, + "MMLU-PRO": 0.3182 + } + }, + { + "model_id": "AGI-0/smartllama3.1-8B-001", + "name": "smartllama3.1-8B-001", + "developer": "AGI-0", + "scores": { + "IFEval": 0.3518, + "BBH": 0.467, + "MATH Level 5": 0.1299, + "GPQA": 0.3062, + "MUSR": 0.4386, + "MMLU-PRO": 0.3487 + } + }, + { + "model_id": "AI-MO/NuminaMath-7B-CoT", + "name": "NuminaMath-7B-CoT", + "developer": "AI-MO", + "scores": { + "IFEval": 0.2689, + "BBH": 0.4314, + "MATH Level 5": 0.2696, + "GPQA": 0.2659, + "MUSR": 0.3303, + "MMLU-PRO": 0.2868 + } + }, + { + "model_id": "AI-MO/NuminaMath-7B-TIR", + "name": "NuminaMath-7B-TIR", + "developer": "AI-MO", + "scores": { + "IFEval": 0.2756, + "BBH": 0.4144, + "MATH Level 5": 0.1609, + "GPQA": 0.2584, + "MUSR": 0.3509, + "MMLU-PRO": 0.2733 + } + }, + { + "model_id": "AI-Sweden-Models/Llama-3-8B-instruct", + "name": "Llama-3-8B-instruct", + "developer": "AI-Sweden-Models", + "scores": { + "IFEval": 0.2401, + "BBH": 0.4173, + "MATH Level 5": 0.0385, + "GPQA": 0.2659, + "MUSR": 0.4771, + "MMLU-PRO": 0.2597 + } + }, + { + "model_id": "AI-Sweden-Models/gpt-sw3-40b", + "name": "gpt-sw3-40b", + "developer": "AI-Sweden-Models", + "scores": { + "IFEval": 0.147, + "BBH": 0.3268, + "MATH Level 5": 0.0174, + "GPQA": 0.2349, + "MUSR": 0.3632, + "MMLU-PRO": 0.1276 + } + }, + { + "model_id": "AI4free/Dhanishtha", + "name": "Dhanishtha", + "developer": "AI4free", + "scores": { + "IFEval": 0.2451, + "BBH": 0.3404, + "MATH Level 5": 0.256, + "GPQA": 0.2525, + "MUSR": 0.3569, + "MMLU-PRO": 0.1643 + } + }, + { + "model_id": "AI4free/t2", + "name": "t2", + "developer": "AI4free", + "scores": { + "IFEval": 0.3867, + "BBH": 0.291, + "MATH Level 5": 0.1896, + "GPQA": 0.2576, + "MUSR": 0.3846, + "MMLU-PRO": 0.1144 + } + }, + { + "model_id": "AIDC-AI/Marco-o1", + "name": "Marco-o1", + "developer": "AIDC-AI", + "scores": { + "IFEval": 0.4771, + "BBH": 0.5364, + "MATH Level 5": 0.3746, + "GPQA": 0.2592, + "MUSR": 0.4138, + "MMLU-PRO": 0.4117 + } + }, + { + "model_id": "Aashraf995/Creative-7B-nerd", + "name": "Creative-7B-nerd", + "developer": "Aashraf995", + "scores": { + "IFEval": 0.4722, + "BBH": 0.5607, + "MATH Level 5": 0.3165, + "GPQA": 0.3263, + "MUSR": 0.4515, + "MMLU-PRO": 0.4492 + } + }, + { + "model_id": "Aashraf995/Gemma-Evo-10B", + "name": "Gemma-Evo-10B", + "developer": "Aashraf995", + "scores": { + "IFEval": 0.7332, + "BBH": 0.6044, + "MATH Level 5": 0.2228, + "GPQA": 0.354, + "MUSR": 0.4595, + "MMLU-PRO": 0.4275 + } + }, + { + "model_id": "Aashraf995/Qwen-Evo-7B", + "name": "Qwen-Evo-7B", + "developer": "Aashraf995", + "scores": { + "IFEval": 0.4757, + "BBH": 0.5709, + "MATH Level 5": 0.3142, + "GPQA": 0.3255, + "MUSR": 0.4541, + "MMLU-PRO": 0.4462 + } + }, + { + "model_id": "Aashraf995/QwenStock-14B", + "name": "QwenStock-14B", + "developer": "Aashraf995", + "scores": { + "IFEval": 0.5009, + "BBH": 0.655, + "MATH Level 5": 0.3573, + "GPQA": 0.3893, + "MUSR": 0.4793, + "MMLU-PRO": 0.5382 + } + }, + { + "model_id": "AbacusResearch/Jallabi-34B", + "name": "Jallabi-34B", + "developer": "AbacusResearch", + "scores": { + "IFEval": 0.3529, + "BBH": 0.6023, + "MATH Level 5": 0.0521, + "GPQA": 0.3389, + "MUSR": 0.4822, + "MMLU-PRO": 0.4682 + } + }, + { + "model_id": "Ahdoot/StructuredThinker-v0.3-MoreStructure", + "name": "StructuredThinker-v0.3-MoreStructure", + "developer": "Ahdoot", + "scores": { + "IFEval": 0.4193, + "BBH": 0.4838, + "MATH Level 5": 0.2908, + "GPQA": 0.297, + "MUSR": 0.4158, + "MMLU-PRO": 0.361 + } + }, + { + "model_id": "Ahdoot/Test_StealthThinker", + "name": "Test_StealthThinker", + "developer": "Ahdoot", + "scores": { + "IFEval": 0.422, + "BBH": 0.4647, + "MATH Level 5": 0.179, + "GPQA": 0.2961, + "MUSR": 0.428, + "MMLU-PRO": 0.3597 + } + }, + { + "model_id": "AicoresSecurity/Cybernet-Sec-3B-R1-V0", + "name": "Cybernet-Sec-3B-R1-V0", + "developer": "AicoresSecurity", + "scores": { + "IFEval": 0.6358, + "BBH": 0.4497, + "MATH Level 5": 0.1156, + "GPQA": 0.2634, + "MUSR": 0.3314, + "MMLU-PRO": 0.301 + } + }, + { + "model_id": "AicoresSecurity/Cybernet-Sec-3B-R1-V0-Coder", + "name": "Cybernet-Sec-3B-R1-V0-Coder", + "developer": "AicoresSecurity", + "scores": { + "IFEval": 0.7098, + "BBH": 0.4478, + "MATH Level 5": 0.1488, + "GPQA": 0.2718, + "MUSR": 0.3408, + "MMLU-PRO": 0.3178 + } + }, + { + "model_id": "AicoresSecurity/Cybernet-Sec-3B-R1-V1", + "name": "Cybernet-Sec-3B-R1-V1", + "developer": "AicoresSecurity", + "scores": { + "IFEval": 0.6146, + "BBH": 0.4282, + "MATH Level 5": 0.1518, + "GPQA": 0.2609, + "MUSR": 0.3287, + "MMLU-PRO": 0.2876 + } + }, + { + "model_id": "AicoresSecurity/Cybernet-Sec-3B-R1-V1.1", + "name": "Cybernet-Sec-3B-R1-V1.1", + "developer": "AicoresSecurity", + "scores": { + "IFEval": 0.673, + "BBH": 0.4392, + "MATH Level 5": 0.176, + "GPQA": 0.271, + "MUSR": 0.3541, + "MMLU-PRO": 0.3088 + } + }, + { + "model_id": "Alepach/notHumpback-M0", + "name": "notHumpback-M0", + "developer": "Alepach", + "scores": { + "IFEval": 0.235, + "BBH": 0.2785, + "MATH Level 5": 0.0189, + "GPQA": 0.2492, + "MUSR": 0.3552, + "MMLU-PRO": 0.1119 + } + }, + { + "model_id": "Alepach/notHumpback-M1", + "name": "notHumpback-M1", + "developer": "Alepach", + "scores": { + "IFEval": 0.2207, + "BBH": 0.2882, + "MATH Level 5": 0.0159, + "GPQA": 0.2374, + "MUSR": 0.342, + "MMLU-PRO": 0.1091 + } + }, + { + "model_id": "Alepach/notHumpback-M1-v2", + "name": "notHumpback-M1-v2", + "developer": "Alepach", + "scores": { + "IFEval": 0.2277, + "BBH": 0.2776, + "MATH Level 5": 0.0219, + "GPQA": 0.2601, + "MUSR": 0.3473, + "MMLU-PRO": 0.1119 + } + }, + { + "model_id": "Alibaba-NLP/gte-Qwen2-7B-instruct", + "name": "gte-Qwen2-7B-instruct", + "developer": "Alibaba-NLP", + "scores": { + "IFEval": 0.2255, + "BBH": 0.4495, + "MATH Level 5": 0.0642, + "GPQA": 0.245, + "MUSR": 0.3559, + "MMLU-PRO": 0.3321 + } + }, + { + "model_id": "Alsebay/Qwen2.5-7B-test-novelist", + "name": "Qwen2.5-7B-test-novelist", + "developer": "Alsebay", + "scores": { + "IFEval": 0.5352, + "BBH": 0.5151, + "MATH Level 5": 0.2349, + "GPQA": 0.2911, + "MUSR": 0.4749, + "MMLU-PRO": 0.3866 + } + }, + { + "model_id": "Amaorynho/BBAI2006", + "name": "BBAI2006", + "developer": "Amaorynho", + "scores": { + "IFEval": 0.1467, + "BBH": 0.2704, + "MATH Level 5": 0.0, + "GPQA": 0.2525, + "MUSR": 0.3605, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "Amaorynho/BBAI270V4", + "name": "BBAI270V4", + "developer": "Amaorynho", + "scores": { + "IFEval": 0.199, + "BBH": 0.3071, + "MATH Level 5": 0.0083, + "GPQA": 0.2458, + "MUSR": 0.3314, + "MMLU-PRO": 0.1114 + } + }, + { + "model_id": "Amaorynho/BBAIIFEV1", + "name": "BBAIIFEV1", + "developer": "Amaorynho", + "scores": { + "IFEval": 0.8047, + "BBH": 0.5292, + "MATH Level 5": 0.1934, + "GPQA": 0.3104, + "MUSR": 0.4185, + "MMLU-PRO": 0.3857 + } + }, + { + "model_id": "Amaorynho/BBAI_375", + "name": "BBAI_375", + "developer": "Amaorynho", + "scores": { + "IFEval": 0.1467, + "BBH": 0.2704, + "MATH Level 5": 0.0, + "GPQA": 0.2525, + "MUSR": 0.3605, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "Amu/t1-1.5B", + "name": "t1-1.5B", + "developer": "Amu", + "scores": { + "IFEval": 0.3394, + "BBH": 0.4008, + "MATH Level 5": 0.0514, + "GPQA": 0.2433, + "MUSR": 0.3517, + "MMLU-PRO": 0.2566 + } + }, + { + "model_id": "Amu/t1-3B", + "name": "t1-3B", + "developer": "Amu", + "scores": { + "IFEval": 0.3328, + "BBH": 0.3999, + "MATH Level 5": 0.1375, + "GPQA": 0.2408, + "MUSR": 0.3435, + "MMLU-PRO": 0.1284 + } + }, + { + "model_id": "ArliAI/ArliAI-RPMax-12B-v1.1", + "name": "ArliAI-RPMax-12B-v1.1", + "developer": "ArliAI", + "scores": { + "IFEval": 0.5349, + "BBH": 0.4752, + "MATH Level 5": 0.1125, + "GPQA": 0.2819, + "MUSR": 0.3618, + "MMLU-PRO": 0.3384 + } + }, + { + "model_id": "ArliAI/Llama-3.1-8B-ArliAI-RPMax-v1.1", + "name": "Llama-3.1-8B-ArliAI-RPMax-v1.1", + "developer": "ArliAI", + "scores": { + "IFEval": 0.6359, + "BBH": 0.5016, + "MATH Level 5": 0.1314, + "GPQA": 0.2836, + "MUSR": 0.3577, + "MMLU-PRO": 0.3551 + } + }, + { + "model_id": "Arthur-LAGACHERIE/Precis-1B-Instruct", + "name": "Precis-1B-Instruct", + "developer": "Arthur-LAGACHERIE", + "scores": { + "IFEval": 0.3671, + "BBH": 0.3224, + "MATH Level 5": 0.0038, + "GPQA": 0.2659, + "MUSR": 0.3436, + "MMLU-PRO": 0.1426 + } + }, + { + "model_id": "Artples/L-MChat-7b", + "name": "L-MChat-7b", + "developer": "Artples", + "scores": { + "IFEval": 0.5297, + "BBH": 0.46, + "MATH Level 5": 0.0921, + "GPQA": 0.3054, + "MUSR": 0.4029, + "MMLU-PRO": 0.3299 + } + }, + { + "model_id": "Artples/L-MChat-Small", + "name": "L-MChat-Small", + "developer": "Artples", + "scores": { + "IFEval": 0.3287, + "BBH": 0.4823, + "MATH Level 5": 0.0378, + "GPQA": 0.2676, + "MUSR": 0.3696, + "MMLU-PRO": 0.2464 + } + }, + { + "model_id": "Aryanne/QwentileSwap", + "name": "QwentileSwap", + "developer": "Aryanne", + "scores": { + "IFEval": 0.7378, + "BBH": 0.7008, + "MATH Level 5": 0.4222, + "GPQA": 0.3674, + "MUSR": 0.464, + "MMLU-PRO": 0.5946 + } + }, + { + "model_id": "Aryanne/SHBA", + "name": "SHBA", + "developer": "Aryanne", + "scores": { + "IFEval": 0.7817, + "BBH": 0.5233, + "MATH Level 5": 0.1798, + "GPQA": 0.3054, + "MUSR": 0.4161, + "MMLU-PRO": 0.3892 + } + }, + { + "model_id": "Aryanne/SuperHeart", + "name": "SuperHeart", + "developer": "Aryanne", + "scores": { + "IFEval": 0.5192, + "BBH": 0.5215, + "MATH Level 5": 0.1563, + "GPQA": 0.3012, + "MUSR": 0.4436, + "MMLU-PRO": 0.3912 + } + }, + { + "model_id": "AtAndDev/Qwen2.5-1.5B-continuous-learnt", + "name": "Qwen2.5-1.5B-continuous-learnt", + "developer": "AtAndDev", + "scores": { + "IFEval": 0.4605, + "BBH": 0.4258, + "MATH Level 5": 0.0748, + "GPQA": 0.2659, + "MUSR": 0.3636, + "MMLU-PRO": 0.2812 + } + }, + { + "model_id": "Ateron/Glowing-Forest-12B", + "name": "Glowing-Forest-12B", + "developer": "Ateron", + "scores": { + "IFEval": 0.3592, + "BBH": 0.5492, + "MATH Level 5": 0.0778, + "GPQA": 0.3331, + "MUSR": 0.4449, + "MMLU-PRO": 0.3718 + } + }, + { + "model_id": "Ateron/Lotus-Magpic", + "name": "Lotus-Magpic", + "developer": "Ateron", + "scores": { + "IFEval": 0.6286, + "BBH": 0.5254, + "MATH Level 5": 0.0997, + "GPQA": 0.3029, + "MUSR": 0.4332, + "MMLU-PRO": 0.3491 + } + }, + { + "model_id": "Ateron/Way_of_MagPicaro", + "name": "Way_of_MagPicaro", + "developer": "Ateron", + "scores": { + "IFEval": 0.2637, + "BBH": 0.5427, + "MATH Level 5": 0.0589, + "GPQA": 0.3339, + "MUSR": 0.4649, + "MMLU-PRO": 0.3536 + } + }, + { + "model_id": "AuraIndustries/Aura-4B", + "name": "Aura-4B", + "developer": "AuraIndustries", + "scores": { + "IFEval": 0.3816, + "BBH": 0.449, + "MATH Level 5": 0.0423, + "GPQA": 0.2878, + "MUSR": 0.3938, + "MMLU-PRO": 0.2706 + } + }, + { + "model_id": "AuraIndustries/Aura-8B", + "name": "Aura-8B", + "developer": "AuraIndustries", + "scores": { + "IFEval": 0.7205, + "BBH": 0.5131, + "MATH Level 5": 0.1518, + "GPQA": 0.2861, + "MUSR": 0.4004, + "MMLU-PRO": 0.3874 + } + }, + { + "model_id": "AuraIndustries/Aura-MoE-2x4B", + "name": "Aura-MoE-2x4B", + "developer": "AuraIndustries", + "scores": { + "IFEval": 0.4601, + "BBH": 0.4339, + "MATH Level 5": 0.031, + "GPQA": 0.2718, + "MUSR": 0.4085, + "MMLU-PRO": 0.265 + } + }, + { + "model_id": "AuraIndustries/Aura-MoE-2x4B-v2", + "name": "Aura-MoE-2x4B-v2", + "developer": "AuraIndustries", + "scores": { + "IFEval": 0.4778, + "BBH": 0.4315, + "MATH Level 5": 0.0317, + "GPQA": 0.2878, + "MUSR": 0.4101, + "MMLU-PRO": 0.261 + } + }, + { + "model_id": "Aurel9/testmerge-7b", + "name": "testmerge-7b", + "developer": "Aurel9", + "scores": { + "IFEval": 0.398, + "BBH": 0.519, + "MATH Level 5": 0.0657, + "GPQA": 0.3003, + "MUSR": 0.4659, + "MMLU-PRO": 0.3053 + } + }, + { + "model_id": "Ayush-Singh/Llama1B-sft-2", + "name": "Llama1B-sft-2", + "developer": "Ayush-Singh", + "scores": { + "IFEval": 0.1374, + "BBH": 0.2834, + "MATH Level 5": 0.0, + "GPQA": 0.2458, + "MUSR": 0.3552, + "MMLU-PRO": 0.1117 + } + }, + { + "model_id": "Azure99/Blossom-V6-14B", + "name": "Blossom-V6-14B", + "developer": "Azure99", + "scores": { + "IFEval": 0.6395, + "BBH": 0.5069, + "MATH Level 5": 0.5257, + "GPQA": 0.2626, + "MUSR": 0.4035, + "MMLU-PRO": 0.4544 + } + }, + { + "model_id": "Azure99/Blossom-V6-7B", + "name": "Blossom-V6-7B", + "developer": "Azure99", + "scores": { + "IFEval": 0.5538, + "BBH": 0.4974, + "MATH Level 5": 0.4585, + "GPQA": 0.3045, + "MUSR": 0.4301, + "MMLU-PRO": 0.4144 + } + }, + { + "model_id": "Azure99/blossom-v5-32b", + "name": "blossom-v5-32b", + "developer": "Azure99", + "scores": { + "IFEval": 0.5235, + "BBH": 0.5955, + "MATH Level 5": 0.1866, + "GPQA": 0.3112, + "MUSR": 0.402, + "MMLU-PRO": 0.4235 + } + }, + { + "model_id": "Azure99/blossom-v5-llama3-8b", + "name": "blossom-v5-llama3-8b", + "developer": "Azure99", + "scores": { + "IFEval": 0.4343, + "BBH": 0.4185, + "MATH Level 5": 0.0514, + "GPQA": 0.2651, + "MUSR": 0.367, + "MMLU-PRO": 0.2206 + } + }, + { + "model_id": "Azure99/blossom-v5.1-34b", + "name": "blossom-v5.1-34b", + "developer": "Azure99", + "scores": { + "IFEval": 0.5697, + "BBH": 0.6109, + "MATH Level 5": 0.2591, + "GPQA": 0.3096, + "MUSR": 0.3928, + "MMLU-PRO": 0.4558 + } + }, + { + "model_id": "Azure99/blossom-v5.1-9b", + "name": "blossom-v5.1-9b", + "developer": "Azure99", + "scores": { + "IFEval": 0.5086, + "BBH": 0.5343, + "MATH Level 5": 0.2122, + "GPQA": 0.3356, + "MUSR": 0.3994, + "MMLU-PRO": 0.3979 + } + }, + { + "model_id": "BAAI/Gemma2-9B-IT-Simpo-Infinity-Preference", + "name": "Gemma2-9B-IT-Simpo-Infinity-Preference", + "developer": "BAAI", + "scores": { + "IFEval": 0.3176, + "BBH": 0.5979, + "MATH Level 5": 0.0974, + "GPQA": 0.3398, + "MUSR": 0.3966, + "MMLU-PRO": 0.3869 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-3M-0613-Llama3-70B", + "name": "Infinity-Instruct-3M-0613-Llama3-70B", + "developer": "BAAI", + "scores": { + "IFEval": 0.6821, + "BBH": 0.6642, + "MATH Level 5": 0.2153, + "GPQA": 0.3582, + "MUSR": 0.4523, + "MMLU-PRO": 0.473 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-3M-0613-Mistral-7B", + "name": "Infinity-Instruct-3M-0613-Mistral-7B", + "developer": "BAAI", + "scores": { + "IFEval": 0.532, + "BBH": 0.4958, + "MATH Level 5": 0.0816, + "GPQA": 0.2961, + "MUSR": 0.4351, + "MMLU-PRO": 0.3161 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-3M-0625-Llama3-70B", + "name": "Infinity-Instruct-3M-0625-Llama3-70B", + "developer": "BAAI", + "scores": { + "IFEval": 0.7442, + "BBH": 0.667, + "MATH Level 5": 0.2251, + "GPQA": 0.3574, + "MUSR": 0.4617, + "MMLU-PRO": 0.4586 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-3M-0625-Llama3-8B", + "name": "Infinity-Instruct-3M-0625-Llama3-8B", + "developer": "BAAI", + "scores": { + "IFEval": 0.605, + "BBH": 0.4955, + "MATH Level 5": 0.0884, + "GPQA": 0.2752, + "MUSR": 0.3712, + "MMLU-PRO": 0.3252 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-3M-0625-Mistral-7B", + "name": "Infinity-Instruct-3M-0625-Mistral-7B", + "developer": "BAAI", + "scores": { + "IFEval": 0.5867, + "BBH": 0.494, + "MATH Level 5": 0.0763, + "GPQA": 0.2869, + "MUSR": 0.4272, + "MMLU-PRO": 0.323 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-3M-0625-Qwen2-7B", + "name": "Infinity-Instruct-3M-0625-Qwen2-7B", + "developer": "BAAI", + "scores": { + "IFEval": 0.5554, + "BBH": 0.5346, + "MATH Level 5": 0.1926, + "GPQA": 0.3129, + "MUSR": 0.3888, + "MMLU-PRO": 0.396 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-3M-0625-Yi-1.5-9B", + "name": "Infinity-Instruct-3M-0625-Yi-1.5-9B", + "developer": "BAAI", + "scores": { + "IFEval": 0.5186, + "BBH": 0.5509, + "MATH Level 5": 0.1639, + "GPQA": 0.354, + "MUSR": 0.4575, + "MMLU-PRO": 0.4118 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-7M-0729-Llama3_1-8B", + "name": "Infinity-Instruct-7M-0729-Llama3_1-8B", + "developer": "BAAI", + "scores": { + "IFEval": 0.6132, + "BBH": 0.5077, + "MATH Level 5": 0.1276, + "GPQA": 0.2928, + "MUSR": 0.3578, + "MMLU-PRO": 0.3224 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-7M-0729-mistral-7B", + "name": "Infinity-Instruct-7M-0729-mistral-7B", + "developer": "BAAI", + "scores": { + "IFEval": 0.6162, + "BBH": 0.4964, + "MATH Level 5": 0.0831, + "GPQA": 0.2903, + "MUSR": 0.4062, + "MMLU-PRO": 0.3274 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-7M-Gen-Llama3_1-70B", + "name": "Infinity-Instruct-7M-Gen-Llama3_1-70B", + "developer": "BAAI", + "scores": { + "IFEval": 0.7335, + "BBH": 0.6695, + "MATH Level 5": 0.2523, + "GPQA": 0.3758, + "MUSR": 0.4539, + "MMLU-PRO": 0.4607 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-7M-Gen-Llama3_1-8B", + "name": "Infinity-Instruct-7M-Gen-Llama3_1-8B", + "developer": "BAAI", + "scores": { + "IFEval": 0.6132, + "BBH": 0.5077, + "MATH Level 5": 0.1276, + "GPQA": 0.2928, + "MUSR": 0.3578, + "MMLU-PRO": 0.3224 + } + }, + { + "model_id": "BAAI/Infinity-Instruct-7M-Gen-mistral-7B", + "name": "Infinity-Instruct-7M-Gen-mistral-7B", + "developer": "BAAI", + "scores": { + "IFEval": 0.6147, + "BBH": 0.4964, + "MATH Level 5": 0.0831, + "GPQA": 0.2903, + "MUSR": 0.4062, + "MMLU-PRO": 0.3274 + } + }, + { + "model_id": "BAAI/OPI-Llama-3.1-8B-Instruct", + "name": "OPI-Llama-3.1-8B-Instruct", + "developer": "BAAI", + "scores": { + "IFEval": 0.2075, + "BBH": 0.3551, + "MATH Level 5": 0.0136, + "GPQA": 0.2743, + "MUSR": 0.3233, + "MMLU-PRO": 0.2124 + } + }, + { + "model_id": "BEE-spoke-data/Meta-Llama-3-8Bee", + "name": "Meta-Llama-3-8Bee", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.1951, + "BBH": 0.4626, + "MATH Level 5": 0.0483, + "GPQA": 0.3138, + "MUSR": 0.3654, + "MMLU-PRO": 0.322 + } + }, + { + "model_id": "BEE-spoke-data/smol_llama-101M-GQA", + "name": "smol_llama-101M-GQA", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.1384, + "BBH": 0.3018, + "MATH Level 5": 0.006, + "GPQA": 0.2576, + "MUSR": 0.3713, + "MMLU-PRO": 0.1107 + } + }, + { + "model_id": "BEE-spoke-data/smol_llama-220M-GQA", + "name": "smol_llama-220M-GQA", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.2386, + "BBH": 0.3032, + "MATH Level 5": 0.0106, + "GPQA": 0.2559, + "MUSR": 0.4059, + "MMLU-PRO": 0.1149 + } + }, + { + "model_id": "BEE-spoke-data/smol_llama-220M-GQA-fineweb_edu", + "name": "smol_llama-220M-GQA-fineweb_edu", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.1988, + "BBH": 0.2929, + "MATH Level 5": 0.0068, + "GPQA": 0.2592, + "MUSR": 0.4368, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "BEE-spoke-data/smol_llama-220M-openhermes", + "name": "smol_llama-220M-openhermes", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.1555, + "BBH": 0.3028, + "MATH Level 5": 0.0106, + "GPQA": 0.2676, + "MUSR": 0.3847, + "MMLU-PRO": 0.112 + } + }, + { + "model_id": "BEE-spoke-data/tFINE-900m-e16-d32-flan", + "name": "tFINE-900m-e16-d32-flan", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.1506, + "BBH": 0.3028, + "MATH Level 5": 0.0098, + "GPQA": 0.2332, + "MUSR": 0.3724, + "MMLU-PRO": 0.1307 + } + }, + { + "model_id": "BEE-spoke-data/tFINE-900m-e16-d32-flan-infinity-instruct-7m-T2T_en-1024", + "name": "tFINE-900m-e16-d32-flan-infinity-instruct-7m-T2T_en-1024", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.1321, + "BBH": 0.3138, + "MATH Level 5": 0.0106, + "GPQA": 0.2542, + "MUSR": 0.4393, + "MMLU-PRO": 0.1237 + } + }, + { + "model_id": "BEE-spoke-data/tFINE-900m-e16-d32-instruct_2e", + "name": "tFINE-900m-e16-d32-instruct_2e", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.1403, + "BBH": 0.3135, + "MATH Level 5": 0.0136, + "GPQA": 0.2592, + "MUSR": 0.4207, + "MMLU-PRO": 0.1237 + } + }, + { + "model_id": "BEE-spoke-data/tFINE-900m-instruct-orpo", + "name": "tFINE-900m-instruct-orpo", + "developer": "BEE-spoke-data", + "scores": { + "IFEval": 0.133, + "BBH": 0.3022, + "MATH Level 5": 0.0159, + "GPQA": 0.2592, + "MUSR": 0.3409, + "MMLU-PRO": 0.1152 + } + }, + { + "model_id": "BSC-LT/salamandra-7b", + "name": "salamandra-7b", + "developer": "BSC-LT", + "scores": { + "IFEval": 0.1367, + "BBH": 0.3517, + "MATH Level 5": 0.0038, + "GPQA": 0.2701, + "MUSR": 0.3501, + "MMLU-PRO": 0.1493 + } + }, + { + "model_id": "BSC-LT/salamandra-7b-instruct", + "name": "salamandra-7b-instruct", + "developer": "BSC-LT", + "scores": { + "IFEval": 0.2451, + "BBH": 0.3851, + "MATH Level 5": 0.0083, + "GPQA": 0.2643, + "MUSR": 0.4134, + "MMLU-PRO": 0.1805 + } + }, + { + "model_id": "Ba2han/Llama-Phi-3_DoRA", + "name": "Llama-Phi-3_DoRA", + "developer": "Ba2han", + "scores": { + "IFEval": 0.5131, + "BBH": 0.5515, + "MATH Level 5": 0.1216, + "GPQA": 0.3263, + "MUSR": 0.4069, + "MMLU-PRO": 0.3915 + } + }, + { + "model_id": "Baptiste-HUVELLE-10/LeTriomphant2.2_ECE_iLAB", + "name": "LeTriomphant2.2_ECE_iLAB", + "developer": "Baptiste-HUVELLE-10", + "scores": { + "IFEval": 0.5076, + "BBH": 0.7256, + "MATH Level 5": 0.4449, + "GPQA": 0.3993, + "MUSR": 0.4626, + "MMLU-PRO": 0.5851 + } + }, + { + "model_id": "BenevolenceMessiah/Qwen2.5-72B-2x-Instruct-TIES-v1.0", + "name": "Qwen2.5-72B-2x-Instruct-TIES-v1.0", + "developer": "BenevolenceMessiah", + "scores": { + "IFEval": 0.5473, + "BBH": 0.7273, + "MATH Level 5": 0.5785, + "GPQA": 0.3674, + "MUSR": 0.4207, + "MMLU-PRO": 0.5628 + } + }, + { + "model_id": "BenevolenceMessiah/Yi-Coder-9B-Chat-Instruct-TIES-MoE-v1.0", + "name": "Yi-Coder-9B-Chat-Instruct-TIES-MoE-v1.0", + "developer": "BenevolenceMessiah", + "scores": { + "IFEval": 0.3012, + "BBH": 0.4909, + "MATH Level 5": 0.0415, + "GPQA": 0.2626, + "MUSR": 0.408, + "MMLU-PRO": 0.268 + } + }, + { + "model_id": "BlackBeenie/Bloslain-8B-v0.2", + "name": "Bloslain-8B-v0.2", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.5023, + "BBH": 0.5111, + "MATH Level 5": 0.145, + "GPQA": 0.3062, + "MUSR": 0.4076, + "MMLU-PRO": 0.3654 + } + }, + { + "model_id": "BlackBeenie/Llama-3.1-8B-OpenO1-SFT-v0.1", + "name": "Llama-3.1-8B-OpenO1-SFT-v0.1", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.5124, + "BBH": 0.4787, + "MATH Level 5": 0.1526, + "GPQA": 0.2685, + "MUSR": 0.3618, + "MMLU-PRO": 0.3492 + } + }, + { + "model_id": "BlackBeenie/Llama-3.1-8B-pythonic-passthrough-merge", + "name": "Llama-3.1-8B-pythonic-passthrough-merge", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.2316, + "BBH": 0.3454, + "MATH Level 5": 0.0113, + "GPQA": 0.2685, + "MUSR": 0.3778, + "MMLU-PRO": 0.1332 + } + }, + { + "model_id": "BlackBeenie/Neos-Gemma-2-9b", + "name": "Neos-Gemma-2-9b", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.5876, + "BBH": 0.5503, + "MATH Level 5": 0.0982, + "GPQA": 0.323, + "MUSR": 0.3618, + "MMLU-PRO": 0.3981 + } + }, + { + "model_id": "BlackBeenie/Neos-Llama-3.1-8B", + "name": "Neos-Llama-3.1-8B", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.4944, + "BBH": 0.4425, + "MATH Level 5": 0.1322, + "GPQA": 0.2685, + "MUSR": 0.375, + "MMLU-PRO": 0.3262 + } + }, + { + "model_id": "BlackBeenie/Neos-Llama-3.1-base", + "name": "Neos-Llama-3.1-base", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.1751, + "BBH": 0.293, + "MATH Level 5": 0.0, + "GPQA": 0.2374, + "MUSR": 0.3499, + "MMLU-PRO": 0.1112 + } + }, + { + "model_id": "BlackBeenie/Neos-Phi-3-14B-v0.1", + "name": "Neos-Phi-3-14B-v0.1", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.4022, + "BBH": 0.6212, + "MATH Level 5": 0.1782, + "GPQA": 0.3054, + "MUSR": 0.4125, + "MMLU-PRO": 0.4564 + } + }, + { + "model_id": "BlackBeenie/llama-3-luminous-merged", + "name": "llama-3-luminous-merged", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.4323, + "BBH": 0.5154, + "MATH Level 5": 0.0869, + "GPQA": 0.2928, + "MUSR": 0.4149, + "MMLU-PRO": 0.3773 + } + }, + { + "model_id": "BlackBeenie/llama-3.1-8B-Galore-openassistant-guanaco", + "name": "llama-3.1-8B-Galore-openassistant-guanaco", + "developer": "BlackBeenie", + "scores": { + "IFEval": 0.2635, + "BBH": 0.5213, + "MATH Level 5": 0.0665, + "GPQA": 0.3003, + "MUSR": 0.4406, + "MMLU-PRO": 0.3206 + } + }, + { + "model_id": "Bllossom/llama-3.2-Korean-Bllossom-AICA-5B", + "name": "llama-3.2-Korean-Bllossom-AICA-5B", + "developer": "Bllossom", + "scores": { + "IFEval": 0.5172, + "BBH": 0.4293, + "MATH Level 5": 0.1239, + "GPQA": 0.2987, + "MUSR": 0.3834, + "MMLU-PRO": 0.271 + } + }, + { + "model_id": "BoltMonkey/DreadMix", + "name": "DreadMix", + "developer": "BoltMonkey", + "scores": { + "IFEval": 0.7095, + "BBH": 0.5435, + "MATH Level 5": 0.1556, + "GPQA": 0.2995, + "MUSR": 0.4212, + "MMLU-PRO": 0.379 + } + }, + { + "model_id": "BoltMonkey/NeuralDaredevil-SuperNova-Lite-7B-DARETIES-abliterated", + "name": "NeuralDaredevil-SuperNova-Lite-7B-DARETIES-abliterated", + "developer": "BoltMonkey", + "scores": { + "IFEval": 0.459, + "BBH": 0.5185, + "MATH Level 5": 0.0937, + "GPQA": 0.2743, + "MUSR": 0.4083, + "MMLU-PRO": 0.3631 + } + }, + { + "model_id": "BoltMonkey/SuperNeuralDreadDevil-8b", + "name": "SuperNeuralDreadDevil-8b", + "developer": "BoltMonkey", + "scores": { + "IFEval": 0.771, + "BBH": 0.5286, + "MATH Level 5": 0.0929, + "GPQA": 0.2919, + "MUSR": 0.3977, + "MMLU-PRO": 0.3679 + } + }, + { + "model_id": "BrainWave-ML/llama3.2-3B-maths-orpo", + "name": "llama3.2-3B-maths-orpo", + "developer": "BrainWave-ML", + "scores": { + "IFEval": 0.2049, + "BBH": 0.2912, + "MATH Level 5": 0.0, + "GPQA": 0.2592, + "MUSR": 0.3575, + "MMLU-PRO": 0.1168 + } + }, + { + "model_id": "BramVanroy/GEITje-7B-ultra", + "name": "GEITje-7B-ultra", + "developer": "BramVanroy", + "scores": { + "IFEval": 0.3723, + "BBH": 0.3776, + "MATH Level 5": 0.0159, + "GPQA": 0.2626, + "MUSR": 0.329, + "MMLU-PRO": 0.2011 + } + }, + { + "model_id": "BramVanroy/fietje-2", + "name": "fietje-2", + "developer": "BramVanroy", + "scores": { + "IFEval": 0.2098, + "BBH": 0.4036, + "MATH Level 5": 0.0159, + "GPQA": 0.2542, + "MUSR": 0.3696, + "MMLU-PRO": 0.1986 + } + }, + { + "model_id": "BramVanroy/fietje-2-chat", + "name": "fietje-2-chat", + "developer": "BramVanroy", + "scores": { + "IFEval": 0.2917, + "BBH": 0.415, + "MATH Level 5": 0.0189, + "GPQA": 0.2399, + "MUSR": 0.3528, + "MMLU-PRO": 0.2055 + } + }, + { + "model_id": "BramVanroy/fietje-2-instruct", + "name": "fietje-2-instruct", + "developer": "BramVanroy", + "scores": { + "IFEval": 0.279, + "BBH": 0.4136, + "MATH Level 5": 0.0227, + "GPQA": 0.2332, + "MUSR": 0.3369, + "MMLU-PRO": 0.2104 + } + }, + { + "model_id": "CYFRAGOVPL/Llama-PLLuM-8B-base", + "name": "Llama-PLLuM-8B-base", + "developer": "CYFRAGOVPL", + "scores": { + "IFEval": 0.2899, + "BBH": 0.432, + "MATH Level 5": 0.0363, + "GPQA": 0.2852, + "MUSR": 0.397, + "MMLU-PRO": 0.2757 + } + }, + { + "model_id": "CYFRAGOVPL/Llama-PLLuM-8B-chat", + "name": "Llama-PLLuM-8B-chat", + "developer": "CYFRAGOVPL", + "scores": { + "IFEval": 0.3515, + "BBH": 0.4077, + "MATH Level 5": 0.034, + "GPQA": 0.2643, + "MUSR": 0.4199, + "MMLU-PRO": 0.2719 + } + }, + { + "model_id": "CYFRAGOVPL/PLLuM-12B-base", + "name": "PLLuM-12B-base", + "developer": "CYFRAGOVPL", + "scores": { + "IFEval": 0.2821, + "BBH": 0.4391, + "MATH Level 5": 0.0287, + "GPQA": 0.2903, + "MUSR": 0.4142, + "MMLU-PRO": 0.274 + } + }, + { + "model_id": "CYFRAGOVPL/PLLuM-12B-chat", + "name": "PLLuM-12B-chat", + "developer": "CYFRAGOVPL", + "scores": { + "IFEval": 0.3214, + "BBH": 0.4446, + "MATH Level 5": 0.0181, + "GPQA": 0.2601, + "MUSR": 0.4115, + "MMLU-PRO": 0.2872 + } + }, + { + "model_id": "CYFRAGOVPL/PLLuM-12B-nc-base", + "name": "PLLuM-12B-nc-base", + "developer": "CYFRAGOVPL", + "scores": { + "IFEval": 0.2405, + "BBH": 0.4277, + "MATH Level 5": 0.0219, + "GPQA": 0.2701, + "MUSR": 0.3645, + "MMLU-PRO": 0.2559 + } + }, + { + "model_id": "CYFRAGOVPL/PLLuM-12B-nc-chat", + "name": "PLLuM-12B-nc-chat", + "developer": "CYFRAGOVPL", + "scores": { + "IFEval": 0.2834, + "BBH": 0.4576, + "MATH Level 5": 0.0121, + "GPQA": 0.2827, + "MUSR": 0.4354, + "MMLU-PRO": 0.2597 + } + }, + { + "model_id": "CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct", + "name": "Llama-3.2-Rabbit-Ko-3B-Instruct", + "developer": "CarrotAI", + "scores": { + "IFEval": 0.7199, + "BBH": 0.4427, + "MATH Level 5": 0.2054, + "GPQA": 0.271, + "MUSR": 0.3649, + "MMLU-PRO": 0.2822 + } + }, + { + "model_id": "CarrotAI/Llama-3.2-Rabbit-Ko-3B-Instruct-2412", + "name": "Llama-3.2-Rabbit-Ko-3B-Instruct-2412", + "developer": "CarrotAI", + "scores": { + "IFEval": 0.4782, + "BBH": 0.4358, + "MATH Level 5": 0.176, + "GPQA": 0.2928, + "MUSR": 0.3872, + "MMLU-PRO": 0.3134 + } + }, + { + "model_id": "Casual-Autopsy/L3-Umbral-Mind-RP-v2.0-8B", + "name": "L3-Umbral-Mind-RP-v2.0-8B", + "developer": "Casual-Autopsy", + "scores": { + "IFEval": 0.7123, + "BBH": 0.5262, + "MATH Level 5": 0.1095, + "GPQA": 0.2869, + "MUSR": 0.3687, + "MMLU-PRO": 0.3723 + } + }, + { + "model_id": "CausalLM/14B", + "name": "14B", + "developer": "CausalLM", + "scores": { + "IFEval": 0.2788, + "BBH": 0.47, + "MATH Level 5": 0.0755, + "GPQA": 0.3029, + "MUSR": 0.4155, + "MMLU-PRO": 0.3221 + } + }, + { + "model_id": "CausalLM/34b-beta", + "name": "34b-beta", + "developer": "CausalLM", + "scores": { + "IFEval": 0.3043, + "BBH": 0.5591, + "MATH Level 5": 0.0483, + "GPQA": 0.3465, + "MUSR": 0.3749, + "MMLU-PRO": 0.5325 + } + }, + { + "model_id": "CausalLM/preview-1-hf", + "name": "preview-1-hf", + "developer": "CausalLM", + "scores": { + "IFEval": 0.5559, + "BBH": 0.3615, + "MATH Level 5": 0.0302, + "GPQA": 0.2617, + "MUSR": 0.3422, + "MMLU-PRO": 0.3597 + } + }, + { + "model_id": "Changgil/K2S3-14b-v0.2", + "name": "K2S3-14b-v0.2", + "developer": "Changgil", + "scores": { + "IFEval": 0.3243, + "BBH": 0.4613, + "MATH Level 5": 0.0574, + "GPQA": 0.281, + "MUSR": 0.3923, + "MMLU-PRO": 0.2644 + } + }, + { + "model_id": "Changgil/K2S3-v0.1", + "name": "K2S3-v0.1", + "developer": "Changgil", + "scores": { + "IFEval": 0.3277, + "BBH": 0.4655, + "MATH Level 5": 0.0461, + "GPQA": 0.2643, + "MUSR": 0.4014, + "MMLU-PRO": 0.2562 + } + }, + { + "model_id": "ClaudioItaly/Albacus", + "name": "Albacus", + "developer": "ClaudioItaly", + "scores": { + "IFEval": 0.4667, + "BBH": 0.5113, + "MATH Level 5": 0.071, + "GPQA": 0.2718, + "MUSR": 0.4135, + "MMLU-PRO": 0.3165 + } + }, + { + "model_id": "ClaudioItaly/Book-Gut12B", + "name": "Book-Gut12B", + "developer": "ClaudioItaly", + "scores": { + "IFEval": 0.3998, + "BBH": 0.5417, + "MATH Level 5": 0.102, + "GPQA": 0.307, + "MUSR": 0.4635, + "MMLU-PRO": 0.367 + } + }, + { + "model_id": "ClaudioItaly/Evolutionstory-7B-v2.2", + "name": "Evolutionstory-7B-v2.2", + "developer": "ClaudioItaly", + "scores": { + "IFEval": 0.4814, + "BBH": 0.5108, + "MATH Level 5": 0.071, + "GPQA": 0.2752, + "MUSR": 0.4135, + "MMLU-PRO": 0.3159 + } + }, + { + "model_id": "ClaudioItaly/intelligence-cod-rag-7b-v3", + "name": "intelligence-cod-rag-7b-v3", + "developer": "ClaudioItaly", + "scores": { + "IFEval": 0.6898, + "BBH": 0.5366, + "MATH Level 5": 0.3807, + "GPQA": 0.2727, + "MUSR": 0.4153, + "MMLU-PRO": 0.4195 + } + }, + { + "model_id": "CohereForAI/aya-23-35B", + "name": "aya-23-35B", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.6462, + "BBH": 0.54, + "MATH Level 5": 0.0347, + "GPQA": 0.2945, + "MUSR": 0.431, + "MMLU-PRO": 0.3356 + } + }, + { + "model_id": "CohereForAI/aya-23-8B", + "name": "aya-23-8B", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.4699, + "BBH": 0.4296, + "MATH Level 5": 0.0166, + "GPQA": 0.2844, + "MUSR": 0.3941, + "MMLU-PRO": 0.2278 + } + }, + { + "model_id": "CohereForAI/aya-expanse-32b", + "name": "aya-expanse-32b", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.7302, + "BBH": 0.5649, + "MATH Level 5": 0.1533, + "GPQA": 0.3255, + "MUSR": 0.3873, + "MMLU-PRO": 0.413 + } + }, + { + "model_id": "CohereForAI/aya-expanse-8b", + "name": "aya-expanse-8b", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.6359, + "BBH": 0.4977, + "MATH Level 5": 0.0861, + "GPQA": 0.3029, + "MUSR": 0.3729, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "CohereForAI/c4ai-command-r-plus", + "name": "c4ai-command-r-plus", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.7664, + "BBH": 0.5815, + "MATH Level 5": 0.0801, + "GPQA": 0.3054, + "MUSR": 0.4807, + "MMLU-PRO": 0.3992 + } + }, + { + "model_id": "CohereForAI/c4ai-command-r-plus-08-2024", + "name": "c4ai-command-r-plus-08-2024", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.754, + "BBH": 0.5996, + "MATH Level 5": 0.1239, + "GPQA": 0.3507, + "MUSR": 0.4829, + "MMLU-PRO": 0.4421 + } + }, + { + "model_id": "CohereForAI/c4ai-command-r-v01", + "name": "c4ai-command-r-v01", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.6748, + "BBH": 0.5406, + "MATH Level 5": 0.0347, + "GPQA": 0.307, + "MUSR": 0.4517, + "MMLU-PRO": 0.3369 + } + }, + { + "model_id": "CohereForAI/c4ai-command-r7b-12-2024", + "name": "c4ai-command-r7b-12-2024", + "developer": "CohereForAI", + "scores": { + "IFEval": 0.7713, + "BBH": 0.5503, + "MATH Level 5": 0.2991, + "GPQA": 0.3087, + "MUSR": 0.4125, + "MMLU-PRO": 0.3572 + } + }, + { + "model_id": "Columbia-NLP/LION-Gemma-2b-dpo-v1.0", + "name": "LION-Gemma-2b-dpo-v1.0", + "developer": "Columbia-NLP", + "scores": { + "IFEval": 0.3278, + "BBH": 0.392, + "MATH Level 5": 0.0431, + "GPQA": 0.2492, + "MUSR": 0.412, + "MMLU-PRO": 0.1666 + } + }, + { + "model_id": "Columbia-NLP/LION-Gemma-2b-odpo-v1.0", + "name": "LION-Gemma-2b-odpo-v1.0", + "developer": "Columbia-NLP", + "scores": { + "IFEval": 0.3066, + "BBH": 0.3896, + "MATH Level 5": 0.0695, + "GPQA": 0.2424, + "MUSR": 0.4279, + "MMLU-PRO": 0.1692 + } + }, + { + "model_id": "Columbia-NLP/LION-Gemma-2b-sft-v1.0", + "name": "LION-Gemma-2b-sft-v1.0", + "developer": "Columbia-NLP", + "scores": { + "IFEval": 0.3692, + "BBH": 0.3879, + "MATH Level 5": 0.068, + "GPQA": 0.2559, + "MUSR": 0.4027, + "MMLU-PRO": 0.1782 + } + }, + { + "model_id": "Columbia-NLP/LION-LLaMA-3-8b-dpo-v1.0", + "name": "LION-LLaMA-3-8b-dpo-v1.0", + "developer": "Columbia-NLP", + "scores": { + "IFEval": 0.4957, + "BBH": 0.5028, + "MATH Level 5": 0.1171, + "GPQA": 0.281, + "MUSR": 0.4097, + "MMLU-PRO": 0.3219 + } + }, + { + "model_id": "Columbia-NLP/LION-LLaMA-3-8b-odpo-v1.0", + "name": "LION-LLaMA-3-8b-odpo-v1.0", + "developer": "Columbia-NLP", + "scores": { + "IFEval": 0.3968, + "BBH": 0.5024, + "MATH Level 5": 0.1065, + "GPQA": 0.2852, + "MUSR": 0.4057, + "MMLU-PRO": 0.3152 + } + }, + { + "model_id": "Columbia-NLP/LION-LLaMA-3-8b-sft-v1.0", + "name": "LION-LLaMA-3-8b-sft-v1.0", + "developer": "Columbia-NLP", + "scores": { + "IFEval": 0.3817, + "BBH": 0.5088, + "MATH Level 5": 0.114, + "GPQA": 0.2777, + "MUSR": 0.4503, + "MMLU-PRO": 0.3237 + } + }, + { + "model_id": "CombinHorizon/Josiefied-abliteratedV4-Qwen2.5-14B-Inst-BaseMerge-TIES", + "name": "Josiefied-abliteratedV4-Qwen2.5-14B-Inst-BaseMerge-TIES", + "developer": "CombinHorizon", + "scores": { + "IFEval": 0.824, + "BBH": 0.637, + "MATH Level 5": 0.5317, + "GPQA": 0.3247, + "MUSR": 0.426, + "MMLU-PRO": 0.4979 + } + }, + { + "model_id": "CombinHorizon/Rombos-Qwen2.5-7B-Inst-BaseMerge-TIES", + "name": "Rombos-Qwen2.5-7B-Inst-BaseMerge-TIES", + "developer": "CombinHorizon", + "scores": { + "IFEval": 0.7564, + "BBH": 0.5402, + "MATH Level 5": 0.4932, + "GPQA": 0.2978, + "MUSR": 0.4033, + "MMLU-PRO": 0.4342 + } + }, + { + "model_id": "CombinHorizon/YiSM-blossom5.1-34B-SLERP", + "name": "YiSM-blossom5.1-34B-SLERP", + "developer": "CombinHorizon", + "scores": { + "IFEval": 0.5033, + "BBH": 0.6208, + "MATH Level 5": 0.2153, + "GPQA": 0.3557, + "MUSR": 0.4413, + "MMLU-PRO": 0.4741 + } + }, + { + "model_id": "CombinHorizon/huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES", + "name": "huihui-ai-abliterated-Qwen2.5-32B-Inst-BaseMerge-TIES", + "developer": "CombinHorizon", + "scores": { + "IFEval": 0.8206, + "BBH": 0.6929, + "MATH Level 5": 0.5944, + "GPQA": 0.3389, + "MUSR": 0.4207, + "MMLU-PRO": 0.5721 + } + }, + { + "model_id": "CombinHorizon/huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES", + "name": "huihui-ai-abliteratedV2-Qwen2.5-14B-Inst-BaseMerge-TIES", + "developer": "CombinHorizon", + "scores": { + "IFEval": 0.8176, + "BBH": 0.6336, + "MATH Level 5": 0.5476, + "GPQA": 0.3146, + "MUSR": 0.426, + "MMLU-PRO": 0.491 + } + }, + { + "model_id": "CombinHorizon/zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES", + "name": "zetasepic-abliteratedV2-Qwen2.5-32B-Inst-BaseMerge-TIES", + "developer": "CombinHorizon", + "scores": { + "IFEval": 0.8328, + "BBH": 0.6955, + "MATH Level 5": 0.5853, + "GPQA": 0.3674, + "MUSR": 0.4314, + "MMLU-PRO": 0.5685 + } + }, + { + "model_id": "ContactDoctor/Bio-Medical-3B-CoT-012025", + "name": "Bio-Medical-3B-CoT-012025", + "developer": "ContactDoctor", + "scores": { + "IFEval": 0.3604, + "BBH": 0.4383, + "MATH Level 5": 0.2213, + "GPQA": 0.3045, + "MUSR": 0.3368, + "MMLU-PRO": 0.2934 + } + }, + { + "model_id": "ContactDoctor/Bio-Medical-Llama-3-8B", + "name": "Bio-Medical-Llama-3-8B", + "developer": "ContactDoctor", + "scores": { + "IFEval": 0.4422, + "BBH": 0.4863, + "MATH Level 5": 0.0672, + "GPQA": 0.3339, + "MUSR": 0.3514, + "MMLU-PRO": 0.3648 + } + }, + { + "model_id": "CoolSpring/Qwen2-0.5B-Abyme", + "name": "Qwen2-0.5B-Abyme", + "developer": "CoolSpring", + "scores": { + "IFEval": 0.1915, + "BBH": 0.2862, + "MATH Level 5": 0.0295, + "GPQA": 0.2534, + "MUSR": 0.3542, + "MMLU-PRO": 0.1333 + } + }, + { + "model_id": "CoolSpring/Qwen2-0.5B-Abyme-merge2", + "name": "Qwen2-0.5B-Abyme-merge2", + "developer": "CoolSpring", + "scores": { + "IFEval": 0.2022, + "BBH": 0.2994, + "MATH Level 5": 0.0332, + "GPQA": 0.2601, + "MUSR": 0.3687, + "MMLU-PRO": 0.1489 + } + }, + { + "model_id": "CoolSpring/Qwen2-0.5B-Abyme-merge3", + "name": "Qwen2-0.5B-Abyme-merge3", + "developer": "CoolSpring", + "scores": { + "IFEval": 0.2386, + "BBH": 0.3003, + "MATH Level 5": 0.0317, + "GPQA": 0.2643, + "MUSR": 0.3501, + "MMLU-PRO": 0.15 + } + }, + { + "model_id": "Corianas/Neural-Mistral-7B", + "name": "Neural-Mistral-7B", + "developer": "Corianas", + "scores": { + "IFEval": 0.5489, + "BBH": 0.4428, + "MATH Level 5": 0.0189, + "GPQA": 0.2836, + "MUSR": 0.3873, + "MMLU-PRO": 0.2738 + } + }, + { + "model_id": "Corianas/Quokka_2.7b", + "name": "Quokka_2.7b", + "developer": "Corianas", + "scores": { + "IFEval": 0.1749, + "BBH": 0.3055, + "MATH Level 5": 0.0083, + "GPQA": 0.2559, + "MUSR": 0.3908, + "MMLU-PRO": 0.1145 + } + }, + { + "model_id": "Corianas/llama-3-reactor", + "name": "llama-3-reactor", + "developer": "Corianas", + "scores": { + "IFEval": 0.23, + "BBH": 0.4457, + "MATH Level 5": 0.0468, + "GPQA": 0.2978, + "MUSR": 0.3977, + "MMLU-PRO": 0.2801 + } + }, + { + "model_id": "CortexLM/btlm-7b-base-v0.2", + "name": "btlm-7b-base-v0.2", + "developer": "CortexLM", + "scores": { + "IFEval": 0.1483, + "BBH": 0.4006, + "MATH Level 5": 0.0151, + "GPQA": 0.2534, + "MUSR": 0.3846, + "MMLU-PRO": 0.235 + } + }, + { + "model_id": "Cran-May/SCE-2-24B", + "name": "SCE-2-24B", + "developer": "Cran-May", + "scores": { + "IFEval": 0.5866, + "BBH": 0.6265, + "MATH Level 5": 0.1896, + "GPQA": 0.3372, + "MUSR": 0.4528, + "MMLU-PRO": 0.4612 + } + }, + { + "model_id": "Cran-May/SCE-3-24B", + "name": "SCE-3-24B", + "developer": "Cran-May", + "scores": { + "IFEval": 0.5465, + "BBH": 0.5973, + "MATH Level 5": 0.1881, + "GPQA": 0.3465, + "MUSR": 0.4435, + "MMLU-PRO": 0.4647 + } + }, + { + "model_id": "Cran-May/T.E-8.1", + "name": "T.E-8.1", + "developer": "Cran-May", + "scores": { + "IFEval": 0.7077, + "BBH": 0.5582, + "MATH Level 5": 0.4456, + "GPQA": 0.3129, + "MUSR": 0.4505, + "MMLU-PRO": 0.4432 + } + }, + { + "model_id": "Cran-May/merge_model_20250308_2", + "name": "merge_model_20250308_2", + "developer": "Cran-May", + "scores": { + "IFEval": 0.5932, + "BBH": 0.6585, + "MATH Level 5": 0.4381, + "GPQA": 0.3909, + "MUSR": 0.4794, + "MMLU-PRO": 0.542 + } + }, + { + "model_id": "Cran-May/merge_model_20250308_3", + "name": "merge_model_20250308_3", + "developer": "Cran-May", + "scores": { + "IFEval": 0.6018, + "BBH": 0.6271, + "MATH Level 5": 0.2545, + "GPQA": 0.3221, + "MUSR": 0.432, + "MMLU-PRO": 0.4962 + } + }, + { + "model_id": "Cran-May/merge_model_20250308_4", + "name": "merge_model_20250308_4", + "developer": "Cran-May", + "scores": { + "IFEval": 0.454, + "BBH": 0.6664, + "MATH Level 5": 0.4199, + "GPQA": 0.3977, + "MUSR": 0.4688, + "MMLU-PRO": 0.5367 + } + }, + { + "model_id": "Cran-May/tempmotacilla-cinerea-0308", + "name": "tempmotacilla-cinerea-0308", + "developer": "Cran-May", + "scores": { + "IFEval": 0.8085, + "BBH": 0.6551, + "MATH Level 5": 0.5551, + "GPQA": 0.3624, + "MUSR": 0.4208, + "MMLU-PRO": 0.525 + } + }, + { + "model_id": "CreitinGameplays/Llama-3.1-8B-R1-v0.1", + "name": "Llama-3.1-8B-R1-v0.1", + "developer": "CreitinGameplays", + "scores": { + "IFEval": 0.3235, + "BBH": 0.3057, + "MATH Level 5": 0.1813, + "GPQA": 0.2584, + "MUSR": 0.3622, + "MMLU-PRO": 0.1252 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Broca", + "name": "Qwen2.5-14B-Broca", + "developer": "CultriX", + "scores": { + "IFEval": 0.5604, + "BBH": 0.6527, + "MATH Level 5": 0.358, + "GPQA": 0.3867, + "MUSR": 0.4767, + "MMLU-PRO": 0.5364 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-BrocaV9", + "name": "Qwen2.5-14B-BrocaV9", + "developer": "CultriX", + "scores": { + "IFEval": 0.6763, + "BBH": 0.6391, + "MATH Level 5": 0.3814, + "GPQA": 0.3641, + "MUSR": 0.469, + "MMLU-PRO": 0.5331 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Brocav3", + "name": "Qwen2.5-14B-Brocav3", + "developer": "CultriX", + "scores": { + "IFEval": 0.6952, + "BBH": 0.6452, + "MATH Level 5": 0.3875, + "GPQA": 0.3591, + "MUSR": 0.4756, + "MMLU-PRO": 0.5317 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Brocav6", + "name": "Qwen2.5-14B-Brocav6", + "developer": "CultriX", + "scores": { + "IFEval": 0.6995, + "BBH": 0.6389, + "MATH Level 5": 0.3875, + "GPQA": 0.3674, + "MUSR": 0.4742, + "MMLU-PRO": 0.5319 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Brocav7", + "name": "Qwen2.5-14B-Brocav7", + "developer": "CultriX", + "scores": { + "IFEval": 0.6724, + "BBH": 0.6444, + "MATH Level 5": 0.3844, + "GPQA": 0.3674, + "MUSR": 0.4796, + "MMLU-PRO": 0.5258 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Emerged", + "name": "Qwen2.5-14B-Emerged", + "developer": "CultriX", + "scores": { + "IFEval": 0.7, + "BBH": 0.626, + "MATH Level 5": 0.3248, + "GPQA": 0.3574, + "MUSR": 0.4691, + "MMLU-PRO": 0.5186 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Emergedv3", + "name": "Qwen2.5-14B-Emergedv3", + "developer": "CultriX", + "scores": { + "IFEval": 0.6388, + "BBH": 0.6191, + "MATH Level 5": 0.4358, + "GPQA": 0.3607, + "MUSR": 0.4728, + "MMLU-PRO": 0.5174 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-FinalMerge", + "name": "Qwen2.5-14B-FinalMerge", + "developer": "CultriX", + "scores": { + "IFEval": 0.4891, + "BBH": 0.5715, + "MATH Level 5": 0.3814, + "GPQA": 0.3549, + "MUSR": 0.4379, + "MMLU-PRO": 0.4574 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Hyper", + "name": "Qwen2.5-14B-Hyper", + "developer": "CultriX", + "scores": { + "IFEval": 0.5391, + "BBH": 0.6507, + "MATH Level 5": 0.3437, + "GPQA": 0.3918, + "MUSR": 0.4898, + "MMLU-PRO": 0.5374 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-HyperMarck-dl", + "name": "Qwen2.5-14B-HyperMarck-dl", + "developer": "CultriX", + "scores": { + "IFEval": 0.665, + "BBH": 0.6096, + "MATH Level 5": 0.5287, + "GPQA": 0.3674, + "MUSR": 0.4416, + "MMLU-PRO": 0.5091 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Hyperionv3", + "name": "Qwen2.5-14B-Hyperionv3", + "developer": "CultriX", + "scores": { + "IFEval": 0.6836, + "BBH": 0.6522, + "MATH Level 5": 0.3701, + "GPQA": 0.3708, + "MUSR": 0.473, + "MMLU-PRO": 0.534 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Hyperionv4", + "name": "Qwen2.5-14B-Hyperionv4", + "developer": "CultriX", + "scores": { + "IFEval": 0.5416, + "BBH": 0.6472, + "MATH Level 5": 0.3474, + "GPQA": 0.3977, + "MUSR": 0.4832, + "MMLU-PRO": 0.5364 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Hyperionv5", + "name": "Qwen2.5-14B-Hyperionv5", + "developer": "CultriX", + "scores": { + "IFEval": 0.6729, + "BBH": 0.6443, + "MATH Level 5": 0.3822, + "GPQA": 0.3716, + "MUSR": 0.4795, + "MMLU-PRO": 0.5302 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-MegaMerge-pt2", + "name": "Qwen2.5-14B-MegaMerge-pt2", + "developer": "CultriX", + "scores": { + "IFEval": 0.5683, + "BBH": 0.6578, + "MATH Level 5": 0.3995, + "GPQA": 0.3792, + "MUSR": 0.4729, + "MMLU-PRO": 0.5421 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-MergeStock", + "name": "Qwen2.5-14B-MergeStock", + "developer": "CultriX", + "scores": { + "IFEval": 0.5685, + "BBH": 0.6579, + "MATH Level 5": 0.4147, + "GPQA": 0.3733, + "MUSR": 0.4676, + "MMLU-PRO": 0.5396 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-ReasoningMerge", + "name": "Qwen2.5-14B-ReasoningMerge", + "developer": "CultriX", + "scores": { + "IFEval": 0.4605, + "BBH": 0.6578, + "MATH Level 5": 0.5204, + "GPQA": 0.4077, + "MUSR": 0.5166, + "MMLU-PRO": 0.5345 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Ultimav2", + "name": "Qwen2.5-14B-Ultimav2", + "developer": "CultriX", + "scores": { + "IFEval": 0.55, + "BBH": 0.6555, + "MATH Level 5": 0.3844, + "GPQA": 0.3851, + "MUSR": 0.4966, + "MMLU-PRO": 0.5417 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Unity", + "name": "Qwen2.5-14B-Unity", + "developer": "CultriX", + "scores": { + "IFEval": 0.6739, + "BBH": 0.602, + "MATH Level 5": 0.4313, + "GPQA": 0.3473, + "MUSR": 0.4679, + "MMLU-PRO": 0.5076 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Wernicke", + "name": "Qwen2.5-14B-Wernicke", + "developer": "CultriX", + "scores": { + "IFEval": 0.5235, + "BBH": 0.6568, + "MATH Level 5": 0.3814, + "GPQA": 0.3935, + "MUSR": 0.4689, + "MMLU-PRO": 0.5424 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Wernicke-SFT", + "name": "Qwen2.5-14B-Wernicke-SFT", + "developer": "CultriX", + "scores": { + "IFEval": 0.4937, + "BBH": 0.6461, + "MATH Level 5": 0.3595, + "GPQA": 0.354, + "MUSR": 0.39, + "MMLU-PRO": 0.507 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Wernicke-SLERP", + "name": "Qwen2.5-14B-Wernicke-SLERP", + "developer": "CultriX", + "scores": { + "IFEval": 0.5589, + "BBH": 0.6441, + "MATH Level 5": 0.4486, + "GPQA": 0.344, + "MUSR": 0.414, + "MMLU-PRO": 0.5094 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-Wernickev3", + "name": "Qwen2.5-14B-Wernickev3", + "developer": "CultriX", + "scores": { + "IFEval": 0.7048, + "BBH": 0.6184, + "MATH Level 5": 0.3542, + "GPQA": 0.3624, + "MUSR": 0.4717, + "MMLU-PRO": 0.5151 + } + }, + { + "model_id": "CultriX/Qwen2.5-14B-partialmergept1", + "name": "Qwen2.5-14B-partialmergept1", + "developer": "CultriX", + "scores": { + "IFEval": 0.6337, + "BBH": 0.6151, + "MATH Level 5": 0.4539, + "GPQA": 0.3616, + "MUSR": 0.4757, + "MMLU-PRO": 0.5208 + } + }, + { + "model_id": "CultriX/Qwenfinity-2.5-14B", + "name": "Qwenfinity-2.5-14B", + "developer": "CultriX", + "scores": { + "IFEval": 0.4814, + "BBH": 0.5655, + "MATH Level 5": 0.4101, + "GPQA": 0.349, + "MUSR": 0.4506, + "MMLU-PRO": 0.4498 + } + }, + { + "model_id": "CultriX/Qwestion-14B", + "name": "Qwestion-14B", + "developer": "CultriX", + "scores": { + "IFEval": 0.6318, + "BBH": 0.645, + "MATH Level 5": 0.3724, + "GPQA": 0.3683, + "MUSR": 0.4636, + "MMLU-PRO": 0.5422 + } + }, + { + "model_id": "CultriX/SeQwence-14B", + "name": "SeQwence-14B", + "developer": "CultriX", + "scores": { + "IFEval": 0.5352, + "BBH": 0.6506, + "MATH Level 5": 0.3535, + "GPQA": 0.3607, + "MUSR": 0.4666, + "MMLU-PRO": 0.5419 + } + }, + { + "model_id": "CultriX/SeQwence-14B-EvolMerge", + "name": "SeQwence-14B-EvolMerge", + "developer": "CultriX", + "scores": { + "IFEval": 0.5382, + "BBH": 0.6572, + "MATH Level 5": 0.3671, + "GPQA": 0.3809, + "MUSR": 0.4821, + "MMLU-PRO": 0.5419 + } + }, + { + "model_id": "CultriX/SeQwence-14B-EvolMergev1", + "name": "SeQwence-14B-EvolMergev1", + "developer": "CultriX", + "scores": { + "IFEval": 0.5555, + "BBH": 0.6546, + "MATH Level 5": 0.4215, + "GPQA": 0.3767, + "MUSR": 0.4623, + "MMLU-PRO": 0.5393 + } + }, + { + "model_id": "CultriX/SeQwence-14B-v5", + "name": "SeQwence-14B-v5", + "developer": "CultriX", + "scores": { + "IFEval": 0.592, + "BBH": 0.6517, + "MATH Level 5": 0.3308, + "GPQA": 0.37, + "MUSR": 0.4714, + "MMLU-PRO": 0.5415 + } + }, + { + "model_id": "CultriX/SeQwence-14Bv1", + "name": "SeQwence-14Bv1", + "developer": "CultriX", + "scores": { + "IFEval": 0.6678, + "BBH": 0.6345, + "MATH Level 5": 0.361, + "GPQA": 0.3616, + "MUSR": 0.4704, + "MMLU-PRO": 0.532 + } + }, + { + "model_id": "CultriX/SeQwence-14Bv2", + "name": "SeQwence-14Bv2", + "developer": "CultriX", + "scores": { + "IFEval": 0.5786, + "BBH": 0.6305, + "MATH Level 5": 0.4758, + "GPQA": 0.3607, + "MUSR": 0.4601, + "MMLU-PRO": 0.5334 + } + }, + { + "model_id": "CultriX/SeQwence-14Bv3", + "name": "SeQwence-14Bv3", + "developer": "CultriX", + "scores": { + "IFEval": 0.5719, + "BBH": 0.6302, + "MATH Level 5": 0.4766, + "GPQA": 0.3649, + "MUSR": 0.4624, + "MMLU-PRO": 0.5335 + } + }, + { + "model_id": "DRXD1000/Atlas-7B", + "name": "Atlas-7B", + "developer": "DRXD1000", + "scores": { + "IFEval": 0.3704, + "BBH": 0.3302, + "MATH Level 5": 0.0189, + "GPQA": 0.2576, + "MUSR": 0.3342, + "MMLU-PRO": 0.1401 + } + }, + { + "model_id": "DRXD1000/Phoenix-7B", + "name": "Phoenix-7B", + "developer": "DRXD1000", + "scores": { + "IFEval": 0.321, + "BBH": 0.3932, + "MATH Level 5": 0.0166, + "GPQA": 0.2785, + "MUSR": 0.3849, + "MMLU-PRO": 0.2343 + } + }, + { + "model_id": "DUAL-GPO/zephyr-7b-ipo-0k-15k-i1", + "name": "zephyr-7b-ipo-0k-15k-i1", + "developer": "DUAL-GPO", + "scores": { + "IFEval": 0.2756, + "BBH": 0.4473, + "MATH Level 5": 0.0302, + "GPQA": 0.2911, + "MUSR": 0.4173, + "MMLU-PRO": 0.313 + } + }, + { + "model_id": "DZgas/GIGABATEMAN-7B", + "name": "GIGABATEMAN-7B", + "developer": "DZgas", + "scores": { + "IFEval": 0.4607, + "BBH": 0.5032, + "MATH Level 5": 0.0551, + "GPQA": 0.2894, + "MUSR": 0.4328, + "MMLU-PRO": 0.3177 + } + }, + { + "model_id": "Daemontatox/AetherDrake-SFT", + "name": "AetherDrake-SFT", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4813, + "BBH": 0.4872, + "MATH Level 5": 0.1511, + "GPQA": 0.3205, + "MUSR": 0.4088, + "MMLU-PRO": 0.3499 + } + }, + { + "model_id": "Daemontatox/AetherSett", + "name": "AetherSett", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.537, + "BBH": 0.5452, + "MATH Level 5": 0.3973, + "GPQA": 0.3079, + "MUSR": 0.4603, + "MMLU-PRO": 0.4279 + } + }, + { + "model_id": "Daemontatox/AetherTOT", + "name": "AetherTOT", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4398, + "BBH": 0.5066, + "MATH Level 5": 0.1488, + "GPQA": 0.3238, + "MUSR": 0.4079, + "MMLU-PRO": 0.3804 + } + }, + { + "model_id": "Daemontatox/AetherUncensored", + "name": "AetherUncensored", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4042, + "BBH": 0.4463, + "MATH Level 5": 0.145, + "GPQA": 0.2886, + "MUSR": 0.3747, + "MMLU-PRO": 0.271 + } + }, + { + "model_id": "Daemontatox/Cogito-MIS", + "name": "Cogito-MIS", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.1815, + "BBH": 0.506, + "MATH Level 5": 0.0861, + "GPQA": 0.2567, + "MUSR": 0.3768, + "MMLU-PRO": 0.1435 + } + }, + { + "model_id": "Daemontatox/CogitoDistil", + "name": "CogitoDistil", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.2776, + "BBH": 0.3677, + "MATH Level 5": 0.3927, + "GPQA": 0.2592, + "MUSR": 0.3755, + "MMLU-PRO": 0.2625 + } + }, + { + "model_id": "Daemontatox/CogitoZ", + "name": "CogitoZ", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.3967, + "BBH": 0.6734, + "MATH Level 5": 0.5242, + "GPQA": 0.3951, + "MUSR": 0.4793, + "MMLU-PRO": 0.5593 + } + }, + { + "model_id": "Daemontatox/CogitoZ14", + "name": "CogitoZ14", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.6637, + "BBH": 0.6298, + "MATH Level 5": 0.4222, + "GPQA": 0.3163, + "MUSR": 0.4059, + "MMLU-PRO": 0.3999 + } + }, + { + "model_id": "Daemontatox/DocumentCogito", + "name": "DocumentCogito", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.5064, + "BBH": 0.5112, + "MATH Level 5": 0.1631, + "GPQA": 0.3163, + "MUSR": 0.3973, + "MMLU-PRO": 0.3802 + } + }, + { + "model_id": "Daemontatox/Llama3.3-70B-CogniLink", + "name": "Llama3.3-70B-CogniLink", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.6931, + "BBH": 0.6668, + "MATH Level 5": 0.4139, + "GPQA": 0.4455, + "MUSR": 0.4877, + "MMLU-PRO": 0.5173 + } + }, + { + "model_id": "Daemontatox/Llama_cot", + "name": "Llama_cot", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.7549, + "BBH": 0.4838, + "MATH Level 5": 0.2024, + "GPQA": 0.2911, + "MUSR": 0.3872, + "MMLU-PRO": 0.3518 + } + }, + { + "model_id": "Daemontatox/MawaredT1", + "name": "MawaredT1", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4199, + "BBH": 0.5215, + "MATH Level 5": 0.3021, + "GPQA": 0.3347, + "MUSR": 0.4702, + "MMLU-PRO": 0.4718 + } + }, + { + "model_id": "Daemontatox/Mini_QwQ", + "name": "Mini_QwQ", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4497, + "BBH": 0.5549, + "MATH Level 5": 0.4192, + "GPQA": 0.3037, + "MUSR": 0.4682, + "MMLU-PRO": 0.4373 + } + }, + { + "model_id": "Daemontatox/NemoR", + "name": "NemoR", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.2287, + "BBH": 0.5194, + "MATH Level 5": 0.0831, + "GPQA": 0.3272, + "MUSR": 0.3908, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "Daemontatox/PathFinderAI2.0", + "name": "PathFinderAI2.0", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4541, + "BBH": 0.6658, + "MATH Level 5": 0.5076, + "GPQA": 0.302, + "MUSR": 0.4216, + "MMLU-PRO": 0.5547 + } + }, + { + "model_id": "Daemontatox/PathFinderAi3.0", + "name": "PathFinderAi3.0", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4271, + "BBH": 0.6884, + "MATH Level 5": 0.5045, + "GPQA": 0.4086, + "MUSR": 0.4807, + "MMLU-PRO": 0.5757 + } + }, + { + "model_id": "Daemontatox/PathfinderAI", + "name": "PathfinderAI", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4855, + "BBH": 0.6627, + "MATH Level 5": 0.4841, + "GPQA": 0.3096, + "MUSR": 0.4256, + "MMLU-PRO": 0.5542 + } + }, + { + "model_id": "Daemontatox/Phi-4-COT", + "name": "Phi-4-COT", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.1793, + "BBH": 0.6173, + "MATH Level 5": 0.2243, + "GPQA": 0.3356, + "MUSR": 0.453, + "MMLU-PRO": 0.5005 + } + }, + { + "model_id": "Daemontatox/PixelParse_AI", + "name": "PixelParse_AI", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4383, + "BBH": 0.5034, + "MATH Level 5": 0.1473, + "GPQA": 0.3238, + "MUSR": 0.4052, + "MMLU-PRO": 0.3778 + } + }, + { + "model_id": "Daemontatox/RA2.0", + "name": "RA2.0", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.3784, + "BBH": 0.4889, + "MATH Level 5": 0.3837, + "GPQA": 0.3054, + "MUSR": 0.4091, + "MMLU-PRO": 0.2616 + } + }, + { + "model_id": "Daemontatox/RA_Reasoner", + "name": "RA_Reasoner", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.5592, + "BBH": 0.6054, + "MATH Level 5": 0.2122, + "GPQA": 0.3314, + "MUSR": 0.3964, + "MMLU-PRO": 0.43 + } + }, + { + "model_id": "Daemontatox/RA_Reasoner2.0", + "name": "RA_Reasoner2.0", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.5366, + "BBH": 0.6062, + "MATH Level 5": 0.2311, + "GPQA": 0.3247, + "MUSR": 0.3884, + "MMLU-PRO": 0.4353 + } + }, + { + "model_id": "Daemontatox/ReasonTest", + "name": "ReasonTest", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.408, + "BBH": 0.5435, + "MATH Level 5": 0.2137, + "GPQA": 0.3188, + "MUSR": 0.4315, + "MMLU-PRO": 0.4272 + } + }, + { + "model_id": "Daemontatox/Research_PathfinderAI", + "name": "Research_PathfinderAI", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.3457, + "BBH": 0.2872, + "MATH Level 5": 0.1699, + "GPQA": 0.2408, + "MUSR": 0.3394, + "MMLU-PRO": 0.113 + } + }, + { + "model_id": "Daemontatox/SphinX", + "name": "SphinX", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.5725, + "BBH": 0.5441, + "MATH Level 5": 0.3082, + "GPQA": 0.2978, + "MUSR": 0.4405, + "MMLU-PRO": 0.4366 + } + }, + { + "model_id": "Daemontatox/Sphinx2.0", + "name": "Sphinx2.0", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.7123, + "BBH": 0.6473, + "MATH Level 5": 0.4018, + "GPQA": 0.2936, + "MUSR": 0.426, + "MMLU-PRO": 0.5184 + } + }, + { + "model_id": "Daemontatox/TinySphinx", + "name": "TinySphinx", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.2567, + "BBH": 0.331, + "MATH Level 5": 0.0431, + "GPQA": 0.2735, + "MUSR": 0.3328, + "MMLU-PRO": 0.1698 + } + }, + { + "model_id": "Daemontatox/TinySphinx2.0", + "name": "TinySphinx2.0", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.2535, + "BBH": 0.3168, + "MATH Level 5": 0.0325, + "GPQA": 0.2685, + "MUSR": 0.3382, + "MMLU-PRO": 0.1731 + } + }, + { + "model_id": "Daemontatox/Zirel-7B-Math", + "name": "Zirel-7B-Math", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.6639, + "BBH": 0.5448, + "MATH Level 5": 0.1979, + "GPQA": 0.3263, + "MUSR": 0.4789, + "MMLU-PRO": 0.4237 + } + }, + { + "model_id": "Daemontatox/Zirel_1.5", + "name": "Zirel_1.5", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.4168, + "BBH": 0.3985, + "MATH Level 5": 0.1133, + "GPQA": 0.2601, + "MUSR": 0.3658, + "MMLU-PRO": 0.2143 + } + }, + { + "model_id": "Daemontatox/mini-Cogito-R1", + "name": "mini-Cogito-R1", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.2298, + "BBH": 0.328, + "MATH Level 5": 0.2749, + "GPQA": 0.2869, + "MUSR": 0.3447, + "MMLU-PRO": 0.1482 + } + }, + { + "model_id": "Daemontatox/mini_Pathfinder", + "name": "mini_Pathfinder", + "developer": "Daemontatox", + "scores": { + "IFEval": 0.2962, + "BBH": 0.3956, + "MATH Level 5": 0.4751, + "GPQA": 0.2584, + "MUSR": 0.3781, + "MMLU-PRO": 0.2809 + } + }, + { + "model_id": "Dampfinchen/Llama-3.1-8B-Ultra-Instruct", + "name": "Llama-3.1-8B-Ultra-Instruct", + "developer": "Dampfinchen", + "scores": { + "IFEval": 0.8081, + "BBH": 0.5258, + "MATH Level 5": 0.2205, + "GPQA": 0.2919, + "MUSR": 0.4003, + "MMLU-PRO": 0.3826 + } + }, + { + "model_id": "Danielbrdz/Barcenas-10b", + "name": "Barcenas-10b", + "developer": "Danielbrdz", + "scores": { + "IFEval": 0.6608, + "BBH": 0.6121, + "MATH Level 5": 0.2153, + "GPQA": 0.3414, + "MUSR": 0.4135, + "MMLU-PRO": 0.4361 + } + }, + { + "model_id": "Danielbrdz/Barcenas-14b-Phi-3-medium-ORPO", + "name": "Barcenas-14b-Phi-3-medium-ORPO", + "developer": "Danielbrdz", + "scores": { + "IFEval": 0.4799, + "BBH": 0.6536, + "MATH Level 5": 0.2024, + "GPQA": 0.3263, + "MUSR": 0.4808, + "MMLU-PRO": 0.4723 + } + }, + { + "model_id": "Danielbrdz/Barcenas-14b-phi-4", + "name": "Barcenas-14b-phi-4", + "developer": "Danielbrdz", + "scores": { + "IFEval": 0.0498, + "BBH": 0.6769, + "MATH Level 5": 0.2583, + "GPQA": 0.3834, + "MUSR": 0.5097, + "MMLU-PRO": 0.5175 + } + }, + { + "model_id": "Danielbrdz/Barcenas-14b-phi-4-v2", + "name": "Barcenas-14b-phi-4-v2", + "developer": "Danielbrdz", + "scores": { + "IFEval": 0.2775, + "BBH": 0.6573, + "MATH Level 5": 0.3218, + "GPQA": 0.3784, + "MUSR": 0.4399, + "MMLU-PRO": 0.5244 + } + }, + { + "model_id": "Danielbrdz/Barcenas-3b-GRPO", + "name": "Barcenas-3b-GRPO", + "developer": "Danielbrdz", + "scores": { + "IFEval": 0.5444, + "BBH": 0.4414, + "MATH Level 5": 0.1375, + "GPQA": 0.2903, + "MUSR": 0.3576, + "MMLU-PRO": 0.3037 + } + }, + { + "model_id": "Danielbrdz/Barcenas-Llama3-8b-ORPO", + "name": "Barcenas-Llama3-8b-ORPO", + "developer": "Danielbrdz", + "scores": { + "IFEval": 0.7372, + "BBH": 0.4987, + "MATH Level 5": 0.0657, + "GPQA": 0.307, + "MUSR": 0.419, + "MMLU-PRO": 0.383 + } + }, + { + "model_id": "Danielbrdz/Barcenas-R1-Qwen-1.5b", + "name": "Barcenas-R1-Qwen-1.5b", + "developer": "Danielbrdz", + "scores": { + "IFEval": 0.2428, + "BBH": 0.3587, + "MATH Level 5": 0.3497, + "GPQA": 0.3037, + "MUSR": 0.3541, + "MMLU-PRO": 0.1909 + } + }, + { + "model_id": "Dans-DiscountModels/12b-mn-dans-reasoning-test-2", + "name": "12b-mn-dans-reasoning-test-2", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.3711, + "BBH": 0.4807, + "MATH Level 5": 0.0634, + "GPQA": 0.2735, + "MUSR": 0.3702, + "MMLU-PRO": 0.2507 + } + }, + { + "model_id": "Dans-DiscountModels/12b-mn-dans-reasoning-test-3", + "name": "12b-mn-dans-reasoning-test-3", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.5053, + "BBH": 0.4839, + "MATH Level 5": 0.0778, + "GPQA": 0.271, + "MUSR": 0.4168, + "MMLU-PRO": 0.2516 + } + }, + { + "model_id": "Dans-DiscountModels/Dans-Instruct-CoreCurriculum-12b-ChatML", + "name": "Dans-Instruct-CoreCurriculum-12b-ChatML", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.2111, + "BBH": 0.4792, + "MATH Level 5": 0.0431, + "GPQA": 0.2802, + "MUSR": 0.3606, + "MMLU-PRO": 0.2805 + } + }, + { + "model_id": "Dans-DiscountModels/Dans-Instruct-Mix-8b-ChatML", + "name": "Dans-Instruct-Mix-8b-ChatML", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.0825, + "BBH": 0.4738, + "MATH Level 5": 0.0551, + "GPQA": 0.2945, + "MUSR": 0.3918, + "MMLU-PRO": 0.3288 + } + }, + { + "model_id": "Dans-DiscountModels/Dans-Instruct-Mix-8b-ChatML-V0.1.0", + "name": "Dans-Instruct-Mix-8b-ChatML-V0.1.0", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.0668, + "BBH": 0.4775, + "MATH Level 5": 0.0672, + "GPQA": 0.2861, + "MUSR": 0.3786, + "MMLU-PRO": 0.3284 + } + }, + { + "model_id": "Dans-DiscountModels/Dans-Instruct-Mix-8b-ChatML-V0.1.1", + "name": "Dans-Instruct-Mix-8b-ChatML-V0.1.1", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.0911, + "BBH": 0.4749, + "MATH Level 5": 0.0597, + "GPQA": 0.2911, + "MUSR": 0.3825, + "MMLU-PRO": 0.3279 + } + }, + { + "model_id": "Dans-DiscountModels/Dans-Instruct-Mix-8b-ChatML-V0.2.0", + "name": "Dans-Instruct-Mix-8b-ChatML-V0.2.0", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.5064, + "BBH": 0.4624, + "MATH Level 5": 0.0733, + "GPQA": 0.2936, + "MUSR": 0.3644, + "MMLU-PRO": 0.3 + } + }, + { + "model_id": "Dans-DiscountModels/Mistral-7b-v0.3-Test-E0.7", + "name": "Mistral-7b-v0.3-Test-E0.7", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.5124, + "BBH": 0.475, + "MATH Level 5": 0.034, + "GPQA": 0.2961, + "MUSR": 0.4005, + "MMLU-PRO": 0.2744 + } + }, + { + "model_id": "Dans-DiscountModels/mistral-7b-test-merged", + "name": "mistral-7b-test-merged", + "developer": "Dans-DiscountModels", + "scores": { + "IFEval": 0.6678, + "BBH": 0.4898, + "MATH Level 5": 0.0446, + "GPQA": 0.2945, + "MUSR": 0.3754, + "MMLU-PRO": 0.2978 + } + }, + { + "model_id": "Darkknight535/OpenCrystal-12B-L3", + "name": "OpenCrystal-12B-L3", + "developer": "Darkknight535", + "scores": { + "IFEval": 0.4071, + "BBH": 0.5223, + "MATH Level 5": 0.0899, + "GPQA": 0.3062, + "MUSR": 0.3657, + "MMLU-PRO": 0.364 + } + }, + { + "model_id": "DavidAU/DeepHermes-3-Llama-3-8B-Preview-16.5B-Brainstorm", + "name": "DeepHermes-3-Llama-3-8B-Preview-16.5B-Brainstorm", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3136, + "BBH": 0.4762, + "MATH Level 5": 0.1057, + "GPQA": 0.3138, + "MUSR": 0.3928, + "MMLU-PRO": 0.3209 + } + }, + { + "model_id": "DavidAU/DeepSeek-BlackRoot-R1-Distill-Llama-3.1-8B", + "name": "DeepSeek-BlackRoot-R1-Distill-Llama-3.1-8B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3685, + "BBH": 0.4887, + "MATH Level 5": 0.0657, + "GPQA": 0.318, + "MUSR": 0.432, + "MMLU-PRO": 0.2976 + } + }, + { + "model_id": "DavidAU/DeepSeek-Grand-Horror-SMB-R1-Distill-Llama-3.1-16B", + "name": "DeepSeek-Grand-Horror-SMB-R1-Distill-Llama-3.1-16B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.2507, + "BBH": 0.4488, + "MATH Level 5": 0.0295, + "GPQA": 0.3138, + "MUSR": 0.4164, + "MMLU-PRO": 0.2709 + } + }, + { + "model_id": "DavidAU/DeepSeek-MOE-4X8B-R1-Distill-Llama-3.1-Deep-Thinker-Uncensored-24B", + "name": "DeepSeek-MOE-4X8B-R1-Distill-Llama-3.1-Deep-Thinker-Uncensored-24B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3883, + "BBH": 0.4886, + "MATH Level 5": 0.0816, + "GPQA": 0.323, + "MUSR": 0.4375, + "MMLU-PRO": 0.3024 + } + }, + { + "model_id": "DavidAU/DeepSeek-MOE-4X8B-R1-Distill-Llama-3.1-Mad-Scientist-24B", + "name": "DeepSeek-MOE-4X8B-R1-Distill-Llama-3.1-Mad-Scientist-24B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3436, + "BBH": 0.4769, + "MATH Level 5": 0.0755, + "GPQA": 0.3372, + "MUSR": 0.4231, + "MMLU-PRO": 0.297 + } + }, + { + "model_id": "DavidAU/DeepSeek-R1-Distill-Qwen-25.5B-Brainstorm", + "name": "DeepSeek-R1-Distill-Qwen-25.5B-Brainstorm", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3416, + "BBH": 0.5807, + "MATH Level 5": 0.5536, + "GPQA": 0.3859, + "MUSR": 0.5155, + "MMLU-PRO": 0.4624 + } + }, + { + "model_id": "DavidAU/DeepSeek-V2-Grand-Horror-SMB-R1-Distill-Llama-3.1-Uncensored-16.5B", + "name": "DeepSeek-V2-Grand-Horror-SMB-R1-Distill-Llama-3.1-Uncensored-16.5B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.2853, + "BBH": 0.4462, + "MATH Level 5": 0.0174, + "GPQA": 0.3054, + "MUSR": 0.4179, + "MMLU-PRO": 0.2778 + } + }, + { + "model_id": "DavidAU/DeepThought-MOE-8X3B-R1-Llama-3.2-Reasoning-18B", + "name": "DeepThought-MOE-8X3B-R1-Llama-3.2-Reasoning-18B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3793, + "BBH": 0.4232, + "MATH Level 5": 0.108, + "GPQA": 0.2794, + "MUSR": 0.356, + "MMLU-PRO": 0.272 + } + }, + { + "model_id": "DavidAU/Gemma-The-Writer-9B", + "name": "Gemma-The-Writer-9B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.174, + "BBH": 0.5905, + "MATH Level 5": 0.0876, + "GPQA": 0.3456, + "MUSR": 0.4099, + "MMLU-PRO": 0.3979 + } + }, + { + "model_id": "DavidAU/Gemma-The-Writer-DEADLINE-10B", + "name": "Gemma-The-Writer-DEADLINE-10B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.2332, + "BBH": 0.5896, + "MATH Level 5": 0.0989, + "GPQA": 0.3423, + "MUSR": 0.4189, + "MMLU-PRO": 0.3946 + } + }, + { + "model_id": "DavidAU/Gemma-The-Writer-J.GutenBerg-10B", + "name": "Gemma-The-Writer-J.GutenBerg-10B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.2858, + "BBH": 0.5909, + "MATH Level 5": 0.0921, + "GPQA": 0.3381, + "MUSR": 0.4176, + "MMLU-PRO": 0.3947 + } + }, + { + "model_id": "DavidAU/Gemma-The-Writer-Mighty-Sword-9B", + "name": "Gemma-The-Writer-Mighty-Sword-9B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.7528, + "BBH": 0.5912, + "MATH Level 5": 0.1911, + "GPQA": 0.3482, + "MUSR": 0.4112, + "MMLU-PRO": 0.3968 + } + }, + { + "model_id": "DavidAU/Gemma-The-Writer-N-Restless-Quill-10B-Uncensored", + "name": "Gemma-The-Writer-N-Restless-Quill-10B-Uncensored", + "developer": "DavidAU", + "scores": { + "IFEval": 0.7071, + "BBH": 0.5922, + "MATH Level 5": 0.2296, + "GPQA": 0.3414, + "MUSR": 0.4163, + "MMLU-PRO": 0.3966 + } + }, + { + "model_id": "DavidAU/L3-DARKEST-PLANET-16.5B", + "name": "L3-DARKEST-PLANET-16.5B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.6231, + "BBH": 0.523, + "MATH Level 5": 0.0899, + "GPQA": 0.2953, + "MUSR": 0.3754, + "MMLU-PRO": 0.363 + } + }, + { + "model_id": "DavidAU/L3-Dark-Planet-8B", + "name": "L3-Dark-Planet-8B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.4134, + "BBH": 0.5084, + "MATH Level 5": 0.0823, + "GPQA": 0.3003, + "MUSR": 0.3616, + "MMLU-PRO": 0.3737 + } + }, + { + "model_id": "DavidAU/L3-Jamet-12.2B-MK.V-Blackroot-Instruct", + "name": "L3-Jamet-12.2B-MK.V-Blackroot-Instruct", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3962, + "BBH": 0.4766, + "MATH Level 5": 0.0408, + "GPQA": 0.2785, + "MUSR": 0.402, + "MMLU-PRO": 0.3291 + } + }, + { + "model_id": "DavidAU/L3-Lumimaid-12.2B-v0.1-OAS-Instruct", + "name": "L3-Lumimaid-12.2B-v0.1-OAS-Instruct", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3924, + "BBH": 0.4693, + "MATH Level 5": 0.0461, + "GPQA": 0.2768, + "MUSR": 0.4194, + "MMLU-PRO": 0.3142 + } + }, + { + "model_id": "DavidAU/L3-SMB-Instruct-12.2B-F32", + "name": "L3-SMB-Instruct-12.2B-F32", + "developer": "DavidAU", + "scores": { + "IFEval": 0.4303, + "BBH": 0.4786, + "MATH Level 5": 0.0468, + "GPQA": 0.2819, + "MUSR": 0.4087, + "MMLU-PRO": 0.3312 + } + }, + { + "model_id": "DavidAU/L3-Stheno-Maid-Blackroot-Grand-HORROR-16B", + "name": "L3-Stheno-Maid-Blackroot-Grand-HORROR-16B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3439, + "BBH": 0.4736, + "MATH Level 5": 0.0219, + "GPQA": 0.271, + "MUSR": 0.4031, + "MMLU-PRO": 0.357 + } + }, + { + "model_id": "DavidAU/L3-Stheno-v3.2-12.2B-Instruct", + "name": "L3-Stheno-v3.2-12.2B-Instruct", + "developer": "DavidAU", + "scores": { + "IFEval": 0.4028, + "BBH": 0.4846, + "MATH Level 5": 0.0506, + "GPQA": 0.2752, + "MUSR": 0.4103, + "MMLU-PRO": 0.3345 + } + }, + { + "model_id": "DavidAU/L3.1-Dark-Planet-SpinFire-Uncensored-8B", + "name": "L3.1-Dark-Planet-SpinFire-Uncensored-8B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.7043, + "BBH": 0.5261, + "MATH Level 5": 0.0929, + "GPQA": 0.2794, + "MUSR": 0.3541, + "MMLU-PRO": 0.367 + } + }, + { + "model_id": "DavidAU/L3.1-MOE-2X8B-Deepseek-DeepHermes-e32-uncensored-abliterated-13.7B", + "name": "L3.1-MOE-2X8B-Deepseek-DeepHermes-e32-uncensored-abliterated-13.7B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.3345, + "BBH": 0.4421, + "MATH Level 5": 0.2606, + "GPQA": 0.3138, + "MUSR": 0.3749, + "MMLU-PRO": 0.2892 + } + }, + { + "model_id": "DavidAU/Qwen2.5-MOE-2X1.5B-DeepSeek-Uncensored-Censored-4B", + "name": "Qwen2.5-MOE-2X1.5B-DeepSeek-Uncensored-Censored-4B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.1783, + "BBH": 0.3033, + "MATH Level 5": 0.0249, + "GPQA": 0.2592, + "MUSR": 0.3715, + "MMLU-PRO": 0.1142 + } + }, + { + "model_id": "DavidAU/Qwen2.5-MOE-2X7B-DeepSeek-Abliterated-Censored-19B", + "name": "Qwen2.5-MOE-2X7B-DeepSeek-Abliterated-Censored-19B", + "developer": "DavidAU", + "scores": { + "IFEval": 0.2835, + "BBH": 0.3592, + "MATH Level 5": 0.2417, + "GPQA": 0.2651, + "MUSR": 0.3847, + "MMLU-PRO": 0.1636 + } + }, + { + "model_id": "DavidAU/Qwen2.5-MOE-6x1.5B-DeepSeek-Reasoning-e32", + "name": "Qwen2.5-MOE-6x1.5B-DeepSeek-Reasoning-e32", + "developer": "DavidAU", + "scores": { + "IFEval": 0.2107, + "BBH": 0.3286, + "MATH Level 5": 0.0665, + "GPQA": 0.2475, + "MUSR": 0.3404, + "MMLU-PRO": 0.1122 + } + }, + { + "model_id": "Davidsv/SUONG-1", + "name": "SUONG-1", + "developer": "Davidsv", + "scores": { + "IFEval": 0.2497, + "BBH": 0.2817, + "MATH Level 5": 0.0, + "GPQA": 0.2441, + "MUSR": 0.3578, + "MMLU-PRO": 0.1085 + } + }, + { + "model_id": "DavieLion/Llama-3.2-1B-SPIN-iter0", + "name": "Llama-3.2-1B-SPIN-iter0", + "developer": "DavieLion", + "scores": { + "IFEval": 0.1549, + "BBH": 0.2937, + "MATH Level 5": 0.006, + "GPQA": 0.2576, + "MUSR": 0.3565, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "DavieLion/Llama-3.2-1B-SPIN-iter1", + "name": "Llama-3.2-1B-SPIN-iter1", + "developer": "DavieLion", + "scores": { + "IFEval": 0.1575, + "BBH": 0.294, + "MATH Level 5": 0.0023, + "GPQA": 0.2508, + "MUSR": 0.3646, + "MMLU-PRO": 0.1118 + } + }, + { + "model_id": "DavieLion/Llama-3.2-1B-SPIN-iter2", + "name": "Llama-3.2-1B-SPIN-iter2", + "developer": "DavieLion", + "scores": { + "IFEval": 0.1376, + "BBH": 0.298, + "MATH Level 5": 0.0053, + "GPQA": 0.2542, + "MUSR": 0.3553, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "DavieLion/Llama-3.2-1B-SPIN-iter3", + "name": "Llama-3.2-1B-SPIN-iter3", + "developer": "DavieLion", + "scores": { + "IFEval": 0.1324, + "BBH": 0.2972, + "MATH Level 5": 0.0, + "GPQA": 0.2643, + "MUSR": 0.3527, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "DavieLion/Lllma-3.2-1B", + "name": "Lllma-3.2-1B", + "developer": "DavieLion", + "scores": { + "IFEval": 0.1601, + "BBH": 0.2965, + "MATH Level 5": 0.0068, + "GPQA": 0.2441, + "MUSR": 0.3578, + "MMLU-PRO": 0.1126 + } + }, + { + "model_id": "DebateLabKIT/Llama-3.1-Argunaut-1-8B-SFT", + "name": "Llama-3.1-Argunaut-1-8B-SFT", + "developer": "DebateLabKIT", + "scores": { + "IFEval": 0.5519, + "BBH": 0.4824, + "MATH Level 5": 0.145, + "GPQA": 0.2836, + "MUSR": 0.4503, + "MMLU-PRO": 0.3472 + } + }, + { + "model_id": "Deci/DeciLM-7B", + "name": "DeciLM-7B", + "developer": "Deci", + "scores": { + "IFEval": 0.2813, + "BBH": 0.4423, + "MATH Level 5": 0.0287, + "GPQA": 0.2953, + "MUSR": 0.4359, + "MMLU-PRO": 0.2692 + } + }, + { + "model_id": "Deci/DeciLM-7B-instruct", + "name": "DeciLM-7B-instruct", + "developer": "Deci", + "scores": { + "IFEval": 0.488, + "BBH": 0.459, + "MATH Level 5": 0.0302, + "GPQA": 0.2894, + "MUSR": 0.3884, + "MMLU-PRO": 0.2608 + } + }, + { + "model_id": "DeepAutoAI/Explore_Llama-3.1-8B-Inst", + "name": "Explore_Llama-3.1-8B-Inst", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.7795, + "BBH": 0.5117, + "MATH Level 5": 0.2009, + "GPQA": 0.2836, + "MUSR": 0.391, + "MMLU-PRO": 0.3792 + } + }, + { + "model_id": "DeepAutoAI/Explore_Llama-3.2-1B-Inst", + "name": "Explore_Llama-3.2-1B-Inst", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.5649, + "BBH": 0.3505, + "MATH Level 5": 0.0748, + "GPQA": 0.2559, + "MUSR": 0.3183, + "MMLU-PRO": 0.1809 + } + }, + { + "model_id": "DeepAutoAI/Explore_Llama-3.2-1B-Inst_v0", + "name": "Explore_Llama-3.2-1B-Inst_v0", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.5597, + "BBH": 0.3365, + "MATH Level 5": 0.0597, + "GPQA": 0.2634, + "MUSR": 0.3103, + "MMLU-PRO": 0.1804 + } + }, + { + "model_id": "DeepAutoAI/Explore_Llama-3.2-1B-Inst_v1", + "name": "Explore_Llama-3.2-1B-Inst_v1", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.4999, + "BBH": 0.3141, + "MATH Level 5": 0.031, + "GPQA": 0.245, + "MUSR": 0.3781, + "MMLU-PRO": 0.1269 + } + }, + { + "model_id": "DeepAutoAI/Explore_Llama-3.2-1B-Inst_v1.1", + "name": "Explore_Llama-3.2-1B-Inst_v1.1", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.5844, + "BBH": 0.3513, + "MATH Level 5": 0.0718, + "GPQA": 0.2626, + "MUSR": 0.3117, + "MMLU-PRO": 0.1818 + } + }, + { + "model_id": "DeepAutoAI/causal_gpt2", + "name": "causal_gpt2", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.1813, + "BBH": 0.3026, + "MATH Level 5": 0.0053, + "GPQA": 0.2601, + "MUSR": 0.427, + "MMLU-PRO": 0.1131 + } + }, + { + "model_id": "DeepAutoAI/d2nwg_Llama-3.1-8B-Instruct-v0.0", + "name": "d2nwg_Llama-3.1-8B-Instruct-v0.0", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.7893, + "BBH": 0.508, + "MATH Level 5": 0.1805, + "GPQA": 0.2919, + "MUSR": 0.4135, + "MMLU-PRO": 0.3877 + } + }, + { + "model_id": "DeepAutoAI/d2nwg_causal_gpt2", + "name": "d2nwg_causal_gpt2", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.1916, + "BBH": 0.3027, + "MATH Level 5": 0.0045, + "GPQA": 0.2576, + "MUSR": 0.4297, + "MMLU-PRO": 0.1151 + } + }, + { + "model_id": "DeepAutoAI/d2nwg_causal_gpt2_v1", + "name": "d2nwg_causal_gpt2_v1", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.1989, + "BBH": 0.2992, + "MATH Level 5": 0.0038, + "GPQA": 0.2584, + "MUSR": 0.4337, + "MMLU-PRO": 0.1135 + } + }, + { + "model_id": "DeepAutoAI/ldm_soup_Llama-3.1-8B-Inst", + "name": "ldm_soup_Llama-3.1-8B-Inst", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.8033, + "BBH": 0.5121, + "MATH Level 5": 0.1888, + "GPQA": 0.2894, + "MUSR": 0.4161, + "MMLU-PRO": 0.3886 + } + }, + { + "model_id": "DeepAutoAI/ldm_soup_Llama-3.1-8B-Instruct-v0.0", + "name": "ldm_soup_Llama-3.1-8B-Instruct-v0.0", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.7889, + "BBH": 0.5125, + "MATH Level 5": 0.1918, + "GPQA": 0.2911, + "MUSR": 0.4121, + "MMLU-PRO": 0.3895 + } + }, + { + "model_id": "DeepAutoAI/ldm_soup_Llama-3.1-8B-Instruct-v0.1", + "name": "ldm_soup_Llama-3.1-8B-Instruct-v0.1", + "developer": "DeepAutoAI", + "scores": { + "IFEval": 0.7889, + "BBH": 0.5125, + "MATH Level 5": 0.1918, + "GPQA": 0.2911, + "MUSR": 0.4121, + "MMLU-PRO": 0.3895 + } + }, + { + "model_id": "DeepMount00/Lexora-Lite-3B", + "name": "Lexora-Lite-3B", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.5776, + "BBH": 0.4873, + "MATH Level 5": 0.2304, + "GPQA": 0.2743, + "MUSR": 0.3966, + "MMLU-PRO": 0.3602 + } + }, + { + "model_id": "DeepMount00/Lexora-Lite-3B_v2", + "name": "Lexora-Lite-3B_v2", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.4943, + "BBH": 0.4812, + "MATH Level 5": 0.2281, + "GPQA": 0.271, + "MUSR": 0.3822, + "MMLU-PRO": 0.3544 + } + }, + { + "model_id": "DeepMount00/Lexora-Medium-7B", + "name": "Lexora-Medium-7B", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.4103, + "BBH": 0.5145, + "MATH Level 5": 0.2221, + "GPQA": 0.3054, + "MUSR": 0.4439, + "MMLU-PRO": 0.4325 + } + }, + { + "model_id": "DeepMount00/Llama-3-8b-Ita", + "name": "Llama-3-8b-Ita", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.753, + "BBH": 0.4936, + "MATH Level 5": 0.0665, + "GPQA": 0.3054, + "MUSR": 0.4268, + "MMLU-PRO": 0.3852 + } + }, + { + "model_id": "DeepMount00/Llama-3.1-8b-ITA", + "name": "Llama-3.1-8b-ITA", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.7917, + "BBH": 0.5109, + "MATH Level 5": 0.1088, + "GPQA": 0.2878, + "MUSR": 0.4136, + "MMLU-PRO": 0.3876 + } + }, + { + "model_id": "DeepMount00/Llama-3.1-8b-Ita", + "name": "Llama-3.1-8b-Ita", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.5365, + "BBH": 0.517, + "MATH Level 5": 0.1707, + "GPQA": 0.3062, + "MUSR": 0.4487, + "MMLU-PRO": 0.396 + } + }, + { + "model_id": "DeepMount00/Llama-3.1-Distilled", + "name": "Llama-3.1-Distilled", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.7844, + "BBH": 0.5101, + "MATH Level 5": 0.2032, + "GPQA": 0.3037, + "MUSR": 0.4058, + "MMLU-PRO": 0.3782 + } + }, + { + "model_id": "DeepMount00/Qwen2-1.5B-Ita", + "name": "Qwen2-1.5B-Ita", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.5173, + "BBH": 0.3981, + "MATH Level 5": 0.114, + "GPQA": 0.2626, + "MUSR": 0.3504, + "MMLU-PRO": 0.2772 + } + }, + { + "model_id": "DeepMount00/Qwen2-1.5B-Ita_v2", + "name": "Qwen2-1.5B-Ita_v2", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.5, + "BBH": 0.3954, + "MATH Level 5": 0.0967, + "GPQA": 0.2592, + "MUSR": 0.3702, + "MMLU-PRO": 0.3032 + } + }, + { + "model_id": "DeepMount00/Qwen2-1.5B-Ita_v3", + "name": "Qwen2-1.5B-Ita_v3", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.489, + "BBH": 0.3948, + "MATH Level 5": 0.1042, + "GPQA": 0.2534, + "MUSR": 0.3742, + "MMLU-PRO": 0.3018 + } + }, + { + "model_id": "DeepMount00/Qwen2-1.5B-Ita_v5", + "name": "Qwen2-1.5B-Ita_v5", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.4987, + "BBH": 0.4032, + "MATH Level 5": 0.1178, + "GPQA": 0.2542, + "MUSR": 0.3422, + "MMLU-PRO": 0.2943 + } + }, + { + "model_id": "DeepMount00/Qwen2-1.5B-Ita_v6", + "name": "Qwen2-1.5B-Ita_v6", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.2999, + "BBH": 0.4249, + "MATH Level 5": 0.0846, + "GPQA": 0.2827, + "MUSR": 0.3755, + "MMLU-PRO": 0.2872 + } + }, + { + "model_id": "DeepMount00/Qwen2.5-7B-Instruct-MathCoder", + "name": "Qwen2.5-7B-Instruct-MathCoder", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.153, + "BBH": 0.2998, + "MATH Level 5": 0.0008, + "GPQA": 0.2626, + "MUSR": 0.3806, + "MMLU-PRO": 0.1118 + } + }, + { + "model_id": "DeepMount00/mergekit-ties-okvgjfz", + "name": "mergekit-ties-okvgjfz", + "developer": "DeepMount00", + "scores": { + "IFEval": 0.153, + "BBH": 0.2998, + "MATH Level 5": 0.0008, + "GPQA": 0.2626, + "MUSR": 0.3806, + "MMLU-PRO": 0.1118 + } + }, + { + "model_id": "Delta-Vector/Baldur-8B", + "name": "Baldur-8B", + "developer": "Delta-Vector", + "scores": { + "IFEval": 0.4782, + "BBH": 0.5306, + "MATH Level 5": 0.1435, + "GPQA": 0.302, + "MUSR": 0.4372, + "MMLU-PRO": 0.3654 + } + }, + { + "model_id": "Delta-Vector/Control-8B", + "name": "Control-8B", + "developer": "Delta-Vector", + "scores": { + "IFEval": 0.549, + "BBH": 0.5041, + "MATH Level 5": 0.139, + "GPQA": 0.3163, + "MUSR": 0.4355, + "MMLU-PRO": 0.3732 + } + }, + { + "model_id": "Delta-Vector/Control-8B-V1.1", + "name": "Control-8B-V1.1", + "developer": "Delta-Vector", + "scores": { + "IFEval": 0.5697, + "BBH": 0.4993, + "MATH Level 5": 0.1276, + "GPQA": 0.307, + "MUSR": 0.4237, + "MMLU-PRO": 0.3745 + } + }, + { + "model_id": "Delta-Vector/Darkens-8B", + "name": "Darkens-8B", + "developer": "Delta-Vector", + "scores": { + "IFEval": 0.2548, + "BBH": 0.5251, + "MATH Level 5": 0.0589, + "GPQA": 0.3247, + "MUSR": 0.4106, + "MMLU-PRO": 0.3736 + } + }, + { + "model_id": "Delta-Vector/Henbane-7b-attempt2", + "name": "Henbane-7b-attempt2", + "developer": "Delta-Vector", + "scores": { + "IFEval": 0.4157, + "BBH": 0.5061, + "MATH Level 5": 0.2273, + "GPQA": 0.2903, + "MUSR": 0.3973, + "MMLU-PRO": 0.4028 + } + }, + { + "model_id": "Delta-Vector/Odin-9B", + "name": "Odin-9B", + "developer": "Delta-Vector", + "scores": { + "IFEval": 0.3692, + "BBH": 0.544, + "MATH Level 5": 0.145, + "GPQA": 0.3414, + "MUSR": 0.4648, + "MMLU-PRO": 0.4047 + } + }, + { + "model_id": "Delta-Vector/Tor-8B", + "name": "Tor-8B", + "developer": "Delta-Vector", + "scores": { + "IFEval": 0.2382, + "BBH": 0.5209, + "MATH Level 5": 0.0589, + "GPQA": 0.3238, + "MUSR": 0.4092, + "MMLU-PRO": 0.373 + } + }, + { + "model_id": "DevQuasar/DevQuasar-R1-Uncensored-Llama-8B", + "name": "DevQuasar-R1-Uncensored-Llama-8B", + "developer": "DevQuasar", + "scores": { + "IFEval": 0.3849, + "BBH": 0.5118, + "MATH Level 5": 0.3308, + "GPQA": 0.3473, + "MUSR": 0.4436, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "Dongwei/DeepSeek-R1-Distill-Qwen-7B-GRPO", + "name": "DeepSeek-R1-Distill-Qwen-7B-GRPO", + "developer": "Dongwei", + "scores": { + "IFEval": 0.4038, + "BBH": 0.3443, + "MATH Level 5": 0.1956, + "GPQA": 0.2794, + "MUSR": 0.3663, + "MMLU-PRO": 0.2322 + } + }, + { + "model_id": "DoppelReflEx/L3-8B-R1-WolfCore", + "name": "L3-8B-R1-WolfCore", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3775, + "BBH": 0.5318, + "MATH Level 5": 0.1631, + "GPQA": 0.3289, + "MUSR": 0.4277, + "MMLU-PRO": 0.3717 + } + }, + { + "model_id": "DoppelReflEx/L3-8B-R1-WolfCore-V1.5-test", + "name": "L3-8B-R1-WolfCore-V1.5-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3955, + "BBH": 0.5315, + "MATH Level 5": 0.1231, + "GPQA": 0.3263, + "MUSR": 0.3841, + "MMLU-PRO": 0.3728 + } + }, + { + "model_id": "DoppelReflEx/L3-8B-WolfCore", + "name": "L3-8B-WolfCore", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4022, + "BBH": 0.5182, + "MATH Level 5": 0.0982, + "GPQA": 0.3096, + "MUSR": 0.3973, + "MMLU-PRO": 0.3705 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-FoxFrame-test", + "name": "MN-12B-FoxFrame-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4222, + "BBH": 0.5456, + "MATH Level 5": 0.1397, + "GPQA": 0.3079, + "MUSR": 0.4254, + "MMLU-PRO": 0.3503 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-FoxFrame2-test", + "name": "MN-12B-FoxFrame2-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4319, + "BBH": 0.5485, + "MATH Level 5": 0.1405, + "GPQA": 0.3146, + "MUSR": 0.4252, + "MMLU-PRO": 0.3569 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-FoxFrame3-test", + "name": "MN-12B-FoxFrame3-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4323, + "BBH": 0.5395, + "MATH Level 5": 0.1322, + "GPQA": 0.3012, + "MUSR": 0.4598, + "MMLU-PRO": 0.3529 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Kakigori", + "name": "MN-12B-Kakigori", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3593, + "BBH": 0.5416, + "MATH Level 5": 0.1193, + "GPQA": 0.3247, + "MUSR": 0.4052, + "MMLU-PRO": 0.3581 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-LilithFrame", + "name": "MN-12B-LilithFrame", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.436, + "BBH": 0.4956, + "MATH Level 5": 0.0589, + "GPQA": 0.3205, + "MUSR": 0.3843, + "MMLU-PRO": 0.3237 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-LilithFrame-Experiment-2", + "name": "MN-12B-LilithFrame-Experiment-2", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4299, + "BBH": 0.4983, + "MATH Level 5": 0.1073, + "GPQA": 0.3255, + "MUSR": 0.3804, + "MMLU-PRO": 0.3276 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-LilithFrame-Experiment-3", + "name": "MN-12B-LilithFrame-Experiment-3", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4128, + "BBH": 0.5468, + "MATH Level 5": 0.1344, + "GPQA": 0.328, + "MUSR": 0.4039, + "MMLU-PRO": 0.3604 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-LilithFrame-Experiment-4", + "name": "MN-12B-LilithFrame-Experiment-4", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3981, + "BBH": 0.5534, + "MATH Level 5": 0.1224, + "GPQA": 0.3171, + "MUSR": 0.4371, + "MMLU-PRO": 0.3649 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-GreenSnake", + "name": "MN-12B-Mimicore-GreenSnake", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.478, + "BBH": 0.5481, + "MATH Level 5": 0.139, + "GPQA": 0.3247, + "MUSR": 0.4306, + "MMLU-PRO": 0.3651 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-Nocturne", + "name": "MN-12B-Mimicore-Nocturne", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3957, + "BBH": 0.5703, + "MATH Level 5": 0.1057, + "GPQA": 0.3196, + "MUSR": 0.4569, + "MMLU-PRO": 0.3634 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-Orochi", + "name": "MN-12B-Mimicore-Orochi", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.462, + "BBH": 0.5498, + "MATH Level 5": 0.136, + "GPQA": 0.3129, + "MUSR": 0.4546, + "MMLU-PRO": 0.3447 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-Orochi-v2-Experiment", + "name": "MN-12B-Mimicore-Orochi-v2-Experiment", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.2842, + "BBH": 0.5323, + "MATH Level 5": 0.0612, + "GPQA": 0.2978, + "MUSR": 0.4574, + "MMLU-PRO": 0.3423 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-Orochi-v3-Experiment", + "name": "MN-12B-Mimicore-Orochi-v3-Experiment", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4102, + "BBH": 0.5438, + "MATH Level 5": 0.1216, + "GPQA": 0.2928, + "MUSR": 0.4438, + "MMLU-PRO": 0.3396 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-Orochi-v4-Experiment", + "name": "MN-12B-Mimicore-Orochi-v4-Experiment", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4321, + "BBH": 0.5463, + "MATH Level 5": 0.1208, + "GPQA": 0.3054, + "MUSR": 0.4449, + "MMLU-PRO": 0.352 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-WhiteSnake", + "name": "MN-12B-Mimicore-WhiteSnake", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4438, + "BBH": 0.5605, + "MATH Level 5": 0.1314, + "GPQA": 0.318, + "MUSR": 0.4569, + "MMLU-PRO": 0.3658 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-WhiteSnake-v2-Experiment-1", + "name": "MN-12B-Mimicore-WhiteSnake-v2-Experiment-1", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3909, + "BBH": 0.4866, + "MATH Level 5": 0.0785, + "GPQA": 0.3054, + "MUSR": 0.379, + "MMLU-PRO": 0.3114 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-WhiteSnake-v2-Experiment-2", + "name": "MN-12B-Mimicore-WhiteSnake-v2-Experiment-2", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3124, + "BBH": 0.5126, + "MATH Level 5": 0.1125, + "GPQA": 0.2961, + "MUSR": 0.3975, + "MMLU-PRO": 0.3314 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-WhiteSnake-v2-Experiment-3", + "name": "MN-12B-Mimicore-WhiteSnake-v2-Experiment-3", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4302, + "BBH": 0.4812, + "MATH Level 5": 0.0899, + "GPQA": 0.302, + "MUSR": 0.3684, + "MMLU-PRO": 0.3198 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Mimicore-WhiteSnake-v2-Experiment-4", + "name": "MN-12B-Mimicore-WhiteSnake-v2-Experiment-4", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4241, + "BBH": 0.5185, + "MATH Level 5": 0.114, + "GPQA": 0.3104, + "MUSR": 0.4002, + "MMLU-PRO": 0.3342 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-Unleashed-Twilight", + "name": "MN-12B-Unleashed-Twilight", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3505, + "BBH": 0.5521, + "MATH Level 5": 0.0959, + "GPQA": 0.3289, + "MUSR": 0.4384, + "MMLU-PRO": 0.3678 + } + }, + { + "model_id": "DoppelReflEx/MN-12B-WolFrame", + "name": "MN-12B-WolFrame", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4397, + "BBH": 0.5117, + "MATH Level 5": 0.1314, + "GPQA": 0.3104, + "MUSR": 0.4015, + "MMLU-PRO": 0.3393 + } + }, + { + "model_id": "DoppelReflEx/MiniusLight-24B", + "name": "MiniusLight-24B", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.2577, + "BBH": 0.6256, + "MATH Level 5": 0.1261, + "GPQA": 0.3582, + "MUSR": 0.4319, + "MMLU-PRO": 0.5091 + } + }, + { + "model_id": "DoppelReflEx/MiniusLight-24B-test", + "name": "MiniusLight-24B-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.0394, + "BBH": 0.6334, + "MATH Level 5": 0.0257, + "GPQA": 0.3683, + "MUSR": 0.4093, + "MMLU-PRO": 0.5182 + } + }, + { + "model_id": "DoppelReflEx/MiniusLight-24B-v1b-test", + "name": "MiniusLight-24B-v1b-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3791, + "BBH": 0.6617, + "MATH Level 5": 0.2394, + "GPQA": 0.3792, + "MUSR": 0.4557, + "MMLU-PRO": 0.5365 + } + }, + { + "model_id": "DoppelReflEx/MiniusLight-24B-v1c-test", + "name": "MiniusLight-24B-v1c-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.3786, + "BBH": 0.6753, + "MATH Level 5": 0.2968, + "GPQA": 0.3951, + "MUSR": 0.4634, + "MMLU-PRO": 0.5487 + } + }, + { + "model_id": "DoppelReflEx/MiniusLight-24B-v1d-test", + "name": "MiniusLight-24B-v1d-test", + "developer": "DoppelReflEx", + "scores": { + "IFEval": 0.4032, + "BBH": 0.6712, + "MATH Level 5": 0.2946, + "GPQA": 0.3951, + "MUSR": 0.4621, + "MMLU-PRO": 0.5489 + } + }, + { + "model_id": "DreadPoor/Again-8B-Model_Stock", + "name": "Again-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6724, + "BBH": 0.531, + "MATH Level 5": 0.1201, + "GPQA": 0.3012, + "MUSR": 0.3987, + "MMLU-PRO": 0.3518 + } + }, + { + "model_id": "DreadPoor/Alita99-8B-LINEAR", + "name": "Alita99-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.719, + "BBH": 0.5442, + "MATH Level 5": 0.1647, + "GPQA": 0.3163, + "MUSR": 0.4266, + "MMLU-PRO": 0.3809 + } + }, + { + "model_id": "DreadPoor/AnotherTest", + "name": "AnotherTest", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4701, + "BBH": 0.4683, + "MATH Level 5": 0.0619, + "GPQA": 0.2978, + "MUSR": 0.4213, + "MMLU-PRO": 0.2875 + } + }, + { + "model_id": "DreadPoor/Aspire-8B-model_stock", + "name": "Aspire-8B-model_stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7141, + "BBH": 0.5278, + "MATH Level 5": 0.1495, + "GPQA": 0.3146, + "MUSR": 0.4212, + "MMLU-PRO": 0.3763 + } + }, + { + "model_id": "DreadPoor/Aspire_1.3-8B_model-stock", + "name": "Aspire_1.3-8B_model-stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7062, + "BBH": 0.5302, + "MATH Level 5": 0.1692, + "GPQA": 0.3079, + "MUSR": 0.4105, + "MMLU-PRO": 0.3716 + } + }, + { + "model_id": "DreadPoor/Aspire_V2-8B-Model_Stock", + "name": "Aspire_V2-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7371, + "BBH": 0.533, + "MATH Level 5": 0.176, + "GPQA": 0.3205, + "MUSR": 0.3894, + "MMLU-PRO": 0.3697 + } + }, + { + "model_id": "DreadPoor/Aspire_V2.1-8B-Model_Stock", + "name": "Aspire_V2.1-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7238, + "BBH": 0.5236, + "MATH Level 5": 0.1767, + "GPQA": 0.3096, + "MUSR": 0.4136, + "MMLU-PRO": 0.3801 + } + }, + { + "model_id": "DreadPoor/Aspire_V2_ALT-8B-Model_Stock", + "name": "Aspire_V2_ALT-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7381, + "BBH": 0.5266, + "MATH Level 5": 0.173, + "GPQA": 0.3247, + "MUSR": 0.3975, + "MMLU-PRO": 0.3727 + } + }, + { + "model_id": "DreadPoor/Aspire_V2_ALT_ROW-8B-Model_Stock", + "name": "Aspire_V2_ALT_ROW-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7381, + "BBH": 0.5266, + "MATH Level 5": 0.173, + "GPQA": 0.3247, + "MUSR": 0.3975, + "MMLU-PRO": 0.3727 + } + }, + { + "model_id": "DreadPoor/Aspire_V3-8B-Model_Stock", + "name": "Aspire_V3-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5119, + "BBH": 0.5268, + "MATH Level 5": 0.1858, + "GPQA": 0.3054, + "MUSR": 0.4015, + "MMLU-PRO": 0.3642 + } + }, + { + "model_id": "DreadPoor/Aspire_V4-8B-Model_Stock", + "name": "Aspire_V4-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7694, + "BBH": 0.5314, + "MATH Level 5": 0.1926, + "GPQA": 0.3045, + "MUSR": 0.3867, + "MMLU-PRO": 0.3708 + } + }, + { + "model_id": "DreadPoor/Aspire_V4_ALT-8B-Model_Stock", + "name": "Aspire_V4_ALT-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7366, + "BBH": 0.5268, + "MATH Level 5": 0.1813, + "GPQA": 0.3205, + "MUSR": 0.392, + "MMLU-PRO": 0.3682 + } + }, + { + "model_id": "DreadPoor/Asymmetric_Linearity-8B-Model_Stock", + "name": "Asymmetric_Linearity-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7174, + "BBH": 0.5465, + "MATH Level 5": 0.1647, + "GPQA": 0.3146, + "MUSR": 0.4199, + "MMLU-PRO": 0.3844 + } + }, + { + "model_id": "DreadPoor/Aurora_faustus-8B-LINEAR", + "name": "Aurora_faustus-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7281, + "BBH": 0.5516, + "MATH Level 5": 0.1707, + "GPQA": 0.307, + "MUSR": 0.4146, + "MMLU-PRO": 0.3842 + } + }, + { + "model_id": "DreadPoor/Aurora_faustus-8B-LORABLATED", + "name": "Aurora_faustus-8B-LORABLATED", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7527, + "BBH": 0.5392, + "MATH Level 5": 0.1488, + "GPQA": 0.302, + "MUSR": 0.4239, + "MMLU-PRO": 0.3673 + } + }, + { + "model_id": "DreadPoor/Aurora_faustus-8B-LORABLATED_ALT", + "name": "Aurora_faustus-8B-LORABLATED_ALT", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7378, + "BBH": 0.5388, + "MATH Level 5": 0.1586, + "GPQA": 0.2987, + "MUSR": 0.4225, + "MMLU-PRO": 0.3694 + } + }, + { + "model_id": "DreadPoor/Autumn_Dawn-8B-LINEAR", + "name": "Autumn_Dawn-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7293, + "BBH": 0.5459, + "MATH Level 5": 0.1858, + "GPQA": 0.2936, + "MUSR": 0.4186, + "MMLU-PRO": 0.3968 + } + }, + { + "model_id": "DreadPoor/BaeZel-8B-LINEAR", + "name": "BaeZel-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7378, + "BBH": 0.5464, + "MATH Level 5": 0.1813, + "GPQA": 0.3213, + "MUSR": 0.4227, + "MMLU-PRO": 0.3861 + } + }, + { + "model_id": "DreadPoor/BaeZel-8B-Model_Stock", + "name": "BaeZel-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7713, + "BBH": 0.5408, + "MATH Level 5": 0.1639, + "GPQA": 0.3138, + "MUSR": 0.4199, + "MMLU-PRO": 0.388 + } + }, + { + "model_id": "DreadPoor/BaeZel_V2-8B-Model_Stock", + "name": "BaeZel_V2-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7677, + "BBH": 0.5374, + "MATH Level 5": 0.1798, + "GPQA": 0.2995, + "MUSR": 0.4186, + "MMLU-PRO": 0.3947 + } + }, + { + "model_id": "DreadPoor/BaeZel_V2_ALT-8B-Model_Stock", + "name": "BaeZel_V2_ALT-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7677, + "BBH": 0.5374, + "MATH Level 5": 0.1798, + "GPQA": 0.2995, + "MUSR": 0.4186, + "MMLU-PRO": 0.3947 + } + }, + { + "model_id": "DreadPoor/BaeZel_V3-8B-Model_Stock", + "name": "BaeZel_V3-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7832, + "BBH": 0.5392, + "MATH Level 5": 0.1896, + "GPQA": 0.3205, + "MUSR": 0.4174, + "MMLU-PRO": 0.3888 + } + }, + { + "model_id": "DreadPoor/Blunt_Edge-8B-SLERP", + "name": "Blunt_Edge-8B-SLERP", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7497, + "BBH": 0.5389, + "MATH Level 5": 0.1858, + "GPQA": 0.3112, + "MUSR": 0.4174, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "DreadPoor/BulkUp", + "name": "BulkUp", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.1778, + "BBH": 0.287, + "MATH Level 5": 0.0, + "GPQA": 0.2475, + "MUSR": 0.3447, + "MMLU-PRO": 0.111 + } + }, + { + "model_id": "DreadPoor/Cadence-8B-LINEAR", + "name": "Cadence-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7682, + "BBH": 0.5433, + "MATH Level 5": 0.1677, + "GPQA": 0.3029, + "MUSR": 0.4173, + "MMLU-PRO": 0.3803 + } + }, + { + "model_id": "DreadPoor/Caelid-8B-Model_Stock", + "name": "Caelid-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7247, + "BBH": 0.546, + "MATH Level 5": 0.1511, + "GPQA": 0.3104, + "MUSR": 0.4001, + "MMLU-PRO": 0.3816 + } + }, + { + "model_id": "DreadPoor/Casuar-9B-Model_Stock", + "name": "Casuar-9B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7765, + "BBH": 0.6107, + "MATH Level 5": 0.213, + "GPQA": 0.3448, + "MUSR": 0.4165, + "MMLU-PRO": 0.4156 + } + }, + { + "model_id": "DreadPoor/Condensed_Milk-8B-Model_Stock", + "name": "Condensed_Milk-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7536, + "BBH": 0.5435, + "MATH Level 5": 0.1745, + "GPQA": 0.3213, + "MUSR": 0.416, + "MMLU-PRO": 0.3876 + } + }, + { + "model_id": "DreadPoor/CoolerCoder-8B-LINEAR", + "name": "CoolerCoder-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4519, + "BBH": 0.4762, + "MATH Level 5": 0.0793, + "GPQA": 0.2903, + "MUSR": 0.3964, + "MMLU-PRO": 0.3159 + } + }, + { + "model_id": "DreadPoor/Damasteel-8B-LINEAR", + "name": "Damasteel-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7384, + "BBH": 0.5388, + "MATH Level 5": 0.1669, + "GPQA": 0.2987, + "MUSR": 0.4212, + "MMLU-PRO": 0.3779 + } + }, + { + "model_id": "DreadPoor/Dearly_Beloved-8B-TIES", + "name": "Dearly_Beloved-8B-TIES", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.8267, + "BBH": 0.405, + "MATH Level 5": 0.2115, + "GPQA": 0.2987, + "MUSR": 0.4175, + "MMLU-PRO": 0.2827 + } + }, + { + "model_id": "DreadPoor/Decayed-8B-LINEAR", + "name": "Decayed-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7676, + "BBH": 0.5417, + "MATH Level 5": 0.1715, + "GPQA": 0.3096, + "MUSR": 0.4186, + "MMLU-PRO": 0.3763 + } + }, + { + "model_id": "DreadPoor/Derivative-8B-Model_Stock", + "name": "Derivative-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7667, + "BBH": 0.5395, + "MATH Level 5": 0.179, + "GPQA": 0.3171, + "MUSR": 0.42, + "MMLU-PRO": 0.3811 + } + }, + { + "model_id": "DreadPoor/Derivative_V2-8B-Model_Stock", + "name": "Derivative_V2-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7537, + "BBH": 0.5393, + "MATH Level 5": 0.1798, + "GPQA": 0.307, + "MUSR": 0.4123, + "MMLU-PRO": 0.3856 + } + }, + { + "model_id": "DreadPoor/Derivative_V2_ALT-8B-Model_Stock", + "name": "Derivative_V2_ALT-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.772, + "BBH": 0.5365, + "MATH Level 5": 0.1881, + "GPQA": 0.3112, + "MUSR": 0.4135, + "MMLU-PRO": 0.3882 + } + }, + { + "model_id": "DreadPoor/Derivative_V3-8B-Model_Stock", + "name": "Derivative_V3-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6964, + "BBH": 0.5243, + "MATH Level 5": 0.1465, + "GPQA": 0.2945, + "MUSR": 0.415, + "MMLU-PRO": 0.3502 + } + }, + { + "model_id": "DreadPoor/Elusive_Dragon_Heart-8B-LINEAR", + "name": "Elusive_Dragon_Heart-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7131, + "BBH": 0.5456, + "MATH Level 5": 0.148, + "GPQA": 0.3062, + "MUSR": 0.4146, + "MMLU-PRO": 0.3814 + } + }, + { + "model_id": "DreadPoor/Emu_Eggs-9B-Model_Stock", + "name": "Emu_Eggs-9B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7607, + "BBH": 0.6052, + "MATH Level 5": 0.21, + "GPQA": 0.3331, + "MUSR": 0.4071, + "MMLU-PRO": 0.4227 + } + }, + { + "model_id": "DreadPoor/Eunoia_Vespera-8B-LINEAR", + "name": "Eunoia_Vespera-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7235, + "BBH": 0.5399, + "MATH Level 5": 0.1541, + "GPQA": 0.307, + "MUSR": 0.4185, + "MMLU-PRO": 0.3839 + } + }, + { + "model_id": "DreadPoor/Fu_sion_HA-8B-SLERP", + "name": "Fu_sion_HA-8B-SLERP", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7609, + "BBH": 0.5373, + "MATH Level 5": 0.1752, + "GPQA": 0.323, + "MUSR": 0.416, + "MMLU-PRO": 0.3825 + } + }, + { + "model_id": "DreadPoor/HOT_STINKING_GARBAGE", + "name": "HOT_STINKING_GARBAGE", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5754, + "BBH": 0.4884, + "MATH Level 5": 0.0672, + "GPQA": 0.2752, + "MUSR": 0.425, + "MMLU-PRO": 0.3017 + } + }, + { + "model_id": "DreadPoor/H_the_eighth-8B-LINEAR", + "name": "H_the_eighth-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7469, + "BBH": 0.5384, + "MATH Level 5": 0.1775, + "GPQA": 0.328, + "MUSR": 0.4173, + "MMLU-PRO": 0.3824 + } + }, + { + "model_id": "DreadPoor/Happy_New_Year-8B-Model_Stock", + "name": "Happy_New_Year-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7616, + "BBH": 0.5368, + "MATH Level 5": 0.1594, + "GPQA": 0.3138, + "MUSR": 0.4186, + "MMLU-PRO": 0.3879 + } + }, + { + "model_id": "DreadPoor/Heart_Stolen-8B-Model_Stock", + "name": "Heart_Stolen-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7245, + "BBH": 0.5395, + "MATH Level 5": 0.1722, + "GPQA": 0.3171, + "MUSR": 0.4162, + "MMLU-PRO": 0.3794 + } + }, + { + "model_id": "DreadPoor/Heart_Stolen-ALT-8B-Model_Stock", + "name": "Heart_Stolen-ALT-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7184, + "BBH": 0.5263, + "MATH Level 5": 0.1563, + "GPQA": 0.3012, + "MUSR": 0.4055, + "MMLU-PRO": 0.3772 + } + }, + { + "model_id": "DreadPoor/Here_We_Go_Again-8B-SLERP", + "name": "Here_We_Go_Again-8B-SLERP", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7442, + "BBH": 0.546, + "MATH Level 5": 0.173, + "GPQA": 0.3188, + "MUSR": 0.4187, + "MMLU-PRO": 0.3873 + } + }, + { + "model_id": "DreadPoor/Howdy-8B-LINEAR", + "name": "Howdy-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7378, + "BBH": 0.5384, + "MATH Level 5": 0.1775, + "GPQA": 0.3146, + "MUSR": 0.4121, + "MMLU-PRO": 0.3807 + } + }, + { + "model_id": "DreadPoor/Incidental-8B-Model_Stock", + "name": "Incidental-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7482, + "BBH": 0.5452, + "MATH Level 5": 0.1616, + "GPQA": 0.3029, + "MUSR": 0.424, + "MMLU-PRO": 0.3873 + } + }, + { + "model_id": "DreadPoor/Irina-8B-model_stock", + "name": "Irina-8B-model_stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6799, + "BBH": 0.5237, + "MATH Level 5": 0.102, + "GPQA": 0.2844, + "MUSR": 0.4003, + "MMLU-PRO": 0.3574 + } + }, + { + "model_id": "DreadPoor/Kindling-8B-Model_Stock", + "name": "Kindling-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7308, + "BBH": 0.5492, + "MATH Level 5": 0.1752, + "GPQA": 0.318, + "MUSR": 0.4068, + "MMLU-PRO": 0.383 + } + }, + { + "model_id": "DreadPoor/L3.1-BaeZel-8B-Della", + "name": "L3.1-BaeZel-8B-Della", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.518, + "BBH": 0.5448, + "MATH Level 5": 0.1745, + "GPQA": 0.3196, + "MUSR": 0.42, + "MMLU-PRO": 0.3902 + } + }, + { + "model_id": "DreadPoor/Laughing_Stock-8B-Model_Stock", + "name": "Laughing_Stock-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.719, + "BBH": 0.5449, + "MATH Level 5": 0.1579, + "GPQA": 0.2894, + "MUSR": 0.4146, + "MMLU-PRO": 0.3764 + } + }, + { + "model_id": "DreadPoor/Lava_Lamp-8B-SLERP", + "name": "Lava_Lamp-8B-SLERP", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7381, + "BBH": 0.5368, + "MATH Level 5": 0.1737, + "GPQA": 0.3054, + "MUSR": 0.4187, + "MMLU-PRO": 0.375 + } + }, + { + "model_id": "DreadPoor/LemonP-8B-Model_Stock", + "name": "LemonP-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7676, + "BBH": 0.5439, + "MATH Level 5": 0.1767, + "GPQA": 0.3029, + "MUSR": 0.4081, + "MMLU-PRO": 0.4004 + } + }, + { + "model_id": "DreadPoor/Lydia_of_Whiterun-8B-LINEAR", + "name": "Lydia_of_Whiterun-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7603, + "BBH": 0.538, + "MATH Level 5": 0.1767, + "GPQA": 0.3163, + "MUSR": 0.4251, + "MMLU-PRO": 0.3801 + } + }, + { + "model_id": "DreadPoor/Matryoshka-8B-LINEAR", + "name": "Matryoshka-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7263, + "BBH": 0.5444, + "MATH Level 5": 0.1752, + "GPQA": 0.3205, + "MUSR": 0.4252, + "MMLU-PRO": 0.3866 + } + }, + { + "model_id": "DreadPoor/Mercury_In_Retrograde-8b-Model-Stock", + "name": "Mercury_In_Retrograde-8b-Model-Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7296, + "BBH": 0.5391, + "MATH Level 5": 0.1647, + "GPQA": 0.3163, + "MUSR": 0.4199, + "MMLU-PRO": 0.3829 + } + }, + { + "model_id": "DreadPoor/Minthy-8B-Model_Stock", + "name": "Minthy-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7658, + "BBH": 0.5353, + "MATH Level 5": 0.1918, + "GPQA": 0.3037, + "MUSR": 0.4094, + "MMLU-PRO": 0.3993 + } + }, + { + "model_id": "DreadPoor/Minthy_ALT-8B-Model_Stock", + "name": "Minthy_ALT-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6992, + "BBH": 0.5375, + "MATH Level 5": 0.176, + "GPQA": 0.3062, + "MUSR": 0.4225, + "MMLU-PRO": 0.3674 + } + }, + { + "model_id": "DreadPoor/Minthy_V2-8B-Model_Stock", + "name": "Minthy_V2-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7126, + "BBH": 0.5491, + "MATH Level 5": 0.1594, + "GPQA": 0.2945, + "MUSR": 0.4199, + "MMLU-PRO": 0.3737 + } + }, + { + "model_id": "DreadPoor/Minus_Penus-8B-Model_Stock", + "name": "Minus_Penus-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7311, + "BBH": 0.5344, + "MATH Level 5": 0.2002, + "GPQA": 0.3096, + "MUSR": 0.4019, + "MMLU-PRO": 0.3752 + } + }, + { + "model_id": "DreadPoor/Morphing-8B-Model_Stock", + "name": "Morphing-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7445, + "BBH": 0.5397, + "MATH Level 5": 0.1888, + "GPQA": 0.2936, + "MUSR": 0.4069, + "MMLU-PRO": 0.3852 + } + }, + { + "model_id": "DreadPoor/Not_Even_My_Final_Form-8B-Model_Stock", + "name": "Not_Even_My_Final_Form-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7722, + "BBH": 0.5351, + "MATH Level 5": 0.176, + "GPQA": 0.2953, + "MUSR": 0.4147, + "MMLU-PRO": 0.384 + } + }, + { + "model_id": "DreadPoor/Nother_One-8B-Model_Stock", + "name": "Nother_One-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6863, + "BBH": 0.5205, + "MATH Level 5": 0.1518, + "GPQA": 0.2894, + "MUSR": 0.387, + "MMLU-PRO": 0.3595 + } + }, + { + "model_id": "DreadPoor/Noxis-8B-LINEAR", + "name": "Noxis-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6913, + "BBH": 0.5421, + "MATH Level 5": 0.1979, + "GPQA": 0.3188, + "MUSR": 0.4231, + "MMLU-PRO": 0.366 + } + }, + { + "model_id": "DreadPoor/Nullsworn-12B-LINEAR", + "name": "Nullsworn-12B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4436, + "BBH": 0.5483, + "MATH Level 5": 0.1125, + "GPQA": 0.3079, + "MUSR": 0.435, + "MMLU-PRO": 0.3645 + } + }, + { + "model_id": "DreadPoor/Nwah-8B-Model_Stock", + "name": "Nwah-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7716, + "BBH": 0.5384, + "MATH Level 5": 0.1798, + "GPQA": 0.3104, + "MUSR": 0.4039, + "MMLU-PRO": 0.3807 + } + }, + { + "model_id": "DreadPoor/ONeil-model_stock-8B", + "name": "ONeil-model_stock-8B", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6786, + "BBH": 0.5548, + "MATH Level 5": 0.1012, + "GPQA": 0.3054, + "MUSR": 0.4173, + "MMLU-PRO": 0.3599 + } + }, + { + "model_id": "DreadPoor/Oh_Boy-8B-LINEAR", + "name": "Oh_Boy-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7503, + "BBH": 0.5375, + "MATH Level 5": 0.1782, + "GPQA": 0.3079, + "MUSR": 0.4108, + "MMLU-PRO": 0.3849 + } + }, + { + "model_id": "DreadPoor/OrangeJ-8B-Model_Stock", + "name": "OrangeJ-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7841, + "BBH": 0.5413, + "MATH Level 5": 0.176, + "GPQA": 0.3012, + "MUSR": 0.4028, + "MMLU-PRO": 0.3969 + } + }, + { + "model_id": "DreadPoor/Promissum_Mane-8B-LINEAR", + "name": "Promissum_Mane-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.715, + "BBH": 0.5458, + "MATH Level 5": 0.1556, + "GPQA": 0.3045, + "MUSR": 0.42, + "MMLU-PRO": 0.3851 + } + }, + { + "model_id": "DreadPoor/Promissum_Mane-8B-LINEAR-lorablated", + "name": "Promissum_Mane-8B-LINEAR-lorablated", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7156, + "BBH": 0.5435, + "MATH Level 5": 0.1533, + "GPQA": 0.3037, + "MUSR": 0.4198, + "MMLU-PRO": 0.3739 + } + }, + { + "model_id": "DreadPoor/RPMash-8B-Model_Stock", + "name": "RPMash-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4564, + "BBH": 0.5169, + "MATH Level 5": 0.108, + "GPQA": 0.2869, + "MUSR": 0.4054, + "MMLU-PRO": 0.3604 + } + }, + { + "model_id": "DreadPoor/RPMash_V3-8B-Model_Stock", + "name": "RPMash_V3-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7049, + "BBH": 0.5217, + "MATH Level 5": 0.1042, + "GPQA": 0.3003, + "MUSR": 0.3778, + "MMLU-PRO": 0.3614 + } + }, + { + "model_id": "DreadPoor/Rusted_Gold-8B-LINEAR", + "name": "Rusted_Gold-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7296, + "BBH": 0.5387, + "MATH Level 5": 0.1934, + "GPQA": 0.2987, + "MUSR": 0.4178, + "MMLU-PRO": 0.378 + } + }, + { + "model_id": "DreadPoor/Rusted_Platinum-8B-LINEAR", + "name": "Rusted_Platinum-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.718, + "BBH": 0.5428, + "MATH Level 5": 0.1722, + "GPQA": 0.2802, + "MUSR": 0.3967, + "MMLU-PRO": 0.373 + } + }, + { + "model_id": "DreadPoor/Rusted_Platinum-8B-Model_Stock", + "name": "Rusted_Platinum-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4408, + "BBH": 0.5243, + "MATH Level 5": 0.102, + "GPQA": 0.2685, + "MUSR": 0.3741, + "MMLU-PRO": 0.3546 + } + }, + { + "model_id": "DreadPoor/Sellen-8B-model_stock", + "name": "Sellen-8B-model_stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7113, + "BBH": 0.5232, + "MATH Level 5": 0.1337, + "GPQA": 0.2743, + "MUSR": 0.396, + "MMLU-PRO": 0.357 + } + }, + { + "model_id": "DreadPoor/Something-8B-Model_Stock", + "name": "Something-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5043, + "BBH": 0.5395, + "MATH Level 5": 0.1798, + "GPQA": 0.3171, + "MUSR": 0.4187, + "MMLU-PRO": 0.3885 + } + }, + { + "model_id": "DreadPoor/Spring_Dusk-8B-SCE", + "name": "Spring_Dusk-8B-SCE", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6515, + "BBH": 0.5635, + "MATH Level 5": 0.0763, + "GPQA": 0.2878, + "MUSR": 0.46, + "MMLU-PRO": 0.3436 + } + }, + { + "model_id": "DreadPoor/Summer_Dawn-8B-SCE", + "name": "Summer_Dawn-8B-SCE", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6642, + "BBH": 0.5391, + "MATH Level 5": 0.1722, + "GPQA": 0.3003, + "MUSR": 0.412, + "MMLU-PRO": 0.3753 + } + }, + { + "model_id": "DreadPoor/Summer_Dusk-8B-TIES", + "name": "Summer_Dusk-8B-TIES", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4922, + "BBH": 0.536, + "MATH Level 5": 0.1805, + "GPQA": 0.307, + "MUSR": 0.4267, + "MMLU-PRO": 0.3856 + } + }, + { + "model_id": "DreadPoor/Summer_Rain-8B-SCE", + "name": "Summer_Rain-8B-SCE", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5459, + "BBH": 0.5846, + "MATH Level 5": 0.0702, + "GPQA": 0.3037, + "MUSR": 0.4477, + "MMLU-PRO": 0.3551 + } + }, + { + "model_id": "DreadPoor/Summer_Rain-8B-TIES", + "name": "Summer_Rain-8B-TIES", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5444, + "BBH": 0.5846, + "MATH Level 5": 0.0702, + "GPQA": 0.3037, + "MUSR": 0.4477, + "MMLU-PRO": 0.3551 + } + }, + { + "model_id": "DreadPoor/Sun-8B-Model_Stock", + "name": "Sun-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7758, + "BBH": 0.5264, + "MATH Level 5": 0.21, + "GPQA": 0.2995, + "MUSR": 0.4098, + "MMLU-PRO": 0.3835 + } + }, + { + "model_id": "DreadPoor/Sweetened_Condensed_Milk-8B-Model_Stock", + "name": "Sweetened_Condensed_Milk-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7417, + "BBH": 0.5406, + "MATH Level 5": 0.1873, + "GPQA": 0.3029, + "MUSR": 0.4107, + "MMLU-PRO": 0.3848 + } + }, + { + "model_id": "DreadPoor/TEST02-Ignore", + "name": "TEST02-Ignore", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6119, + "BBH": 0.5602, + "MATH Level 5": 0.0869, + "GPQA": 0.2844, + "MUSR": 0.4199, + "MMLU-PRO": 0.3468 + } + }, + { + "model_id": "DreadPoor/TEST03-ignore", + "name": "TEST03-ignore", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6967, + "BBH": 0.5383, + "MATH Level 5": 0.1654, + "GPQA": 0.3087, + "MUSR": 0.4186, + "MMLU-PRO": 0.3789 + } + }, + { + "model_id": "DreadPoor/TEST06-ignore", + "name": "TEST06-ignore", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7323, + "BBH": 0.5509, + "MATH Level 5": 0.1178, + "GPQA": 0.2869, + "MUSR": 0.4225, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "DreadPoor/TEST07-ignore", + "name": "TEST07-ignore", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.74, + "BBH": 0.5561, + "MATH Level 5": 0.1662, + "GPQA": 0.3087, + "MUSR": 0.4094, + "MMLU-PRO": 0.388 + } + }, + { + "model_id": "DreadPoor/TEST08-ignore", + "name": "TEST08-ignore", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7467, + "BBH": 0.5454, + "MATH Level 5": 0.182, + "GPQA": 0.3129, + "MUSR": 0.4081, + "MMLU-PRO": 0.3853 + } + }, + { + "model_id": "DreadPoor/Trinas_Nectar-8B-model_stock", + "name": "Trinas_Nectar-8B-model_stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7259, + "BBH": 0.5256, + "MATH Level 5": 0.1526, + "GPQA": 0.2861, + "MUSR": 0.4068, + "MMLU-PRO": 0.3618 + } + }, + { + "model_id": "DreadPoor/UNTESTED-VENN_1.2-8B-Model_Stock", + "name": "UNTESTED-VENN_1.2-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4718, + "BBH": 0.5475, + "MATH Level 5": 0.1541, + "GPQA": 0.3154, + "MUSR": 0.4449, + "MMLU-PRO": 0.3787 + } + }, + { + "model_id": "DreadPoor/VENN_1.2-8B-Model_Stock", + "name": "VENN_1.2-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7226, + "BBH": 0.5459, + "MATH Level 5": 0.1707, + "GPQA": 0.297, + "MUSR": 0.42, + "MMLU-PRO": 0.3721 + } + }, + { + "model_id": "DreadPoor/WIP-Acacia-8B-Model_Stock", + "name": "WIP-Acacia-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.6246, + "BBH": 0.5195, + "MATH Level 5": 0.1669, + "GPQA": 0.3062, + "MUSR": 0.4226, + "MMLU-PRO": 0.3737 + } + }, + { + "model_id": "DreadPoor/WIP_Damascus-8B-TIES", + "name": "WIP_Damascus-8B-TIES", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4776, + "BBH": 0.5411, + "MATH Level 5": 0.1654, + "GPQA": 0.307, + "MUSR": 0.4119, + "MMLU-PRO": 0.3761 + } + }, + { + "model_id": "DreadPoor/Wannabe-8B-Model_Stock", + "name": "Wannabe-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7205, + "BBH": 0.539, + "MATH Level 5": 0.1775, + "GPQA": 0.3012, + "MUSR": 0.4135, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "DreadPoor/What_A_Thrill-8B-Model_Stock", + "name": "What_A_Thrill-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7064, + "BBH": 0.5311, + "MATH Level 5": 0.182, + "GPQA": 0.297, + "MUSR": 0.408, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "DreadPoor/Winter-8B-SCE", + "name": "Winter-8B-SCE", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7536, + "BBH": 0.5262, + "MATH Level 5": 0.1918, + "GPQA": 0.2995, + "MUSR": 0.4071, + "MMLU-PRO": 0.3839 + } + }, + { + "model_id": "DreadPoor/Winter_Dawn-8B-TIES", + "name": "Winter_Dawn-8B-TIES", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5496, + "BBH": 0.5309, + "MATH Level 5": 0.1858, + "GPQA": 0.3096, + "MUSR": 0.4279, + "MMLU-PRO": 0.391 + } + }, + { + "model_id": "DreadPoor/Winter_Dusk-8B-TIES", + "name": "Winter_Dusk-8B-TIES", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7153, + "BBH": 0.4952, + "MATH Level 5": 0.0718, + "GPQA": 0.2995, + "MUSR": 0.3688, + "MMLU-PRO": 0.3478 + } + }, + { + "model_id": "DreadPoor/Winter_Night-8B-Model_Stock", + "name": "Winter_Night-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.704, + "BBH": 0.5185, + "MATH Level 5": 0.1458, + "GPQA": 0.3062, + "MUSR": 0.3914, + "MMLU-PRO": 0.3666 + } + }, + { + "model_id": "DreadPoor/Yafune-8B-Model_Stock", + "name": "Yafune-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7533, + "BBH": 0.5467, + "MATH Level 5": 0.1662, + "GPQA": 0.3272, + "MUSR": 0.4173, + "MMLU-PRO": 0.3851 + } + }, + { + "model_id": "DreadPoor/Yearn_V3-8B-Model_Stock", + "name": "Yearn_V3-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.729, + "BBH": 0.5322, + "MATH Level 5": 0.1896, + "GPQA": 0.3054, + "MUSR": 0.3909, + "MMLU-PRO": 0.3802 + } + }, + { + "model_id": "DreadPoor/ZEUS-8B-V17-Abliterated_ALT", + "name": "ZEUS-8B-V17-Abliterated_ALT", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5511, + "BBH": 0.5231, + "MATH Level 5": 0.1903, + "GPQA": 0.3079, + "MUSR": 0.4149, + "MMLU-PRO": 0.389 + } + }, + { + "model_id": "DreadPoor/Zelus-8B-Model_Stock", + "name": "Zelus-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7788, + "BBH": 0.5307, + "MATH Level 5": 0.1647, + "GPQA": 0.3062, + "MUSR": 0.4214, + "MMLU-PRO": 0.3841 + } + }, + { + "model_id": "DreadPoor/Zelus_V2-8B-Model_Stock", + "name": "Zelus_V2-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7898, + "BBH": 0.5345, + "MATH Level 5": 0.2054, + "GPQA": 0.3096, + "MUSR": 0.3961, + "MMLU-PRO": 0.3833 + } + }, + { + "model_id": "DreadPoor/felix_dies-mistral-7B-model_stock", + "name": "felix_dies-mistral-7B-model_stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.3008, + "BBH": 0.4901, + "MATH Level 5": 0.0536, + "GPQA": 0.2919, + "MUSR": 0.4518, + "MMLU-PRO": 0.3109 + } + }, + { + "model_id": "DreadPoor/hakuchido-8B-MODEL_STOCK", + "name": "hakuchido-8B-MODEL_STOCK", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7375, + "BBH": 0.5398, + "MATH Level 5": 0.1949, + "GPQA": 0.2953, + "MUSR": 0.4175, + "MMLU-PRO": 0.3782 + } + }, + { + "model_id": "DreadPoor/ichor-8B-Model_Stock", + "name": "ichor-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.5386, + "BBH": 0.5084, + "MATH Level 5": 0.1088, + "GPQA": 0.3238, + "MUSR": 0.4212, + "MMLU-PRO": 0.3151 + } + }, + { + "model_id": "DreadPoor/ichor_1.1-8B-Model_Stock", + "name": "ichor_1.1-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.8096, + "BBH": 0.5281, + "MATH Level 5": 0.1775, + "GPQA": 0.3062, + "MUSR": 0.4068, + "MMLU-PRO": 0.3856 + } + }, + { + "model_id": "DreadPoor/inexpertus-8B-Model_Stock", + "name": "inexpertus-8B-Model_Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7795, + "BBH": 0.528, + "MATH Level 5": 0.1707, + "GPQA": 0.3096, + "MUSR": 0.4118, + "MMLU-PRO": 0.3791 + } + }, + { + "model_id": "DreadPoor/inexpertus_1.1-8B-LINEAR", + "name": "inexpertus_1.1-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7527, + "BBH": 0.5525, + "MATH Level 5": 0.173, + "GPQA": 0.2978, + "MUSR": 0.4173, + "MMLU-PRO": 0.3827 + } + }, + { + "model_id": "DreadPoor/inexpertus_1.2-8B-LINEAR", + "name": "inexpertus_1.2-8B-LINEAR", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7348, + "BBH": 0.5523, + "MATH Level 5": 0.1586, + "GPQA": 0.2953, + "MUSR": 0.4133, + "MMLU-PRO": 0.3788 + } + }, + { + "model_id": "DreadPoor/mergekit-nuslerp-nqzkedi", + "name": "mergekit-nuslerp-nqzkedi", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7765, + "BBH": 0.5362, + "MATH Level 5": 0.1881, + "GPQA": 0.3012, + "MUSR": 0.4225, + "MMLU-PRO": 0.3919 + } + }, + { + "model_id": "DreadPoor/remember_to_breathe-8b-Model-Stock", + "name": "remember_to_breathe-8b-Model-Stock", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7104, + "BBH": 0.5412, + "MATH Level 5": 0.1488, + "GPQA": 0.3012, + "MUSR": 0.4145, + "MMLU-PRO": 0.3761 + } + }, + { + "model_id": "DreadPoor/test", + "name": "test", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4937, + "BBH": 0.5372, + "MATH Level 5": 0.1934, + "GPQA": 0.271, + "MUSR": 0.4351, + "MMLU-PRO": 0.3647 + } + }, + { + "model_id": "DreadPoor/test_ALT", + "name": "test_ALT", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.4997, + "BBH": 0.537, + "MATH Level 5": 0.1707, + "GPQA": 0.2693, + "MUSR": 0.4363, + "MMLU-PRO": 0.3492 + } + }, + { + "model_id": "DreadPoor/tests_pending-do_not_use_yet", + "name": "tests_pending-do_not_use_yet", + "developer": "DreadPoor", + "scores": { + "IFEval": 0.7691, + "BBH": 0.5408, + "MATH Level 5": 0.1979, + "GPQA": 0.297, + "MUSR": 0.4005, + "MMLU-PRO": 0.3827 + } + }, + { + "model_id": "ECE-ILAB-PRYMMAL/ILAB-Merging-3B-V2", + "name": "ILAB-Merging-3B-V2", + "developer": "ECE-ILAB-PRYMMAL", + "scores": { + "IFEval": 0.4029, + "BBH": 0.5402, + "MATH Level 5": 0.1518, + "GPQA": 0.3054, + "MUSR": 0.4332, + "MMLU-PRO": 0.3861 + } + }, + { + "model_id": "EVA-UNIT-01/EVA-Qwen2.5-14B-v0.2", + "name": "EVA-Qwen2.5-14B-v0.2", + "developer": "EVA-UNIT-01", + "scores": { + "IFEval": 0.4038, + "BBH": 0.609, + "MATH Level 5": 0.3406, + "GPQA": 0.3943, + "MUSR": 0.4794, + "MMLU-PRO": 0.5135 + } + }, + { + "model_id": "EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2", + "name": "EVA-Qwen2.5-72B-v0.2", + "developer": "EVA-UNIT-01", + "scores": { + "IFEval": 0.6879, + "BBH": 0.7088, + "MATH Level 5": 0.4313, + "GPQA": 0.4086, + "MUSR": 0.472, + "MMLU-PRO": 0.5813 + } + }, + { + "model_id": "Edgerunners/meta-llama-3-8b-instruct-hf-ortho-baukit-34fail-3000total-bf16", + "name": "meta-llama-3-8b-instruct-hf-ortho-baukit-34fail-3000total-bf16", + "developer": "Edgerunners", + "scores": { + "IFEval": 0.7147, + "BBH": 0.498, + "MATH Level 5": 0.0906, + "GPQA": 0.2601, + "MUSR": 0.3342, + "MMLU-PRO": 0.3636 + } + }, + { + "model_id": "EleutherAI/gpt-j-6b", + "name": "gpt-j-6b", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2522, + "BBH": 0.3191, + "MATH Level 5": 0.0136, + "GPQA": 0.2458, + "MUSR": 0.3658, + "MMLU-PRO": 0.1241 + } + }, + { + "model_id": "EleutherAI/gpt-neo-1.3B", + "name": "gpt-neo-1.3B", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2079, + "BBH": 0.3039, + "MATH Level 5": 0.0106, + "GPQA": 0.2559, + "MUSR": 0.3817, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "EleutherAI/gpt-neo-125m", + "name": "gpt-neo-125m", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.1905, + "BBH": 0.3115, + "MATH Level 5": 0.006, + "GPQA": 0.2534, + "MUSR": 0.3593, + "MMLU-PRO": 0.1026 + } + }, + { + "model_id": "EleutherAI/gpt-neo-2.7B", + "name": "gpt-neo-2.7B", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.259, + "BBH": 0.314, + "MATH Level 5": 0.0106, + "GPQA": 0.2659, + "MUSR": 0.3554, + "MMLU-PRO": 0.1163 + } + }, + { + "model_id": "EleutherAI/gpt-neox-20b", + "name": "gpt-neox-20b", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2587, + "BBH": 0.3165, + "MATH Level 5": 0.0136, + "GPQA": 0.2433, + "MUSR": 0.3647, + "MMLU-PRO": 0.1155 + } + }, + { + "model_id": "EleutherAI/pythia-1.4b", + "name": "pythia-1.4b", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2371, + "BBH": 0.315, + "MATH Level 5": 0.0151, + "GPQA": 0.2617, + "MUSR": 0.3538, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "EleutherAI/pythia-12b", + "name": "pythia-12b", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2471, + "BBH": 0.318, + "MATH Level 5": 0.0166, + "GPQA": 0.2466, + "MUSR": 0.3647, + "MMLU-PRO": 0.1109 + } + }, + { + "model_id": "EleutherAI/pythia-160m", + "name": "pythia-160m", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.1816, + "BBH": 0.297, + "MATH Level 5": 0.0091, + "GPQA": 0.2584, + "MUSR": 0.4179, + "MMLU-PRO": 0.112 + } + }, + { + "model_id": "EleutherAI/pythia-1b", + "name": "pythia-1b", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2208, + "BBH": 0.3004, + "MATH Level 5": 0.0091, + "GPQA": 0.2567, + "MUSR": 0.3552, + "MMLU-PRO": 0.1136 + } + }, + { + "model_id": "EleutherAI/pythia-2.8b", + "name": "pythia-2.8b", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2173, + "BBH": 0.3224, + "MATH Level 5": 0.0136, + "GPQA": 0.25, + "MUSR": 0.3486, + "MMLU-PRO": 0.1137 + } + }, + { + "model_id": "EleutherAI/pythia-410m", + "name": "pythia-410m", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2195, + "BBH": 0.3028, + "MATH Level 5": 0.0098, + "GPQA": 0.2592, + "MUSR": 0.3578, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "EleutherAI/pythia-6.9b", + "name": "pythia-6.9b", + "developer": "EleutherAI", + "scores": { + "IFEval": 0.2281, + "BBH": 0.3232, + "MATH Level 5": 0.0144, + "GPQA": 0.2517, + "MUSR": 0.3591, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "Enno-Ai/EnnoAi-Pro-French-Llama-3-8B-v0.4", + "name": "EnnoAi-Pro-French-Llama-3-8B-v0.4", + "developer": "Enno-Ai", + "scores": { + "IFEval": 0.4189, + "BBH": 0.4075, + "MATH Level 5": 0.0363, + "GPQA": 0.271, + "MUSR": 0.417, + "MMLU-PRO": 0.2635 + } + }, + { + "model_id": "Enno-Ai/EnnoAi-Pro-Llama-3-8B", + "name": "EnnoAi-Pro-Llama-3-8B", + "developer": "Enno-Ai", + "scores": { + "IFEval": 0.3195, + "BBH": 0.4152, + "MATH Level 5": 0.0219, + "GPQA": 0.2617, + "MUSR": 0.4071, + "MMLU-PRO": 0.2151 + } + }, + { + "model_id": "Enno-Ai/EnnoAi-Pro-Llama-3-8B-v0.3", + "name": "EnnoAi-Pro-Llama-3-8B-v0.3", + "developer": "Enno-Ai", + "scores": { + "IFEval": 0.5083, + "BBH": 0.4101, + "MATH Level 5": 0.0483, + "GPQA": 0.2651, + "MUSR": 0.4236, + "MMLU-PRO": 0.299 + } + }, + { + "model_id": "Enno-Ai/EnnoAi-Pro-Llama-3.1-8B-v0.9", + "name": "EnnoAi-Pro-Llama-3.1-8B-v0.9", + "developer": "Enno-Ai", + "scores": { + "IFEval": 0.4689, + "BBH": 0.416, + "MATH Level 5": 0.0378, + "GPQA": 0.2659, + "MUSR": 0.3832, + "MMLU-PRO": 0.2596 + } + }, + { + "model_id": "EnnoAi/EnnoAi-7B-French-Instruct-202502", + "name": "EnnoAi-7B-French-Instruct-202502", + "developer": "EnnoAi", + "scores": { + "IFEval": 0.5564, + "BBH": 0.5575, + "MATH Level 5": 0.3724, + "GPQA": 0.2953, + "MUSR": 0.46, + "MMLU-PRO": 0.4013 + } + }, + { + "model_id": "EnnoAi/EnnoAi-Pro-Llama-3.1-8B-v1.0", + "name": "EnnoAi-Pro-Llama-3.1-8B-v1.0", + "developer": "EnnoAi", + "scores": { + "IFEval": 0.4704, + "BBH": 0.416, + "MATH Level 5": 0.0378, + "GPQA": 0.2659, + "MUSR": 0.3832, + "MMLU-PRO": 0.2596 + } + }, + { + "model_id": "Epiculous/Azure_Dusk-v0.2", + "name": "Azure_Dusk-v0.2", + "developer": "Epiculous", + "scores": { + "IFEval": 0.3467, + "BBH": 0.412, + "MATH Level 5": 0.0295, + "GPQA": 0.2609, + "MUSR": 0.3835, + "MMLU-PRO": 0.3034 + } + }, + { + "model_id": "Epiculous/Crimson_Dawn-v0.2", + "name": "Crimson_Dawn-v0.2", + "developer": "Epiculous", + "scores": { + "IFEval": 0.3103, + "BBH": 0.4482, + "MATH Level 5": 0.0431, + "GPQA": 0.276, + "MUSR": 0.4152, + "MMLU-PRO": 0.2721 + } + }, + { + "model_id": "Epiculous/NovaSpark", + "name": "NovaSpark", + "developer": "Epiculous", + "scores": { + "IFEval": 0.6408, + "BBH": 0.5064, + "MATH Level 5": 0.1518, + "GPQA": 0.2978, + "MUSR": 0.3882, + "MMLU-PRO": 0.3649 + } + }, + { + "model_id": "Epiculous/Violet_Twilight-v0.2", + "name": "Violet_Twilight-v0.2", + "developer": "Epiculous", + "scores": { + "IFEval": 0.4532, + "BBH": 0.4615, + "MATH Level 5": 0.0287, + "GPQA": 0.2659, + "MUSR": 0.4299, + "MMLU-PRO": 0.3111 + } + }, + { + "model_id": "EpistemeAI/Alpaca-Llama3.1-8B", + "name": "Alpaca-Llama3.1-8B", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.1599, + "BBH": 0.4755, + "MATH Level 5": 0.0506, + "GPQA": 0.2903, + "MUSR": 0.3403, + "MMLU-PRO": 0.3246 + } + }, + { + "model_id": "EpistemeAI/Athena-gemma-2-2b-it", + "name": "Athena-gemma-2-2b-it", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.3134, + "BBH": 0.4264, + "MATH Level 5": 0.0491, + "GPQA": 0.2685, + "MUSR": 0.4351, + "MMLU-PRO": 0.2422 + } + }, + { + "model_id": "EpistemeAI/Athena-gemma-2-2b-it-Philos", + "name": "Athena-gemma-2-2b-it-Philos", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4621, + "BBH": 0.3795, + "MATH Level 5": 0.037, + "GPQA": 0.281, + "MUSR": 0.4314, + "MMLU-PRO": 0.2248 + } + }, + { + "model_id": "EpistemeAI/Athene-codegemma-2-7b-it-alpaca-v1.3", + "name": "Athene-codegemma-2-7b-it-alpaca-v1.3", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.403, + "BBH": 0.4332, + "MATH Level 5": 0.0619, + "GPQA": 0.2802, + "MUSR": 0.4503, + "MMLU-PRO": 0.2587 + } + }, + { + "model_id": "EpistemeAI/DeepPhi-3.5-mini-instruct", + "name": "DeepPhi-3.5-mini-instruct", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.1326, + "BBH": 0.2882, + "MATH Level 5": 0.0068, + "GPQA": 0.2332, + "MUSR": 0.3656, + "MMLU-PRO": 0.1103 + } + }, + { + "model_id": "EpistemeAI/DeepThinkers-Phi4", + "name": "DeepThinkers-Phi4", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.694, + "BBH": 0.679, + "MATH Level 5": 0.4585, + "GPQA": 0.3406, + "MUSR": 0.3981, + "MMLU-PRO": 0.5258 + } + }, + { + "model_id": "EpistemeAI/FineLlama3.1-8B-Instruct", + "name": "FineLlama3.1-8B-Instruct", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.08, + "BBH": 0.4557, + "MATH Level 5": 0.0347, + "GPQA": 0.2802, + "MUSR": 0.3482, + "MMLU-PRO": 0.3113 + } + }, + { + "model_id": "EpistemeAI/Fireball-12B", + "name": "Fireball-12B", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.1834, + "BBH": 0.5111, + "MATH Level 5": 0.0408, + "GPQA": 0.2617, + "MUSR": 0.4236, + "MMLU-PRO": 0.3344 + } + }, + { + "model_id": "EpistemeAI/Fireball-12B-v1.13a-philosophers", + "name": "Fireball-12B-v1.13a-philosophers", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.0876, + "BBH": 0.5103, + "MATH Level 5": 0.0461, + "GPQA": 0.3012, + "MUSR": 0.4081, + "MMLU-PRO": 0.3367 + } + }, + { + "model_id": "EpistemeAI/Fireball-Alpaca-Llama-3.1-8B-Philos-DPO-200", + "name": "Fireball-Alpaca-Llama-3.1-8B-Philos-DPO-200", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4577, + "BBH": 0.4838, + "MATH Level 5": 0.1231, + "GPQA": 0.3003, + "MUSR": 0.3945, + "MMLU-PRO": 0.3583 + } + }, + { + "model_id": "EpistemeAI/Fireball-Alpaca-Llama3.1.07-8B-Philos-Math-KTO-beta", + "name": "Fireball-Alpaca-Llama3.1.07-8B-Philos-Math-KTO-beta", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7274, + "BBH": 0.4865, + "MATH Level 5": 0.1526, + "GPQA": 0.2802, + "MUSR": 0.3619, + "MMLU-PRO": 0.3543 + } + }, + { + "model_id": "EpistemeAI/Fireball-Alpaca-Llama3.1.08-8B-Philos-C-R2", + "name": "Fireball-Alpaca-Llama3.1.08-8B-Philos-C-R2", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4673, + "BBH": 0.4932, + "MATH Level 5": 0.1239, + "GPQA": 0.2861, + "MUSR": 0.4624, + "MMLU-PRO": 0.3352 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-0.001-128K-auto", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-0.001-128K-auto", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4432, + "BBH": 0.4824, + "MATH Level 5": 0.1329, + "GPQA": 0.3121, + "MUSR": 0.4066, + "MMLU-PRO": 0.3516 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4457, + "BBH": 0.4897, + "MATH Level 5": 0.1208, + "GPQA": 0.2945, + "MUSR": 0.3762, + "MMLU-PRO": 0.3543 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.5975, + "BBH": 0.4904, + "MATH Level 5": 0.1337, + "GPQA": 0.302, + "MUSR": 0.401, + "MMLU-PRO": 0.3423 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.6691, + "BBH": 0.4668, + "MATH Level 5": 0.1337, + "GPQA": 0.2727, + "MUSR": 0.3418, + "MMLU-PRO": 0.3389 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7207, + "BBH": 0.461, + "MATH Level 5": 0.1314, + "GPQA": 0.2701, + "MUSR": 0.3432, + "MMLU-PRO": 0.3354 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.004-128K-code-COT", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.004-128K-code-COT", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4578, + "BBH": 0.4761, + "MATH Level 5": 0.1382, + "GPQA": 0.2936, + "MUSR": 0.3881, + "MMLU-PRO": 0.3471 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.004-128K-code-ds-auto", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.004-128K-code-ds-auto", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7205, + "BBH": 0.4818, + "MATH Level 5": 0.1435, + "GPQA": 0.2483, + "MUSR": 0.33, + "MMLU-PRO": 0.3548 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.1-8B-Instruct-Math", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Math", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4623, + "BBH": 0.4983, + "MATH Level 5": 0.108, + "GPQA": 0.2911, + "MUSR": 0.3641, + "MMLU-PRO": 0.3331 + } + }, + { + "model_id": "EpistemeAI/Fireball-Meta-Llama-3.2-8B-Instruct-agent-003-128k-code-DPO", + "name": "Fireball-Meta-Llama-3.2-8B-Instruct-agent-003-128k-code-DPO", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4611, + "BBH": 0.4801, + "MATH Level 5": 0.1254, + "GPQA": 0.3003, + "MUSR": 0.3998, + "MMLU-PRO": 0.3521 + } + }, + { + "model_id": "EpistemeAI/Fireball-Mistral-Nemo-Base-2407-v1-DPO2", + "name": "Fireball-Mistral-Nemo-Base-2407-v1-DPO2", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.1861, + "BBH": 0.4968, + "MATH Level 5": 0.0363, + "GPQA": 0.2919, + "MUSR": 0.404, + "MMLU-PRO": 0.3353 + } + }, + { + "model_id": "EpistemeAI/Fireball-R1-Llama-3.1-8B", + "name": "Fireball-R1-Llama-3.1-8B", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4427, + "BBH": 0.3643, + "MATH Level 5": 0.3112, + "GPQA": 0.2483, + "MUSR": 0.3288, + "MMLU-PRO": 0.1115 + } + }, + { + "model_id": "EpistemeAI/Fireball-R1-Llama-3.1-8B-Medical-COT", + "name": "Fireball-R1-Llama-3.1-8B-Medical-COT", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.3216, + "BBH": 0.3716, + "MATH Level 5": 0.327, + "GPQA": 0.2743, + "MUSR": 0.3114, + "MMLU-PRO": 0.1402 + } + }, + { + "model_id": "EpistemeAI/Fireball-R1.1-Llama-3.1-8B", + "name": "Fireball-R1.1-Llama-3.1-8B", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.3676, + "BBH": 0.3326, + "MATH Level 5": 0.1382, + "GPQA": 0.2517, + "MUSR": 0.3419, + "MMLU-PRO": 0.1115 + } + }, + { + "model_id": "EpistemeAI/Llama-3.2-3B-Agent007-Coder", + "name": "Llama-3.2-3B-Agent007-Coder", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.54, + "BBH": 0.4304, + "MATH Level 5": 0.111, + "GPQA": 0.2576, + "MUSR": 0.3668, + "MMLU-PRO": 0.2852 + } + }, + { + "model_id": "EpistemeAI/Mistral-Nemo-Instruct-12B-Philosophy-Math", + "name": "Mistral-Nemo-Instruct-12B-Philosophy-Math", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.0695, + "BBH": 0.5365, + "MATH Level 5": 0.0959, + "GPQA": 0.3314, + "MUSR": 0.4292, + "MMLU-PRO": 0.3296 + } + }, + { + "model_id": "EpistemeAI/OpenReasoner-Llama-3.2-3B-rs1.0", + "name": "OpenReasoner-Llama-3.2-3B-rs1.0", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7274, + "BBH": 0.4519, + "MATH Level 5": 0.1344, + "GPQA": 0.2718, + "MUSR": 0.3461, + "MMLU-PRO": 0.3134 + } + }, + { + "model_id": "EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Empathy", + "name": "Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Empathy", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7101, + "BBH": 0.4628, + "MATH Level 5": 0.1397, + "GPQA": 0.2768, + "MUSR": 0.3195, + "MMLU-PRO": 0.3311 + } + }, + { + "model_id": "EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Logic", + "name": "Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-Logic", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7122, + "BBH": 0.4566, + "MATH Level 5": 0.1246, + "GPQA": 0.2844, + "MUSR": 0.3235, + "MMLU-PRO": 0.335 + } + }, + { + "model_id": "EpistemeAI/Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-divergent", + "name": "Polypsyche-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto-divergent", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.6915, + "BBH": 0.4525, + "MATH Level 5": 0.1292, + "GPQA": 0.2668, + "MUSR": 0.3578, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "EpistemeAI/Reasoning-Llama-3.1-CoT-RE1-NMT", + "name": "Reasoning-Llama-3.1-CoT-RE1-NMT", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4829, + "BBH": 0.4736, + "MATH Level 5": 0.1299, + "GPQA": 0.2609, + "MUSR": 0.3182, + "MMLU-PRO": 0.3343 + } + }, + { + "model_id": "EpistemeAI/Reasoning-Llama-3.1-CoT-RE1-NMT-V2-ORPO", + "name": "Reasoning-Llama-3.1-CoT-RE1-NMT-V2-ORPO", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4553, + "BBH": 0.4804, + "MATH Level 5": 0.1292, + "GPQA": 0.307, + "MUSR": 0.3931, + "MMLU-PRO": 0.3598 + } + }, + { + "model_id": "EpistemeAI/Reasoning-Llama-3.2-1B-Instruct-v1.2", + "name": "Reasoning-Llama-3.2-1B-Instruct-v1.2", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.4087, + "BBH": 0.3324, + "MATH Level 5": 0.0506, + "GPQA": 0.2609, + "MUSR": 0.3222, + "MMLU-PRO": 0.1179 + } + }, + { + "model_id": "EpistemeAI/Reasoning-Llama-3.2-1B-Instruct-v1.3", + "name": "Reasoning-Llama-3.2-1B-Instruct-v1.3", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.3273, + "BBH": 0.3263, + "MATH Level 5": 0.0506, + "GPQA": 0.2584, + "MUSR": 0.326, + "MMLU-PRO": 0.1173 + } + }, + { + "model_id": "EpistemeAI/Reasoning-Llama-3.2-3B-Math-Instruct-RE1", + "name": "Reasoning-Llama-3.2-3B-Math-Instruct-RE1", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.512, + "BBH": 0.4381, + "MATH Level 5": 0.108, + "GPQA": 0.2643, + "MUSR": 0.3435, + "MMLU-PRO": 0.2789 + } + }, + { + "model_id": "EpistemeAI/Reasoning-Llama-3.2-3B-Math-Instruct-RE1-ORPO", + "name": "Reasoning-Llama-3.2-3B-Math-Instruct-RE1-ORPO", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.729, + "BBH": 0.4518, + "MATH Level 5": 0.1533, + "GPQA": 0.2735, + "MUSR": 0.3487, + "MMLU-PRO": 0.31 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-1.0-3B-Instruct-r01-Reflect-Math", + "name": "ReasoningCore-1.0-3B-Instruct-r01-Reflect-Math", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.5903, + "BBH": 0.4364, + "MATH Level 5": 0.148, + "GPQA": 0.2601, + "MUSR": 0.3314, + "MMLU-PRO": 0.2823 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-0", + "name": "ReasoningCore-3B-0", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7341, + "BBH": 0.4446, + "MATH Level 5": 0.1586, + "GPQA": 0.2727, + "MUSR": 0.3554, + "MMLU-PRO": 0.3172 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-Instruct-r01-Reflect", + "name": "ReasoningCore-3B-Instruct-r01-Reflect", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7335, + "BBH": 0.445, + "MATH Level 5": 0.1541, + "GPQA": 0.2735, + "MUSR": 0.3527, + "MMLU-PRO": 0.3144 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-R01", + "name": "ReasoningCore-3B-R01", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.2976, + "BBH": 0.4373, + "MATH Level 5": 0.1299, + "GPQA": 0.2609, + "MUSR": 0.3195, + "MMLU-PRO": 0.2591 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-RE1-V2", + "name": "ReasoningCore-3B-RE1-V2", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7393, + "BBH": 0.4462, + "MATH Level 5": 0.1563, + "GPQA": 0.2735, + "MUSR": 0.3541, + "MMLU-PRO": 0.3181 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-RE1-V2A", + "name": "ReasoningCore-3B-RE1-V2A", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.5733, + "BBH": 0.419, + "MATH Level 5": 0.0929, + "GPQA": 0.2777, + "MUSR": 0.3352, + "MMLU-PRO": 0.2736 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-RE1-V2B", + "name": "ReasoningCore-3B-RE1-V2B", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.5051, + "BBH": 0.4168, + "MATH Level 5": 0.1073, + "GPQA": 0.2617, + "MUSR": 0.3448, + "MMLU-PRO": 0.2673 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-RE1-V2C", + "name": "ReasoningCore-3B-RE1-V2C", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.5057, + "BBH": 0.4177, + "MATH Level 5": 0.0974, + "GPQA": 0.2609, + "MUSR": 0.3422, + "MMLU-PRO": 0.2691 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-T1-V1", + "name": "ReasoningCore-3B-T1-V1", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7208, + "BBH": 0.4517, + "MATH Level 5": 0.1458, + "GPQA": 0.276, + "MUSR": 0.354, + "MMLU-PRO": 0.312 + } + }, + { + "model_id": "EpistemeAI/ReasoningCore-3B-T1_1", + "name": "ReasoningCore-3B-T1_1", + "developer": "EpistemeAI", + "scores": { + "IFEval": 0.7275, + "BBH": 0.4524, + "MATH Level 5": 0.1541, + "GPQA": 0.276, + "MUSR": 0.3554, + "MMLU-PRO": 0.3117 + } + }, + { + "model_id": "EpistemeAI2/Athene-codegemma-2-7b-it-alpaca-v1.2", + "name": "Athene-codegemma-2-7b-it-alpaca-v1.2", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.4351, + "BBH": 0.4175, + "MATH Level 5": 0.0423, + "GPQA": 0.271, + "MUSR": 0.417, + "MMLU-PRO": 0.2297 + } + }, + { + "model_id": "EpistemeAI2/Fireball-12B-v1.2", + "name": "Fireball-12B-v1.2", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.1355, + "BBH": 0.5019, + "MATH Level 5": 0.0415, + "GPQA": 0.2987, + "MUSR": 0.4173, + "MMLU-PRO": 0.3337 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1-8B-Philos", + "name": "Fireball-Alpaca-Llama3.1-8B-Philos", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.4986, + "BBH": 0.4978, + "MATH Level 5": 0.1186, + "GPQA": 0.2928, + "MUSR": 0.4277, + "MMLU-PRO": 0.3406 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1.01-8B-Philos", + "name": "Fireball-Alpaca-Llama3.1.01-8B-Philos", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.4212, + "BBH": 0.4956, + "MATH Level 5": 0.136, + "GPQA": 0.2886, + "MUSR": 0.4371, + "MMLU-PRO": 0.3383 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1.03-8B-Philos", + "name": "Fireball-Alpaca-Llama3.1.03-8B-Philos", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.3881, + "BBH": 0.4951, + "MATH Level 5": 0.1284, + "GPQA": 0.2785, + "MUSR": 0.428, + "MMLU-PRO": 0.3355 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1.04-8B-Philos", + "name": "Fireball-Alpaca-Llama3.1.04-8B-Philos", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.4084, + "BBH": 0.493, + "MATH Level 5": 0.1201, + "GPQA": 0.2903, + "MUSR": 0.4372, + "MMLU-PRO": 0.3403 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1.06-8B-Philos-dpo", + "name": "Fireball-Alpaca-Llama3.1.06-8B-Philos-dpo", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.4866, + "BBH": 0.4881, + "MATH Level 5": 0.1307, + "GPQA": 0.2978, + "MUSR": 0.3932, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1.07-8B-Philos-Math", + "name": "Fireball-Alpaca-Llama3.1.07-8B-Philos-Math", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.5079, + "BBH": 0.4847, + "MATH Level 5": 0.1201, + "GPQA": 0.2961, + "MUSR": 0.4063, + "MMLU-PRO": 0.3531 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1.08-8B-C-R1-KTO-Reflection", + "name": "Fireball-Alpaca-Llama3.1.08-8B-C-R1-KTO-Reflection", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.3952, + "BBH": 0.4955, + "MATH Level 5": 0.1246, + "GPQA": 0.2995, + "MUSR": 0.4048, + "MMLU-PRO": 0.3593 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Alpaca-Llama3.1.08-8B-Philos-C-R1", + "name": "Fireball-Alpaca-Llama3.1.08-8B-Philos-C-R1", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.5316, + "BBH": 0.4828, + "MATH Level 5": 0.1239, + "GPQA": 0.297, + "MUSR": 0.4103, + "MMLU-PRO": 0.3523 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Llama-3.1-8B-Philos-Reflection", + "name": "Fireball-Llama-3.1-8B-Philos-Reflection", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.3596, + "BBH": 0.4898, + "MATH Level 5": 0.1284, + "GPQA": 0.3079, + "MUSR": 0.3957, + "MMLU-PRO": 0.3551 + } + }, + { + "model_id": "EpistemeAI2/Fireball-MathMistral-Nemo-Base-2407-v2dpo", + "name": "Fireball-MathMistral-Nemo-Base-2407-v2dpo", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.3097, + "BBH": 0.4328, + "MATH Level 5": 0.037, + "GPQA": 0.2634, + "MUSR": 0.403, + "MMLU-PRO": 0.1148 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-math", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-math", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.5515, + "BBH": 0.4808, + "MATH Level 5": 0.1352, + "GPQA": 0.3045, + "MUSR": 0.3693, + "MMLU-PRO": 0.342 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.005-128K-code-COT", + "name": "Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.005-128K-code-COT", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.4633, + "BBH": 0.4791, + "MATH Level 5": 0.1171, + "GPQA": 0.3121, + "MUSR": 0.3774, + "MMLU-PRO": 0.3565 + } + }, + { + "model_id": "EpistemeAI2/Fireball-Phi-3-medium-4k-inst-Philos", + "name": "Fireball-Phi-3-medium-4k-inst-Philos", + "developer": "EpistemeAI2", + "scores": { + "IFEval": 0.5313, + "BBH": 0.6178, + "MATH Level 5": 0.1707, + "GPQA": 0.3322, + "MUSR": 0.4139, + "MMLU-PRO": 0.4599 + } + }, + { + "model_id": "Eric111/CatunaMayo", + "name": "CatunaMayo", + "developer": "Eric111", + "scores": { + "IFEval": 0.4074, + "BBH": 0.5244, + "MATH Level 5": 0.0846, + "GPQA": 0.2919, + "MUSR": 0.454, + "MMLU-PRO": 0.3178 + } + }, + { + "model_id": "Eric111/CatunaMayo-DPO", + "name": "CatunaMayo-DPO", + "developer": "Eric111", + "scores": { + "IFEval": 0.4215, + "BBH": 0.5224, + "MATH Level 5": 0.0816, + "GPQA": 0.2919, + "MUSR": 0.445, + "MMLU-PRO": 0.317 + } + }, + { + "model_id": "Etherll/Chocolatine-3B-Instruct-DPO-Revised-Ties", + "name": "Chocolatine-3B-Instruct-DPO-Revised-Ties", + "developer": "Etherll", + "scores": { + "IFEval": 0.3725, + "BBH": 0.5411, + "MATH Level 5": 0.1631, + "GPQA": 0.3238, + "MUSR": 0.4649, + "MMLU-PRO": 0.3978 + } + }, + { + "model_id": "Etherll/Chocolatine-3B-Instruct-DPO-Revised-Ties-v2", + "name": "Chocolatine-3B-Instruct-DPO-Revised-Ties-v2", + "developer": "Etherll", + "scores": { + "IFEval": 0.374, + "BBH": 0.5411, + "MATH Level 5": 0.1631, + "GPQA": 0.3238, + "MUSR": 0.4649, + "MMLU-PRO": 0.3978 + } + }, + { + "model_id": "Etherll/Herplete-LLM-Llama-3.1-8b", + "name": "Herplete-LLM-Llama-3.1-8b", + "developer": "Etherll", + "scores": { + "IFEval": 0.6106, + "BBH": 0.5347, + "MATH Level 5": 0.1548, + "GPQA": 0.3146, + "MUSR": 0.3991, + "MMLU-PRO": 0.3752 + } + }, + { + "model_id": "Etherll/Herplete-LLM-Llama-3.1-8b-Ties", + "name": "Herplete-LLM-Llama-3.1-8b-Ties", + "developer": "Etherll", + "scores": { + "IFEval": 0.6164, + "BBH": 0.5338, + "MATH Level 5": 0.1601, + "GPQA": 0.3171, + "MUSR": 0.4017, + "MMLU-PRO": 0.3752 + } + }, + { + "model_id": "Etherll/Qwen2.5-7B-della-test", + "name": "Qwen2.5-7B-della-test", + "developer": "Etherll", + "scores": { + "IFEval": 0.7625, + "BBH": 0.5447, + "MATH Level 5": 0.4894, + "GPQA": 0.3087, + "MUSR": 0.4047, + "MMLU-PRO": 0.4361 + } + }, + { + "model_id": "Etherll/Qwen2.5-Coder-7B-Instruct-Ties", + "name": "Qwen2.5-Coder-7B-Instruct-Ties", + "developer": "Etherll", + "scores": { + "IFEval": 0.5005, + "BBH": 0.4895, + "MATH Level 5": 0.2915, + "GPQA": 0.3297, + "MUSR": 0.4373, + "MMLU-PRO": 0.3503 + } + }, + { + "model_id": "Etherll/Replete-LLM-V3-Llama-3.1-8b", + "name": "Replete-LLM-V3-Llama-3.1-8b", + "developer": "Etherll", + "scores": { + "IFEval": 0.5263, + "BBH": 0.4543, + "MATH Level 5": 0.2273, + "GPQA": 0.2685, + "MUSR": 0.3516, + "MMLU-PRO": 0.347 + } + }, + { + "model_id": "Etherll/SuperHermes", + "name": "SuperHermes", + "developer": "Etherll", + "scores": { + "IFEval": 0.5459, + "BBH": 0.529, + "MATH Level 5": 0.1654, + "GPQA": 0.3238, + "MUSR": 0.44, + "MMLU-PRO": 0.3949 + } + }, + { + "model_id": "Eurdem/Defne-llama3.1-8B", + "name": "Defne-llama3.1-8B", + "developer": "Eurdem", + "scores": { + "IFEval": 0.5036, + "BBH": 0.5321, + "MATH Level 5": 0.1601, + "GPQA": 0.2961, + "MUSR": 0.4331, + "MMLU-PRO": 0.3866 + } + }, + { + "model_id": "FINGU-AI/Chocolatine-Fusion-14B", + "name": "Chocolatine-Fusion-14B", + "developer": "FINGU-AI", + "scores": { + "IFEval": 0.6949, + "BBH": 0.6413, + "MATH Level 5": 0.3852, + "GPQA": 0.3716, + "MUSR": 0.494, + "MMLU-PRO": 0.5262 + } + }, + { + "model_id": "FINGU-AI/L3-8B", + "name": "L3-8B", + "developer": "FINGU-AI", + "scores": { + "IFEval": 0.7517, + "BBH": 0.4986, + "MATH Level 5": 0.2545, + "GPQA": 0.2953, + "MUSR": 0.3828, + "MMLU-PRO": 0.3639 + } + }, + { + "model_id": "FINGU-AI/Phi-4-RRStock", + "name": "Phi-4-RRStock", + "developer": "FINGU-AI", + "scores": { + "IFEval": 0.2855, + "BBH": 0.6443, + "MATH Level 5": 0.0582, + "GPQA": 0.38, + "MUSR": 0.4479, + "MMLU-PRO": 0.4883 + } + }, + { + "model_id": "FINGU-AI/Q-Small-3B", + "name": "Q-Small-3B", + "developer": "FINGU-AI", + "scores": { + "IFEval": 0.4145, + "BBH": 0.4319, + "MATH Level 5": 0.0831, + "GPQA": 0.2668, + "MUSR": 0.4005, + "MMLU-PRO": 0.279 + } + }, + { + "model_id": "FINGU-AI/QwQ-Buddy-32B-Alpha", + "name": "QwQ-Buddy-32B-Alpha", + "developer": "FINGU-AI", + "scores": { + "IFEval": 0.3446, + "BBH": 0.6424, + "MATH Level 5": 0.3852, + "GPQA": 0.3792, + "MUSR": 0.506, + "MMLU-PRO": 0.5294 + } + }, + { + "model_id": "FINGU-AI/RomboUltima-32B", + "name": "RomboUltima-32B", + "developer": "FINGU-AI", + "scores": { + "IFEval": 0.6672, + "BBH": 0.6938, + "MATH Level 5": 0.5385, + "GPQA": 0.3716, + "MUSR": 0.4836, + "MMLU-PRO": 0.5789 + } + }, + { + "model_id": "FINGU-AI/Ultimos-32B", + "name": "Ultimos-32B", + "developer": "FINGU-AI", + "scores": { + "IFEval": 0.1592, + "BBH": 0.2906, + "MATH Level 5": 0.0, + "GPQA": 0.2492, + "MUSR": 0.3286, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "FallenMerick/Chewy-Lemon-Cookie-11B", + "name": "Chewy-Lemon-Cookie-11B", + "developer": "FallenMerick", + "scores": { + "IFEval": 0.4875, + "BBH": 0.5251, + "MATH Level 5": 0.0544, + "GPQA": 0.2794, + "MUSR": 0.4546, + "MMLU-PRO": 0.3267 + } + }, + { + "model_id": "Felladrin/Llama-160M-Chat-v1", + "name": "Llama-160M-Chat-v1", + "developer": "Felladrin", + "scores": { + "IFEval": 0.1575, + "BBH": 0.3036, + "MATH Level 5": 0.006, + "GPQA": 0.2576, + "MUSR": 0.3661, + "MMLU-PRO": 0.1136 + } + }, + { + "model_id": "Felladrin/Minueza-32M-UltraChat", + "name": "Minueza-32M-UltraChat", + "developer": "Felladrin", + "scores": { + "IFEval": 0.1376, + "BBH": 0.2941, + "MATH Level 5": 0.0045, + "GPQA": 0.2559, + "MUSR": 0.3742, + "MMLU-PRO": 0.1133 + } + }, + { + "model_id": "FlofloB/100k_fineweb_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "name": "100k_fineweb_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "developer": "FlofloB", + "scores": { + "IFEval": 0.3083, + "BBH": 0.3323, + "MATH Level 5": 0.0408, + "GPQA": 0.2693, + "MUSR": 0.3302, + "MMLU-PRO": 0.1498 + } + }, + { + "model_id": "FlofloB/10k_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit", + "name": "10k_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit", + "developer": "FlofloB", + "scores": { + "IFEval": 0.5097, + "BBH": 0.5215, + "MATH Level 5": 0.0974, + "GPQA": 0.2995, + "MUSR": 0.431, + "MMLU-PRO": 0.3769 + } + }, + { + "model_id": "FlofloB/10k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "name": "10k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "developer": "FlofloB", + "scores": { + "IFEval": 0.2815, + "BBH": 0.3306, + "MATH Level 5": 0.031, + "GPQA": 0.2794, + "MUSR": 0.3302, + "MMLU-PRO": 0.1541 + } + }, + { + "model_id": "FlofloB/40k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "name": "40k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "developer": "FlofloB", + "scores": { + "IFEval": 0.3016, + "BBH": 0.3325, + "MATH Level 5": 0.0332, + "GPQA": 0.2676, + "MUSR": 0.3408, + "MMLU-PRO": 0.1485 + } + }, + { + "model_id": "FlofloB/83k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "name": "83k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit", + "developer": "FlofloB", + "scores": { + "IFEval": 0.2869, + "BBH": 0.3347, + "MATH Level 5": 0.0302, + "GPQA": 0.2735, + "MUSR": 0.3289, + "MMLU-PRO": 0.1555 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1000k_fineweb", + "name": "smollm2-135M_pretrained_1000k_fineweb", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1485, + "BBH": 0.2918, + "MATH Level 5": 0.0091, + "GPQA": 0.2626, + "MUSR": 0.3581, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1000k_fineweb_uncovai_human_removed", + "name": "smollm2-135M_pretrained_1000k_fineweb_uncovai_human_removed", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1554, + "BBH": 0.3066, + "MATH Level 5": 0.006, + "GPQA": 0.2508, + "MUSR": 0.358, + "MMLU-PRO": 0.1143 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1000k_fineweb_uncovai_selected", + "name": "smollm2-135M_pretrained_1000k_fineweb_uncovai_selected", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1468, + "BBH": 0.2932, + "MATH Level 5": 0.0068, + "GPQA": 0.2659, + "MUSR": 0.4048, + "MMLU-PRO": 0.1157 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1200k_fineweb", + "name": "smollm2-135M_pretrained_1200k_fineweb", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1581, + "BBH": 0.2941, + "MATH Level 5": 0.0068, + "GPQA": 0.2643, + "MUSR": 0.3714, + "MMLU-PRO": 0.1076 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1200k_fineweb_uncovai_human_removed", + "name": "smollm2-135M_pretrained_1200k_fineweb_uncovai_human_removed", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1578, + "BBH": 0.295, + "MATH Level 5": 0.0008, + "GPQA": 0.2651, + "MUSR": 0.37, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1200k_fineweb_uncovai_selected", + "name": "smollm2-135M_pretrained_1200k_fineweb_uncovai_selected", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1585, + "BBH": 0.296, + "MATH Level 5": 0.0076, + "GPQA": 0.2634, + "MUSR": 0.3567, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1400k_fineweb", + "name": "smollm2-135M_pretrained_1400k_fineweb", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1764, + "BBH": 0.2922, + "MATH Level 5": 0.0113, + "GPQA": 0.2659, + "MUSR": 0.3873, + "MMLU-PRO": 0.108 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1400k_fineweb_uncovai_human_removed", + "name": "smollm2-135M_pretrained_1400k_fineweb_uncovai_human_removed", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1707, + "BBH": 0.2992, + "MATH Level 5": 0.0106, + "GPQA": 0.2609, + "MUSR": 0.3939, + "MMLU-PRO": 0.1105 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_1400k_fineweb_uncovai_selected", + "name": "smollm2-135M_pretrained_1400k_fineweb_uncovai_selected", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1538, + "BBH": 0.2917, + "MATH Level 5": 0.0106, + "GPQA": 0.2685, + "MUSR": 0.3741, + "MMLU-PRO": 0.1137 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_200k_fineweb_uncovai_human_removed", + "name": "smollm2-135M_pretrained_200k_fineweb_uncovai_human_removed", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1475, + "BBH": 0.3029, + "MATH Level 5": 0.0038, + "GPQA": 0.2584, + "MUSR": 0.3578, + "MMLU-PRO": 0.112 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_200k_fineweb_uncovai_selected", + "name": "smollm2-135M_pretrained_200k_fineweb_uncovai_selected", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1345, + "BBH": 0.2927, + "MATH Level 5": 0.0076, + "GPQA": 0.2508, + "MUSR": 0.366, + "MMLU-PRO": 0.1131 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_400k_fineweb", + "name": "smollm2-135M_pretrained_400k_fineweb", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1511, + "BBH": 0.2972, + "MATH Level 5": 0.0121, + "GPQA": 0.2525, + "MUSR": 0.3794, + "MMLU-PRO": 0.1163 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_400k_fineweb_uncovai_human_removed", + "name": "smollm2-135M_pretrained_400k_fineweb_uncovai_human_removed", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1556, + "BBH": 0.3049, + "MATH Level 5": 0.0091, + "GPQA": 0.255, + "MUSR": 0.386, + "MMLU-PRO": 0.1138 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_400k_fineweb_uncovai_selected", + "name": "smollm2-135M_pretrained_400k_fineweb_uncovai_selected", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1584, + "BBH": 0.2925, + "MATH Level 5": 0.0068, + "GPQA": 0.2542, + "MUSR": 0.382, + "MMLU-PRO": 0.1158 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_600k_fineweb", + "name": "smollm2-135M_pretrained_600k_fineweb", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1639, + "BBH": 0.3014, + "MATH Level 5": 0.006, + "GPQA": 0.2659, + "MUSR": 0.3809, + "MMLU-PRO": 0.1126 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_600k_fineweb_uncovai_human_removed", + "name": "smollm2-135M_pretrained_600k_fineweb_uncovai_human_removed", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1641, + "BBH": 0.3, + "MATH Level 5": 0.0091, + "GPQA": 0.2626, + "MUSR": 0.3793, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_600k_fineweb_uncovai_selected", + "name": "smollm2-135M_pretrained_600k_fineweb_uncovai_selected", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1606, + "BBH": 0.2983, + "MATH Level 5": 0.0076, + "GPQA": 0.2609, + "MUSR": 0.3846, + "MMLU-PRO": 0.1162 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_800k_fineweb", + "name": "smollm2-135M_pretrained_800k_fineweb", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1641, + "BBH": 0.2959, + "MATH Level 5": 0.0083, + "GPQA": 0.2492, + "MUSR": 0.3701, + "MMLU-PRO": 0.1152 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_800k_fineweb_uncovai_human_removed", + "name": "smollm2-135M_pretrained_800k_fineweb_uncovai_human_removed", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1623, + "BBH": 0.3038, + "MATH Level 5": 0.0068, + "GPQA": 0.2525, + "MUSR": 0.3993, + "MMLU-PRO": 0.1138 + } + }, + { + "model_id": "FlofloB/smollm2-135M_pretrained_800k_fineweb_uncovai_selected", + "name": "smollm2-135M_pretrained_800k_fineweb_uncovai_selected", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1474, + "BBH": 0.2943, + "MATH Level 5": 0.0045, + "GPQA": 0.2617, + "MUSR": 0.3766, + "MMLU-PRO": 0.113 + } + }, + { + "model_id": "FlofloB/smollm2_pretrained_200k_fineweb", + "name": "smollm2_pretrained_200k_fineweb", + "developer": "FlofloB", + "scores": { + "IFEval": 0.1527, + "BBH": 0.2995, + "MATH Level 5": 0.0038, + "GPQA": 0.2475, + "MUSR": 0.3699, + "MMLU-PRO": 0.1159 + } + }, + { + "model_id": "FlofloB/test_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit", + "name": "test_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit", + "developer": "FlofloB", + "scores": { + "IFEval": 0.5215, + "BBH": 0.5241, + "MATH Level 5": 0.1103, + "GPQA": 0.3112, + "MUSR": 0.4244, + "MMLU-PRO": 0.3721 + } + }, + { + "model_id": "FuJhen/ft-openhermes-25-mistral-7b-irca-dpo-pairs", + "name": "ft-openhermes-25-mistral-7b-irca-dpo-pairs", + "developer": "FuJhen", + "scores": { + "IFEval": 0.542, + "BBH": 0.4773, + "MATH Level 5": 0.0483, + "GPQA": 0.2785, + "MUSR": 0.4174, + "MMLU-PRO": 0.2956 + } + }, + { + "model_id": "FuJhen/mistral-instruct-7B-DPO", + "name": "mistral-instruct-7B-DPO", + "developer": "FuJhen", + "scores": { + "IFEval": 0.4968, + "BBH": 0.4624, + "MATH Level 5": 0.0385, + "GPQA": 0.2777, + "MUSR": 0.4016, + "MMLU-PRO": 0.3034 + } + }, + { + "model_id": "FuJhen/mistral_7b_v0.1_structedData_e2e", + "name": "mistral_7b_v0.1_structedData_e2e", + "developer": "FuJhen", + "scores": { + "IFEval": 0.1727, + "BBH": 0.4114, + "MATH Level 5": 0.0045, + "GPQA": 0.2794, + "MUSR": 0.3723, + "MMLU-PRO": 0.2811 + } + }, + { + "model_id": "FuJhen/mistral_7b_v0.1_structedData_viggo", + "name": "mistral_7b_v0.1_structedData_viggo", + "developer": "FuJhen", + "scores": { + "IFEval": 0.1783, + "BBH": 0.4524, + "MATH Level 5": 0.0287, + "GPQA": 0.2836, + "MUSR": 0.3738, + "MMLU-PRO": 0.2942 + } + }, + { + "model_id": "FuseAI/FuseChat-7B-v2.0", + "name": "FuseChat-7B-v2.0", + "developer": "FuseAI", + "scores": { + "IFEval": 0.3423, + "BBH": 0.4954, + "MATH Level 5": 0.0612, + "GPQA": 0.302, + "MUSR": 0.4797, + "MMLU-PRO": 0.3162 + } + }, + { + "model_id": "FuseAI/FuseChat-Llama-3.1-8B-Instruct", + "name": "FuseChat-Llama-3.1-8B-Instruct", + "developer": "FuseAI", + "scores": { + "IFEval": 0.7205, + "BBH": 0.512, + "MATH Level 5": 0.2477, + "GPQA": 0.3054, + "MUSR": 0.382, + "MMLU-PRO": 0.3733 + } + }, + { + "model_id": "FuseAI/FuseChat-Llama-3.2-3B-Instruct", + "name": "FuseChat-Llama-3.2-3B-Instruct", + "developer": "FuseAI", + "scores": { + "IFEval": 0.6849, + "BBH": 0.4658, + "MATH Level 5": 0.2424, + "GPQA": 0.2961, + "MUSR": 0.3914, + "MMLU-PRO": 0.3132 + } + }, + { + "model_id": "FuseAI/FuseChat-Qwen-2.5-7B-Instruct", + "name": "FuseChat-Qwen-2.5-7B-Instruct", + "developer": "FuseAI", + "scores": { + "IFEval": 0.5906, + "BBH": 0.5526, + "MATH Level 5": 0.4562, + "GPQA": 0.2961, + "MUSR": 0.3874, + "MMLU-PRO": 0.4118 + } + }, + { + "model_id": "GalrionSoftworks/MN-LooseCannon-12B-v1", + "name": "MN-LooseCannon-12B-v1", + "developer": "GalrionSoftworks", + "scores": { + "IFEval": 0.5418, + "BBH": 0.5128, + "MATH Level 5": 0.0853, + "GPQA": 0.2852, + "MUSR": 0.4138, + "MMLU-PRO": 0.3196 + } + }, + { + "model_id": "GalrionSoftworks/MagnusIntellectus-12B-v1", + "name": "MagnusIntellectus-12B-v1", + "developer": "GalrionSoftworks", + "scores": { + "IFEval": 0.4421, + "BBH": 0.5323, + "MATH Level 5": 0.065, + "GPQA": 0.2844, + "MUSR": 0.4428, + "MMLU-PRO": 0.3421 + } + }, + { + "model_id": "GenVRadmin/AryaBhatta-GemmaOrca-2-Merged", + "name": "AryaBhatta-GemmaOrca-2-Merged", + "developer": "GenVRadmin", + "scores": { + "IFEval": 0.3064, + "BBH": 0.3887, + "MATH Level 5": 0.0498, + "GPQA": 0.2685, + "MUSR": 0.455, + "MMLU-PRO": 0.2384 + } + }, + { + "model_id": "GenVRadmin/AryaBhatta-GemmaOrca-Merged", + "name": "AryaBhatta-GemmaOrca-Merged", + "developer": "GenVRadmin", + "scores": { + "IFEval": 0.3064, + "BBH": 0.4131, + "MATH Level 5": 0.0514, + "GPQA": 0.2559, + "MUSR": 0.3524, + "MMLU-PRO": 0.2228 + } + }, + { + "model_id": "GenVRadmin/AryaBhatta-GemmaUltra-Merged", + "name": "AryaBhatta-GemmaUltra-Merged", + "developer": "GenVRadmin", + "scores": { + "IFEval": 0.3021, + "BBH": 0.4141, + "MATH Level 5": 0.0536, + "GPQA": 0.2534, + "MUSR": 0.4279, + "MMLU-PRO": 0.2266 + } + }, + { + "model_id": "GenVRadmin/llama38bGenZ_Vikas-Merged", + "name": "llama38bGenZ_Vikas-Merged", + "developer": "GenVRadmin", + "scores": { + "IFEval": 0.3, + "BBH": 0.4536, + "MATH Level 5": 0.0574, + "GPQA": 0.2953, + "MUSR": 0.4402, + "MMLU-PRO": 0.2622 + } + }, + { + "model_id": "GoToCompany/gemma2-9b-cpt-sahabatai-v1-instruct", + "name": "gemma2-9b-cpt-sahabatai-v1-instruct", + "developer": "GoToCompany", + "scores": { + "IFEval": 0.6551, + "BBH": 0.5955, + "MATH Level 5": 0.2054, + "GPQA": 0.3347, + "MUSR": 0.4779, + "MMLU-PRO": 0.4264 + } + }, + { + "model_id": "GoToCompany/llama3-8b-cpt-sahabatai-v1-instruct", + "name": "llama3-8b-cpt-sahabatai-v1-instruct", + "developer": "GoToCompany", + "scores": { + "IFEval": 0.5238, + "BBH": 0.4951, + "MATH Level 5": 0.1276, + "GPQA": 0.2668, + "MUSR": 0.4488, + "MMLU-PRO": 0.3453 + } + }, + { + "model_id": "Goekdeniz-Guelmez/Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1", + "name": "Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.3417, + "BBH": 0.3292, + "MATH Level 5": 0.0023, + "GPQA": 0.2576, + "MUSR": 0.3249, + "MMLU-PRO": 0.1638 + } + }, + { + "model_id": "Goekdeniz-Guelmez/Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v1", + "name": "Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v1", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.4769, + "BBH": 0.4186, + "MATH Level 5": 0.2085, + "GPQA": 0.2433, + "MUSR": 0.3675, + "MMLU-PRO": 0.2783 + } + }, + { + "model_id": "Goekdeniz-Guelmez/Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v2", + "name": "Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v2", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.4216, + "BBH": 0.4042, + "MATH Level 5": 0.1269, + "GPQA": 0.2399, + "MUSR": 0.3769, + "MMLU-PRO": 0.2562 + } + }, + { + "model_id": "Goekdeniz-Guelmez/Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v3", + "name": "Josiefied-Qwen2.5-1.5B-Instruct-abliterated-v3", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.4253, + "BBH": 0.4053, + "MATH Level 5": 0.1307, + "GPQA": 0.2433, + "MUSR": 0.3702, + "MMLU-PRO": 0.2556 + } + }, + { + "model_id": "Goekdeniz-Guelmez/Josiefied-Qwen2.5-14B-Instruct-abliterated-v4", + "name": "Josiefied-Qwen2.5-14B-Instruct-abliterated-v4", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.8292, + "BBH": 0.6356, + "MATH Level 5": 0.5423, + "GPQA": 0.3423, + "MUSR": 0.4287, + "MMLU-PRO": 0.5018 + } + }, + { + "model_id": "Goekdeniz-Guelmez/Josiefied-Qwen2.5-7B-Instruct-abliterated-v2", + "name": "Josiefied-Qwen2.5-7B-Instruct-abliterated-v2", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.7814, + "BBH": 0.531, + "MATH Level 5": 0.4532, + "GPQA": 0.2987, + "MUSR": 0.4354, + "MMLU-PRO": 0.412 + } + }, + { + "model_id": "Goekdeniz-Guelmez/j.o.s.i.e.v4o-1.5b-dpo-stage1-v1", + "name": "j.o.s.i.e.v4o-1.5b-dpo-stage1-v1", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.4188, + "BBH": 0.4124, + "MATH Level 5": 0.1201, + "GPQA": 0.2508, + "MUSR": 0.3529, + "MMLU-PRO": 0.2555 + } + }, + { + "model_id": "Goekdeniz-Guelmez/josie-3b-v6.0", + "name": "josie-3b-v6.0", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.601, + "BBH": 0.4496, + "MATH Level 5": 0.2938, + "GPQA": 0.2903, + "MUSR": 0.3861, + "MMLU-PRO": 0.322 + } + }, + { + "model_id": "Goekdeniz-Guelmez/josie-7b-v6.0", + "name": "josie-7b-v6.0", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.7412, + "BBH": 0.5105, + "MATH Level 5": 0.4358, + "GPQA": 0.2827, + "MUSR": 0.4154, + "MMLU-PRO": 0.3807 + } + }, + { + "model_id": "Goekdeniz-Guelmez/josie-7b-v6.0-step2000", + "name": "josie-7b-v6.0-step2000", + "developer": "Goekdeniz-Guelmez", + "scores": { + "IFEval": 0.7628, + "BBH": 0.5098, + "MATH Level 5": 0.0, + "GPQA": 0.2802, + "MUSR": 0.4579, + "MMLU-PRO": 0.4033 + } + }, + { + "model_id": "GreenNode/GreenNode-small-9B-it", + "name": "GreenNode-small-9B-it", + "developer": "GreenNode", + "scores": { + "IFEval": 0.7436, + "BBH": 0.5994, + "MATH Level 5": 0.1745, + "GPQA": 0.3196, + "MUSR": 0.4204, + "MMLU-PRO": 0.3927 + } + }, + { + "model_id": "GritLM/GritLM-7B-KTO", + "name": "GritLM-7B-KTO", + "developer": "GritLM", + "scores": { + "IFEval": 0.531, + "BBH": 0.4853, + "MATH Level 5": 0.0272, + "GPQA": 0.2978, + "MUSR": 0.371, + "MMLU-PRO": 0.268 + } + }, + { + "model_id": "GritLM/GritLM-8x7B-KTO", + "name": "GritLM-8x7B-KTO", + "developer": "GritLM", + "scores": { + "IFEval": 0.5714, + "BBH": 0.582, + "MATH Level 5": 0.1224, + "GPQA": 0.2961, + "MUSR": 0.4217, + "MMLU-PRO": 0.3648 + } + }, + { + "model_id": "Groq/Llama-3-Groq-8B-Tool-Use", + "name": "Llama-3-Groq-8B-Tool-Use", + "developer": "Groq", + "scores": { + "IFEval": 0.6098, + "BBH": 0.4863, + "MATH Level 5": 0.0604, + "GPQA": 0.2676, + "MUSR": 0.366, + "MMLU-PRO": 0.3399 + } + }, + { + "model_id": "Gryphe/Pantheon-RP-1.0-8b-Llama-3", + "name": "Pantheon-RP-1.0-8b-Llama-3", + "developer": "Gryphe", + "scores": { + "IFEval": 0.3933, + "BBH": 0.4539, + "MATH Level 5": 0.0634, + "GPQA": 0.276, + "MUSR": 0.3832, + "MMLU-PRO": 0.3067 + } + }, + { + "model_id": "Gryphe/Pantheon-RP-1.5-12b-Nemo", + "name": "Pantheon-RP-1.5-12b-Nemo", + "developer": "Gryphe", + "scores": { + "IFEval": 0.4763, + "BBH": 0.5196, + "MATH Level 5": 0.0491, + "GPQA": 0.2727, + "MUSR": 0.442, + "MMLU-PRO": 0.3302 + } + }, + { + "model_id": "Gryphe/Pantheon-RP-1.6-12b-Nemo", + "name": "Pantheon-RP-1.6-12b-Nemo", + "developer": "Gryphe", + "scores": { + "IFEval": 0.4481, + "BBH": 0.5204, + "MATH Level 5": 0.0461, + "GPQA": 0.2777, + "MUSR": 0.4288, + "MMLU-PRO": 0.3311 + } + }, + { + "model_id": "Gryphe/Pantheon-RP-1.6-12b-Nemo-KTO", + "name": "Pantheon-RP-1.6-12b-Nemo-KTO", + "developer": "Gryphe", + "scores": { + "IFEval": 0.4636, + "BBH": 0.5277, + "MATH Level 5": 0.0529, + "GPQA": 0.2953, + "MUSR": 0.4248, + "MMLU-PRO": 0.3382 + } + }, + { + "model_id": "Gryphe/Pantheon-RP-Pure-1.6.2-22b-Small", + "name": "Pantheon-RP-Pure-1.6.2-22b-Small", + "developer": "Gryphe", + "scores": { + "IFEval": 0.6931, + "BBH": 0.5305, + "MATH Level 5": 0.2024, + "GPQA": 0.3289, + "MUSR": 0.3765, + "MMLU-PRO": 0.3942 + } + }, + { + "model_id": "GuilhermeNaturaUmana/Nature-Reason-1.2-reallysmall", + "name": "Nature-Reason-1.2-reallysmall", + "developer": "GuilhermeNaturaUmana", + "scores": { + "IFEval": 0.4985, + "BBH": 0.5645, + "MATH Level 5": 0.2576, + "GPQA": 0.3003, + "MUSR": 0.4373, + "MMLU-PRO": 0.4429 + } + }, + { + "model_id": "Gunulhona/Gemma-Ko-Merge", + "name": "Gemma-Ko-Merge", + "developer": "Gunulhona", + "scores": { + "IFEval": 0.6416, + "BBH": 0.5813, + "MATH Level 5": 0.1881, + "GPQA": 0.3356, + "MUSR": 0.4047, + "MMLU-PRO": 0.3879 + } + }, + { + "model_id": "Gunulhona/Gemma-Ko-Merge-PEFT", + "name": "Gemma-Ko-Merge-PEFT", + "developer": "Gunulhona", + "scores": { + "IFEval": 0.4441, + "BBH": 0.4863, + "MATH Level 5": 0.0, + "GPQA": 0.307, + "MUSR": 0.3986, + "MMLU-PRO": 0.3098 + } + }, + { + "model_id": "HPAI-BSC/Llama3-Aloe-8B-Alpha", + "name": "Llama3-Aloe-8B-Alpha", + "developer": "HPAI-BSC", + "scores": { + "IFEval": 0.5081, + "BBH": 0.4831, + "MATH Level 5": 0.0612, + "GPQA": 0.2945, + "MUSR": 0.3673, + "MMLU-PRO": 0.3295 + } + }, + { + "model_id": "HPAI-BSC/Llama3.1-Aloe-Beta-8B", + "name": "Llama3.1-Aloe-Beta-8B", + "developer": "HPAI-BSC", + "scores": { + "IFEval": 0.7253, + "BBH": 0.5093, + "MATH Level 5": 0.1828, + "GPQA": 0.2685, + "MUSR": 0.3835, + "MMLU-PRO": 0.358 + } + }, + { + "model_id": "HPAI-BSC/Qwen2.5-Aloe-Beta-7B", + "name": "Qwen2.5-Aloe-Beta-7B", + "developer": "HPAI-BSC", + "scores": { + "IFEval": 0.4554, + "BBH": 0.5049, + "MATH Level 5": 0.3542, + "GPQA": 0.2911, + "MUSR": 0.426, + "MMLU-PRO": 0.4354 + } + }, + { + "model_id": "HarbingerX/Zeitgeist-3b-V1", + "name": "Zeitgeist-3b-V1", + "developer": "HarbingerX", + "scores": { + "IFEval": 0.6712, + "BBH": 0.4441, + "MATH Level 5": 0.1035, + "GPQA": 0.2819, + "MUSR": 0.3579, + "MMLU-PRO": 0.3009 + } + }, + { + "model_id": "HarbingerX/Zeitgeist-3b-V1.2", + "name": "Zeitgeist-3b-V1.2", + "developer": "HarbingerX", + "scores": { + "IFEval": 0.6754, + "BBH": 0.4441, + "MATH Level 5": 0.1012, + "GPQA": 0.2777, + "MUSR": 0.3579, + "MMLU-PRO": 0.3056 + } + }, + { + "model_id": "Hastagaras/L3.2-JametMini-3B-MK.III", + "name": "L3.2-JametMini-3B-MK.III", + "developer": "Hastagaras", + "scores": { + "IFEval": 0.6183, + "BBH": 0.4539, + "MATH Level 5": 0.1458, + "GPQA": 0.2827, + "MUSR": 0.3686, + "MMLU-PRO": 0.2983 + } + }, + { + "model_id": "Hastagaras/Llama-3.1-Jamet-8B-MK.I", + "name": "Llama-3.1-Jamet-8B-MK.I", + "developer": "Hastagaras", + "scores": { + "IFEval": 0.7338, + "BBH": 0.5049, + "MATH Level 5": 0.1269, + "GPQA": 0.2743, + "MUSR": 0.3726, + "MMLU-PRO": 0.3482 + } + }, + { + "model_id": "Hastagaras/Zabuza-8B-Llama-3.1", + "name": "Zabuza-8B-Llama-3.1", + "developer": "Hastagaras", + "scores": { + "IFEval": 0.6265, + "BBH": 0.4539, + "MATH Level 5": 0.0551, + "GPQA": 0.2643, + "MUSR": 0.3568, + "MMLU-PRO": 0.2923 + } + }, + { + "model_id": "HelpingAI/Cipher-20B", + "name": "Cipher-20B", + "developer": "HelpingAI", + "scores": { + "IFEval": 0.5378, + "BBH": 0.6032, + "MATH Level 5": 0.1994, + "GPQA": 0.2953, + "MUSR": 0.4003, + "MMLU-PRO": 0.3744 + } + }, + { + "model_id": "HelpingAI/Dhanishtha-Large", + "name": "Dhanishtha-Large", + "developer": "HelpingAI", + "scores": { + "IFEval": 0.2457, + "BBH": 0.4604, + "MATH Level 5": 0.3852, + "GPQA": 0.3029, + "MUSR": 0.3845, + "MMLU-PRO": 0.2755 + } + }, + { + "model_id": "HelpingAI/Priya-10B", + "name": "Priya-10B", + "developer": "HelpingAI", + "scores": { + "IFEval": 0.4043, + "BBH": 0.4441, + "MATH Level 5": 0.0189, + "GPQA": 0.2559, + "MUSR": 0.3793, + "MMLU-PRO": 0.2493 + } + }, + { + "model_id": "HelpingAI/Priya-3B", + "name": "Priya-3B", + "developer": "HelpingAI", + "scores": { + "IFEval": 0.4526, + "BBH": 0.3961, + "MATH Level 5": 0.0144, + "GPQA": 0.2567, + "MUSR": 0.3713, + "MMLU-PRO": 0.2339 + } + }, + { + "model_id": "HeraiHench/DeepSeek-R1-Qwen-Coder-8B", + "name": "DeepSeek-R1-Qwen-Coder-8B", + "developer": "HeraiHench", + "scores": { + "IFEval": 0.1869, + "BBH": 0.2913, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3738, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "HeraiHench/Double-Down-Qwen-Math-7B", + "name": "Double-Down-Qwen-Math-7B", + "developer": "HeraiHench", + "scores": { + "IFEval": 0.167, + "BBH": 0.2845, + "MATH Level 5": 0.0008, + "GPQA": 0.2651, + "MUSR": 0.3737, + "MMLU-PRO": 0.1112 + } + }, + { + "model_id": "HeraiHench/Marge-Qwen-Math-7B", + "name": "Marge-Qwen-Math-7B", + "developer": "HeraiHench", + "scores": { + "IFEval": 0.1262, + "BBH": 0.3069, + "MATH Level 5": 0.0053, + "GPQA": 0.2391, + "MUSR": 0.3939, + "MMLU-PRO": 0.1056 + } + }, + { + "model_id": "HeraiHench/Phi-4-slerp-ReasoningRP-14B", + "name": "Phi-4-slerp-ReasoningRP-14B", + "developer": "HeraiHench", + "scores": { + "IFEval": 0.1575, + "BBH": 0.4196, + "MATH Level 5": 0.0, + "GPQA": 0.2936, + "MUSR": 0.3116, + "MMLU-PRO": 0.19 + } + }, + { + "model_id": "HiroseKoichi/Llama-Salad-4x8B-V3", + "name": "Llama-Salad-4x8B-V3", + "developer": "HiroseKoichi", + "scores": { + "IFEval": 0.6654, + "BBH": 0.5245, + "MATH Level 5": 0.0959, + "GPQA": 0.3029, + "MUSR": 0.374, + "MMLU-PRO": 0.3518 + } + }, + { + "model_id": "HoangHa/Pensez-Llama3.1-8B", + "name": "Pensez-Llama3.1-8B", + "developer": "HoangHa", + "scores": { + "IFEval": 0.3887, + "BBH": 0.4669, + "MATH Level 5": 0.1148, + "GPQA": 0.2886, + "MUSR": 0.3597, + "MMLU-PRO": 0.3126 + } + }, + { + "model_id": "HuggingFaceH4/zephyr-7b-alpha", + "name": "zephyr-7b-alpha", + "developer": "HuggingFaceH4", + "scores": { + "IFEval": 0.5191, + "BBH": 0.4583, + "MATH Level 5": 0.0196, + "GPQA": 0.2978, + "MUSR": 0.395, + "MMLU-PRO": 0.2795 + } + }, + { + "model_id": "HuggingFaceH4/zephyr-7b-beta", + "name": "zephyr-7b-beta", + "developer": "HuggingFaceH4", + "scores": { + "IFEval": 0.495, + "BBH": 0.4316, + "MATH Level 5": 0.0287, + "GPQA": 0.2903, + "MUSR": 0.3925, + "MMLU-PRO": 0.2781 + } + }, + { + "model_id": "HuggingFaceH4/zephyr-7b-gemma-v0.1", + "name": "zephyr-7b-gemma-v0.1", + "developer": "HuggingFaceH4", + "scores": { + "IFEval": 0.3364, + "BBH": 0.4624, + "MATH Level 5": 0.0816, + "GPQA": 0.2945, + "MUSR": 0.374, + "MMLU-PRO": 0.2847 + } + }, + { + "model_id": "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1", + "name": "zephyr-orpo-141b-A35b-v0.1", + "developer": "HuggingFaceH4", + "scores": { + "IFEval": 0.6511, + "BBH": 0.629, + "MATH Level 5": 0.2047, + "GPQA": 0.3784, + "MUSR": 0.4465, + "MMLU-PRO": 0.4586 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM-1.7B", + "name": "SmolLM-1.7B", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.2362, + "BBH": 0.3181, + "MATH Level 5": 0.0166, + "GPQA": 0.2416, + "MUSR": 0.3421, + "MMLU-PRO": 0.1148 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM-1.7B-Instruct", + "name": "SmolLM-1.7B-Instruct", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.2348, + "BBH": 0.2885, + "MATH Level 5": 0.0211, + "GPQA": 0.2601, + "MUSR": 0.3487, + "MMLU-PRO": 0.1166 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM-135M", + "name": "SmolLM-135M", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.2125, + "BBH": 0.3046, + "MATH Level 5": 0.0136, + "GPQA": 0.2584, + "MUSR": 0.4366, + "MMLU-PRO": 0.1122 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM-135M-Instruct", + "name": "SmolLM-135M-Instruct", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.1214, + "BBH": 0.3015, + "MATH Level 5": 0.0053, + "GPQA": 0.2592, + "MUSR": 0.3635, + "MMLU-PRO": 0.1176 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM-360M", + "name": "SmolLM-360M", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.2134, + "BBH": 0.3065, + "MATH Level 5": 0.0113, + "GPQA": 0.2676, + "MUSR": 0.4018, + "MMLU-PRO": 0.1124 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM-360M-Instruct", + "name": "SmolLM-360M-Instruct", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.1952, + "BBH": 0.2885, + "MATH Level 5": 0.0181, + "GPQA": 0.2643, + "MUSR": 0.3472, + "MMLU-PRO": 0.1166 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM2-1.7B", + "name": "SmolLM2-1.7B", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.244, + "BBH": 0.3453, + "MATH Level 5": 0.0264, + "GPQA": 0.2794, + "MUSR": 0.3485, + "MMLU-PRO": 0.2138 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM2-1.7B-Instruct", + "name": "SmolLM2-1.7B-Instruct", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.5368, + "BBH": 0.3599, + "MATH Level 5": 0.0582, + "GPQA": 0.2794, + "MUSR": 0.3421, + "MMLU-PRO": 0.2054 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM2-135M", + "name": "SmolLM2-135M", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.1818, + "BBH": 0.3044, + "MATH Level 5": 0.0121, + "GPQA": 0.2483, + "MUSR": 0.4112, + "MMLU-PRO": 0.1095 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM2-135M-Instruct", + "name": "SmolLM2-135M-Instruct", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.2883, + "BBH": 0.3124, + "MATH Level 5": 0.003, + "GPQA": 0.2357, + "MUSR": 0.3662, + "MMLU-PRO": 0.1115 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM2-360M", + "name": "SmolLM2-360M", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.2115, + "BBH": 0.3233, + "MATH Level 5": 0.0121, + "GPQA": 0.2458, + "MUSR": 0.3954, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "HuggingFaceTB/SmolLM2-360M-Instruct", + "name": "SmolLM2-360M-Instruct", + "developer": "HuggingFaceTB", + "scores": { + "IFEval": 0.3842, + "BBH": 0.3144, + "MATH Level 5": 0.0151, + "GPQA": 0.255, + "MUSR": 0.3461, + "MMLU-PRO": 0.1117 + } + }, + { + "model_id": "HumanLLMs/Humanish-LLama3-8B-Instruct", + "name": "Humanish-LLama3-8B-Instruct", + "developer": "HumanLLMs", + "scores": { + "IFEval": 0.6498, + "BBH": 0.4968, + "MATH Level 5": 0.1027, + "GPQA": 0.2559, + "MUSR": 0.3582, + "MMLU-PRO": 0.3702 + } + }, + { + "model_id": "HumanLLMs/Humanish-Mistral-Nemo-Instruct-2407", + "name": "Humanish-Mistral-Nemo-Instruct-2407", + "developer": "HumanLLMs", + "scores": { + "IFEval": 0.5451, + "BBH": 0.5262, + "MATH Level 5": 0.1367, + "GPQA": 0.2878, + "MUSR": 0.3968, + "MMLU-PRO": 0.3521 + } + }, + { + "model_id": "HumanLLMs/Humanish-Qwen2.5-7B-Instruct", + "name": "Humanish-Qwen2.5-7B-Instruct", + "developer": "HumanLLMs", + "scores": { + "IFEval": 0.7284, + "BBH": 0.5364, + "MATH Level 5": 0.5, + "GPQA": 0.2987, + "MUSR": 0.3981, + "MMLU-PRO": 0.4398 + } + }, + { + "model_id": "IDEA-CCNL/Ziya-LLaMA-13B-v1", + "name": "Ziya-LLaMA-13B-v1", + "developer": "IDEA-CCNL", + "scores": { + "IFEval": 0.1697, + "BBH": 0.2877, + "MATH Level 5": 0.0, + "GPQA": 0.2492, + "MUSR": 0.3751, + "MMLU-PRO": 0.1101 + } + }, + { + "model_id": "INSAIT-Institute/BgGPT-Gemma-2-27B-IT-v1.0", + "name": "BgGPT-Gemma-2-27B-IT-v1.0", + "developer": "INSAIT-Institute", + "scores": { + "IFEval": 0.0, + "BBH": 0.2912, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3575, + "MMLU-PRO": 0.1167 + } + }, + { + "model_id": "IlyaGusev/gemma-2-2b-it-abliterated", + "name": "gemma-2-2b-it-abliterated", + "developer": "IlyaGusev", + "scores": { + "IFEval": 0.5331, + "BBH": 0.4119, + "MATH Level 5": 0.0612, + "GPQA": 0.2651, + "MUSR": 0.3782, + "MMLU-PRO": 0.2538 + } + }, + { + "model_id": "IlyaGusev/gemma-2-9b-it-abliterated", + "name": "gemma-2-9b-it-abliterated", + "developer": "IlyaGusev", + "scores": { + "IFEval": 0.7473, + "BBH": 0.5906, + "MATH Level 5": 0.1775, + "GPQA": 0.3456, + "MUSR": 0.4034, + "MMLU-PRO": 0.3915 + } + }, + { + "model_id": "Infinirc/Infinirc-Llama3-8B-2G-Release-v1.0", + "name": "Infinirc-Llama3-8B-2G-Release-v1.0", + "developer": "Infinirc", + "scores": { + "IFEval": 0.2024, + "BBH": 0.4351, + "MATH Level 5": 0.0166, + "GPQA": 0.2995, + "MUSR": 0.4609, + "MMLU-PRO": 0.216 + } + }, + { + "model_id": "Intel/neural-chat-7b-v3", + "name": "neural-chat-7b-v3", + "developer": "Intel", + "scores": { + "IFEval": 0.2778, + "BBH": 0.5048, + "MATH Level 5": 0.0295, + "GPQA": 0.2919, + "MUSR": 0.5055, + "MMLU-PRO": 0.2699 + } + }, + { + "model_id": "Intel/neural-chat-7b-v3-1", + "name": "neural-chat-7b-v3-1", + "developer": "Intel", + "scores": { + "IFEval": 0.4687, + "BBH": 0.5052, + "MATH Level 5": 0.0355, + "GPQA": 0.2903, + "MUSR": 0.4979, + "MMLU-PRO": 0.2678 + } + }, + { + "model_id": "Intel/neural-chat-7b-v3-2", + "name": "neural-chat-7b-v3-2", + "developer": "Intel", + "scores": { + "IFEval": 0.4988, + "BBH": 0.5032, + "MATH Level 5": 0.0476, + "GPQA": 0.2903, + "MUSR": 0.4895, + "MMLU-PRO": 0.2667 + } + }, + { + "model_id": "Intel/neural-chat-7b-v3-3", + "name": "neural-chat-7b-v3-3", + "developer": "Intel", + "scores": { + "IFEval": 0.4763, + "BBH": 0.4877, + "MATH Level 5": 0.0408, + "GPQA": 0.2894, + "MUSR": 0.486, + "MMLU-PRO": 0.2625 + } + }, + { + "model_id": "IntervitensInc/internlm2_5-20b-llamafied", + "name": "internlm2_5-20b-llamafied", + "developer": "IntervitensInc", + "scores": { + "IFEval": 0.341, + "BBH": 0.7478, + "MATH Level 5": 0.1715, + "GPQA": 0.3381, + "MUSR": 0.4475, + "MMLU-PRO": 0.4051 + } + }, + { + "model_id": "Invalid-Null/PeiYangMe-0.5", + "name": "PeiYangMe-0.5", + "developer": "Invalid-Null", + "scores": { + "IFEval": 0.1409, + "BBH": 0.2791, + "MATH Level 5": 0.0, + "GPQA": 0.2441, + "MUSR": 0.3738, + "MMLU-PRO": 0.1109 + } + }, + { + "model_id": "Invalid-Null/PeiYangMe-0.7", + "name": "PeiYangMe-0.7", + "developer": "Invalid-Null", + "scores": { + "IFEval": 0.1491, + "BBH": 0.3028, + "MATH Level 5": 0.0113, + "GPQA": 0.2332, + "MUSR": 0.3857, + "MMLU-PRO": 0.1101 + } + }, + { + "model_id": "Isaak-Carter/JOSIEv4o-8b-stage1-v4", + "name": "JOSIEv4o-8b-stage1-v4", + "developer": "Isaak-Carter", + "scores": { + "IFEval": 0.2477, + "BBH": 0.4758, + "MATH Level 5": 0.0453, + "GPQA": 0.2911, + "MUSR": 0.3641, + "MMLU-PRO": 0.3292 + } + }, + { + "model_id": "Isaak-Carter/Josiefied-Qwen2.5-7B-Instruct-abliterated", + "name": "Josiefied-Qwen2.5-7B-Instruct-abliterated", + "developer": "Isaak-Carter", + "scores": { + "IFEval": 0.7317, + "BBH": 0.5396, + "MATH Level 5": 0.4924, + "GPQA": 0.3029, + "MUSR": 0.4087, + "MMLU-PRO": 0.4276 + } + }, + { + "model_id": "Isaak-Carter/Josiefied-Qwen2.5-7B-Instruct-abliterated-v2", + "name": "Josiefied-Qwen2.5-7B-Instruct-abliterated-v2", + "developer": "Isaak-Carter", + "scores": { + "IFEval": 0.7841, + "BBH": 0.5311, + "MATH Level 5": 0.4721, + "GPQA": 0.2987, + "MUSR": 0.4354, + "MMLU-PRO": 0.4128 + } + }, + { + "model_id": "J-LAB/Thynk_orpo", + "name": "Thynk_orpo", + "developer": "J-LAB", + "scores": { + "IFEval": 0.2102, + "BBH": 0.4463, + "MATH Level 5": 0.148, + "GPQA": 0.2928, + "MUSR": 0.4515, + "MMLU-PRO": 0.3231 + } + }, + { + "model_id": "JackFram/llama-160m", + "name": "llama-160m", + "developer": "JackFram", + "scores": { + "IFEval": 0.1791, + "BBH": 0.2888, + "MATH Level 5": 0.0083, + "GPQA": 0.2617, + "MUSR": 0.3792, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "JackFram/llama-68m", + "name": "llama-68m", + "developer": "JackFram", + "scores": { + "IFEval": 0.1726, + "BBH": 0.2936, + "MATH Level 5": 0.006, + "GPQA": 0.2584, + "MUSR": 0.391, + "MMLU-PRO": 0.1144 + } + }, + { + "model_id": "Jacoby746/Casual-Magnum-34B", + "name": "Casual-Magnum-34B", + "developer": "Jacoby746", + "scores": { + "IFEval": 0.193, + "BBH": 0.6032, + "MATH Level 5": 0.0921, + "GPQA": 0.3725, + "MUSR": 0.4078, + "MMLU-PRO": 0.5184 + } + }, + { + "model_id": "Jacoby746/Inf-Silent-Kunoichi-v0.1-2x7B", + "name": "Inf-Silent-Kunoichi-v0.1-2x7B", + "developer": "Jacoby746", + "scores": { + "IFEval": 0.388, + "BBH": 0.5185, + "MATH Level 5": 0.071, + "GPQA": 0.2894, + "MUSR": 0.428, + "MMLU-PRO": 0.3271 + } + }, + { + "model_id": "Jacoby746/Inf-Silent-Kunoichi-v0.2-2x7B", + "name": "Inf-Silent-Kunoichi-v0.2-2x7B", + "developer": "Jacoby746", + "scores": { + "IFEval": 0.3636, + "BBH": 0.5209, + "MATH Level 5": 0.0627, + "GPQA": 0.3003, + "MUSR": 0.432, + "MMLU-PRO": 0.3272 + } + }, + { + "model_id": "Jacoby746/Proto-Athena-4x7B", + "name": "Proto-Athena-4x7B", + "developer": "Jacoby746", + "scores": { + "IFEval": 0.3703, + "BBH": 0.5107, + "MATH Level 5": 0.065, + "GPQA": 0.2945, + "MUSR": 0.4348, + "MMLU-PRO": 0.3206 + } + }, + { + "model_id": "Jacoby746/Proto-Athena-v0.2-4x7B", + "name": "Proto-Athena-v0.2-4x7B", + "developer": "Jacoby746", + "scores": { + "IFEval": 0.3752, + "BBH": 0.5068, + "MATH Level 5": 0.0634, + "GPQA": 0.2987, + "MUSR": 0.4213, + "MMLU-PRO": 0.3197 + } + }, + { + "model_id": "Jacoby746/Proto-Harpy-Blazing-Light-v0.1-2x7B", + "name": "Proto-Harpy-Blazing-Light-v0.1-2x7B", + "developer": "Jacoby746", + "scores": { + "IFEval": 0.4905, + "BBH": 0.5187, + "MATH Level 5": 0.0748, + "GPQA": 0.2953, + "MUSR": 0.445, + "MMLU-PRO": 0.3301 + } + }, + { + "model_id": "Jacoby746/Proto-Harpy-Spark-v0.1-7B", + "name": "Proto-Harpy-Spark-v0.1-7B", + "developer": "Jacoby746", + "scores": { + "IFEval": 0.4333, + "BBH": 0.4736, + "MATH Level 5": 0.0619, + "GPQA": 0.3054, + "MUSR": 0.4317, + "MMLU-PRO": 0.3069 + } + }, + { + "model_id": "JayHyeon/Qwen-0.5B-DPO-1epoch", + "name": "Qwen-0.5B-DPO-1epoch", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2647, + "BBH": 0.3191, + "MATH Level 5": 0.0287, + "GPQA": 0.2525, + "MUSR": 0.3352, + "MMLU-PRO": 0.1558 + } + }, + { + "model_id": "JayHyeon/Qwen-0.5B-DPO-5epoch", + "name": "Qwen-0.5B-DPO-5epoch", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.257, + "BBH": 0.3112, + "MATH Level 5": 0.04, + "GPQA": 0.2433, + "MUSR": 0.338, + "MMLU-PRO": 0.1533 + } + }, + { + "model_id": "JayHyeon/Qwen-0.5B-IRPO-1epoch", + "name": "Qwen-0.5B-IRPO-1epoch", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2589, + "BBH": 0.3164, + "MATH Level 5": 0.0317, + "GPQA": 0.2466, + "MUSR": 0.3286, + "MMLU-PRO": 0.15 + } + }, + { + "model_id": "JayHyeon/Qwen-0.5B-IRPO-5epoch", + "name": "Qwen-0.5B-IRPO-5epoch", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2487, + "BBH": 0.3189, + "MATH Level 5": 0.0325, + "GPQA": 0.2399, + "MUSR": 0.3287, + "MMLU-PRO": 0.1507 + } + }, + { + "model_id": "JayHyeon/Qwen-0.5B-eDPO-1epoch", + "name": "Qwen-0.5B-eDPO-1epoch", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2623, + "BBH": 0.3181, + "MATH Level 5": 0.0347, + "GPQA": 0.2424, + "MUSR": 0.3327, + "MMLU-PRO": 0.1553 + } + }, + { + "model_id": "JayHyeon/Qwen-0.5B-eDPO-5epoch", + "name": "Qwen-0.5B-eDPO-5epoch", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2477, + "BBH": 0.3096, + "MATH Level 5": 0.0234, + "GPQA": 0.2492, + "MUSR": 0.3326, + "MMLU-PRO": 0.1523 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-Instruct-SFT", + "name": "Qwen2.5-0.5B-Instruct-SFT", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2768, + "BBH": 0.3254, + "MATH Level 5": 0.0393, + "GPQA": 0.2827, + "MUSR": 0.3342, + "MMLU-PRO": 0.152 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-Instruct-SFT-DPO-1epoch_v1", + "name": "Qwen2.5-0.5B-Instruct-SFT-DPO-1epoch_v1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2469, + "BBH": 0.326, + "MATH Level 5": 0.065, + "GPQA": 0.2727, + "MUSR": 0.3434, + "MMLU-PRO": 0.1575 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-Instruct-SFT-IRPO-1epoch_v1", + "name": "Qwen2.5-0.5B-Instruct-SFT-IRPO-1epoch_v1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2606, + "BBH": 0.3308, + "MATH Level 5": 0.0498, + "GPQA": 0.2802, + "MUSR": 0.3288, + "MMLU-PRO": 0.1626 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-Instruct-SFT-MDPO-1epoch_v1", + "name": "Qwen2.5-0.5B-Instruct-SFT-MDPO-1epoch_v1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2529, + "BBH": 0.3262, + "MATH Level 5": 0.0566, + "GPQA": 0.2685, + "MUSR": 0.3301, + "MMLU-PRO": 0.1576 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT", + "name": "Qwen2.5-0.5B-SFT", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.1964, + "BBH": 0.3121, + "MATH Level 5": 0.0272, + "GPQA": 0.2785, + "MUSR": 0.3394, + "MMLU-PRO": 0.1673 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-4", + "name": "Qwen2.5-0.5B-SFT-1e-4", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.202, + "BBH": 0.3017, + "MATH Level 5": 0.0189, + "GPQA": 0.2508, + "MUSR": 0.3446, + "MMLU-PRO": 0.1619 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-4-2ep", + "name": "Qwen2.5-0.5B-SFT-1e-4-2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.214, + "BBH": 0.3172, + "MATH Level 5": 0.0264, + "GPQA": 0.2466, + "MUSR": 0.3473, + "MMLU-PRO": 0.1537 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-4-3ep", + "name": "Qwen2.5-0.5B-SFT-1e-4-3ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2257, + "BBH": 0.3064, + "MATH Level 5": 0.0264, + "GPQA": 0.2483, + "MUSR": 0.3661, + "MMLU-PRO": 0.1532 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-4-5ep", + "name": "Qwen2.5-0.5B-SFT-1e-4-5ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.1987, + "BBH": 0.3104, + "MATH Level 5": 0.0196, + "GPQA": 0.2534, + "MUSR": 0.3407, + "MMLU-PRO": 0.1558 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-5", + "name": "Qwen2.5-0.5B-SFT-1e-5", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.1986, + "BBH": 0.314, + "MATH Level 5": 0.0378, + "GPQA": 0.2685, + "MUSR": 0.346, + "MMLU-PRO": 0.1698 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-5-2ep", + "name": "Qwen2.5-0.5B-SFT-1e-5-2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.1971, + "BBH": 0.3225, + "MATH Level 5": 0.0529, + "GPQA": 0.2693, + "MUSR": 0.3368, + "MMLU-PRO": 0.1651 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-5-3ep", + "name": "Qwen2.5-0.5B-SFT-1e-5-3ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2241, + "BBH": 0.3247, + "MATH Level 5": 0.0536, + "GPQA": 0.2701, + "MUSR": 0.3353, + "MMLU-PRO": 0.1689 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-1e-5-5ep", + "name": "Qwen2.5-0.5B-SFT-1e-5-5ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2292, + "BBH": 0.3259, + "MATH Level 5": 0.0521, + "GPQA": 0.2794, + "MUSR": 0.3235, + "MMLU-PRO": 0.1688 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-4", + "name": "Qwen2.5-0.5B-SFT-2e-4", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2034, + "BBH": 0.2936, + "MATH Level 5": 0.0242, + "GPQA": 0.2576, + "MUSR": 0.3434, + "MMLU-PRO": 0.1413 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-4-2ep", + "name": "Qwen2.5-0.5B-SFT-2e-4-2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.1831, + "BBH": 0.2984, + "MATH Level 5": 0.0249, + "GPQA": 0.2424, + "MUSR": 0.3568, + "MMLU-PRO": 0.1484 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-4-3ep", + "name": "Qwen2.5-0.5B-SFT-2e-4-3ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.199, + "BBH": 0.311, + "MATH Level 5": 0.0151, + "GPQA": 0.2609, + "MUSR": 0.3449, + "MMLU-PRO": 0.1416 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-4-5ep", + "name": "Qwen2.5-0.5B-SFT-2e-4-5ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.1897, + "BBH": 0.2936, + "MATH Level 5": 0.0181, + "GPQA": 0.2693, + "MUSR": 0.3874, + "MMLU-PRO": 0.1336 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5", + "name": "Qwen2.5-0.5B-SFT-2e-5", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2068, + "BBH": 0.3204, + "MATH Level 5": 0.037, + "GPQA": 0.2693, + "MUSR": 0.3487, + "MMLU-PRO": 0.1678 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2201, + "BBH": 0.3217, + "MATH Level 5": 0.0408, + "GPQA": 0.2777, + "MUSR": 0.3367, + "MMLU-PRO": 0.171 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_3e-7-3ep_0alp_5lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_3e-7-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2411, + "BBH": 0.3167, + "MATH Level 5": 0.0347, + "GPQA": 0.271, + "MUSR": 0.3301, + "MMLU-PRO": 0.1562 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-6-1ep_0alp_5lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-6-1ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2369, + "BBH": 0.326, + "MATH Level 5": 0.0453, + "GPQA": 0.276, + "MUSR": 0.3355, + "MMLU-PRO": 0.157 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-6-2ep_0alp_5lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-6-2ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2262, + "BBH": 0.3262, + "MATH Level 5": 0.0347, + "GPQA": 0.2794, + "MUSR": 0.3408, + "MMLU-PRO": 0.1541 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-6-3ep_0alp_5lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-6-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2508, + "BBH": 0.3199, + "MATH Level 5": 0.0408, + "GPQA": 0.276, + "MUSR": 0.3355, + "MMLU-PRO": 0.1555 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-7-1ep_0alp_5lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-7-1ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.239, + "BBH": 0.3182, + "MATH Level 5": 0.04, + "GPQA": 0.2676, + "MUSR": 0.3328, + "MMLU-PRO": 0.156 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-7-2ep_0alp_5lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-7-2ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2423, + "BBH": 0.3154, + "MATH Level 5": 0.0347, + "GPQA": 0.2676, + "MUSR": 0.3328, + "MMLU-PRO": 0.1548 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-7-3ep_0alp_5lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPOP_5e-7-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2493, + "BBH": 0.319, + "MATH Level 5": 0.0438, + "GPQA": 0.2651, + "MUSR": 0.3341, + "MMLU-PRO": 0.1561 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-6-1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-6-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2542, + "BBH": 0.3167, + "MATH Level 5": 0.0408, + "GPQA": 0.2718, + "MUSR": 0.3289, + "MMLU-PRO": 0.158 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-6-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-6-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2451, + "BBH": 0.316, + "MATH Level 5": 0.0408, + "GPQA": 0.2743, + "MUSR": 0.3302, + "MMLU-PRO": 0.1561 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2557, + "BBH": 0.3142, + "MATH Level 5": 0.04, + "GPQA": 0.2743, + "MUSR": 0.3315, + "MMLU-PRO": 0.1575 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-7-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-7-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2605, + "BBH": 0.3167, + "MATH Level 5": 0.0363, + "GPQA": 0.2701, + "MUSR": 0.3341, + "MMLU-PRO": 0.1577 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-7-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_1e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2578, + "BBH": 0.3173, + "MATH Level 5": 0.0355, + "GPQA": 0.2634, + "MUSR": 0.3288, + "MMLU-PRO": 0.1583 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_2e-6-1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_2e-6-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2335, + "BBH": 0.3198, + "MATH Level 5": 0.0385, + "GPQA": 0.2752, + "MUSR": 0.3276, + "MMLU-PRO": 0.1581 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_2e-6-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_2e-6-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2472, + "BBH": 0.3226, + "MATH Level 5": 0.0506, + "GPQA": 0.276, + "MUSR": 0.3262, + "MMLU-PRO": 0.1538 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_2e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_2e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2474, + "BBH": 0.3229, + "MATH Level 5": 0.0415, + "GPQA": 0.2727, + "MUSR": 0.3275, + "MMLU-PRO": 0.1539 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2403, + "BBH": 0.3245, + "MATH Level 5": 0.0431, + "GPQA": 0.2819, + "MUSR": 0.3262, + "MMLU-PRO": 0.1573 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2368, + "BBH": 0.3224, + "MATH Level 5": 0.0461, + "GPQA": 0.2743, + "MUSR": 0.3355, + "MMLU-PRO": 0.1516 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2372, + "BBH": 0.3248, + "MATH Level 5": 0.0476, + "GPQA": 0.2701, + "MUSR": 0.3394, + "MMLU-PRO": 0.155 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-7-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_3e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2499, + "BBH": 0.3181, + "MATH Level 5": 0.0415, + "GPQA": 0.2651, + "MUSR": 0.3288, + "MMLU-PRO": 0.1574 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2381, + "BBH": 0.3242, + "MATH Level 5": 0.0498, + "GPQA": 0.2743, + "MUSR": 0.3328, + "MMLU-PRO": 0.1572 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2421, + "BBH": 0.3225, + "MATH Level 5": 0.04, + "GPQA": 0.2802, + "MUSR": 0.3408, + "MMLU-PRO": 0.1496 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2381, + "BBH": 0.3265, + "MATH Level 5": 0.0446, + "GPQA": 0.276, + "MUSR": 0.3408, + "MMLU-PRO": 0.1499 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-7_1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-7_1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2526, + "BBH": 0.3177, + "MATH Level 5": 0.0438, + "GPQA": 0.2735, + "MUSR": 0.3342, + "MMLU-PRO": 0.1572 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-7_2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-7_2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2457, + "BBH": 0.316, + "MATH Level 5": 0.0446, + "GPQA": 0.2727, + "MUSR": 0.3302, + "MMLU-PRO": 0.1572 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-7_3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_5e-7_3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2442, + "BBH": 0.3194, + "MATH Level 5": 0.0483, + "GPQA": 0.2735, + "MUSR": 0.3315, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2604, + "BBH": 0.3178, + "MATH Level 5": 0.0355, + "GPQA": 0.276, + "MUSR": 0.3288, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.249, + "BBH": 0.3173, + "MATH Level 5": 0.0393, + "GPQA": 0.271, + "MUSR": 0.3302, + "MMLU-PRO": 0.1569 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-DPO_7e-7_3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2604, + "BBH": 0.315, + "MATH Level 5": 0.0378, + "GPQA": 0.2743, + "MUSR": 0.3342, + "MMLU-PRO": 0.1566 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_1e-7-1ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_1e-7-1ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.255, + "BBH": 0.3211, + "MATH Level 5": 0.0491, + "GPQA": 0.2701, + "MUSR": 0.3288, + "MMLU-PRO": 0.1571 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_1e-7-2ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_1e-7-2ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2478, + "BBH": 0.3198, + "MATH Level 5": 0.0423, + "GPQA": 0.2668, + "MUSR": 0.3315, + "MMLU-PRO": 0.1587 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_1e-7-3ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_1e-7-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2475, + "BBH": 0.3225, + "MATH Level 5": 0.04, + "GPQA": 0.271, + "MUSR": 0.3301, + "MMLU-PRO": 0.1556 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_3e-7-3ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_3e-7-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.259, + "BBH": 0.3185, + "MATH Level 5": 0.0363, + "GPQA": 0.2727, + "MUSR": 0.3275, + "MMLU-PRO": 0.1586 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-1ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-1ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2323, + "BBH": 0.3179, + "MATH Level 5": 0.0453, + "GPQA": 0.2827, + "MUSR": 0.3262, + "MMLU-PRO": 0.1548 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-2ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-2ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2315, + "BBH": 0.326, + "MATH Level 5": 0.0415, + "GPQA": 0.2701, + "MUSR": 0.3383, + "MMLU-PRO": 0.1521 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-3ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-6-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2298, + "BBH": 0.332, + "MATH Level 5": 0.0431, + "GPQA": 0.2659, + "MUSR": 0.3329, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-1ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-1ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2469, + "BBH": 0.3179, + "MATH Level 5": 0.0415, + "GPQA": 0.2794, + "MUSR": 0.3302, + "MMLU-PRO": 0.1575 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-2ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-2ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.252, + "BBH": 0.3168, + "MATH Level 5": 0.037, + "GPQA": 0.2752, + "MUSR": 0.3328, + "MMLU-PRO": 0.1576 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-3ep_1alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-IRPO_5e-7-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2666, + "BBH": 0.3191, + "MATH Level 5": 0.0347, + "GPQA": 0.2718, + "MUSR": 0.3289, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2499, + "BBH": 0.3178, + "MATH Level 5": 0.037, + "GPQA": 0.2651, + "MUSR": 0.3341, + "MMLU-PRO": 0.1562 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2417, + "BBH": 0.3178, + "MATH Level 5": 0.04, + "GPQA": 0.2685, + "MUSR": 0.3328, + "MMLU-PRO": 0.1575 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_0.5_1e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2562, + "BBH": 0.319, + "MATH Level 5": 0.0423, + "GPQA": 0.2659, + "MUSR": 0.3341, + "MMLU-PRO": 0.1576 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_1e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_1e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2408, + "BBH": 0.3165, + "MATH Level 5": 0.0431, + "GPQA": 0.2735, + "MUSR": 0.3315, + "MMLU-PRO": 0.1557 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_1e-6_1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_1e-6_1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2481, + "BBH": 0.3204, + "MATH Level 5": 0.0476, + "GPQA": 0.276, + "MUSR": 0.3302, + "MMLU-PRO": 0.1592 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_1e-6_2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_1e-6_2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2545, + "BBH": 0.3186, + "MATH Level 5": 0.0498, + "GPQA": 0.2718, + "MUSR": 0.3289, + "MMLU-PRO": 0.1561 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_2e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_2e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.252, + "BBH": 0.3204, + "MATH Level 5": 0.0393, + "GPQA": 0.2727, + "MUSR": 0.3262, + "MMLU-PRO": 0.1538 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_2e-6_1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_2e-6_1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2315, + "BBH": 0.3213, + "MATH Level 5": 0.0453, + "GPQA": 0.2802, + "MUSR": 0.3222, + "MMLU-PRO": 0.1582 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_2e-6_2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_2e-6_2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2515, + "BBH": 0.3187, + "MATH Level 5": 0.0431, + "GPQA": 0.2718, + "MUSR": 0.3289, + "MMLU-PRO": 0.1539 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_3e-6-1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_3e-6-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2472, + "BBH": 0.3213, + "MATH Level 5": 0.0347, + "GPQA": 0.2727, + "MUSR": 0.3262, + "MMLU-PRO": 0.1588 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_3e-6-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_3e-6-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.246, + "BBH": 0.3234, + "MATH Level 5": 0.0378, + "GPQA": 0.2794, + "MUSR": 0.3302, + "MMLU-PRO": 0.1533 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_3e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_3e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2524, + "BBH": 0.3256, + "MATH Level 5": 0.0536, + "GPQA": 0.2777, + "MUSR": 0.3368, + "MMLU-PRO": 0.1531 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-6-1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-6-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2265, + "BBH": 0.3252, + "MATH Level 5": 0.0476, + "GPQA": 0.2735, + "MUSR": 0.3262, + "MMLU-PRO": 0.1568 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-6-2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-6-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2302, + "BBH": 0.3224, + "MATH Level 5": 0.0438, + "GPQA": 0.2768, + "MUSR": 0.3408, + "MMLU-PRO": 0.15 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-6-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2524, + "BBH": 0.3278, + "MATH Level 5": 0.0408, + "GPQA": 0.2777, + "MUSR": 0.3395, + "MMLU-PRO": 0.1521 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-7-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2658, + "BBH": 0.3175, + "MATH Level 5": 0.0363, + "GPQA": 0.2617, + "MUSR": 0.3302, + "MMLU-PRO": 0.1575 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-7_1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-7_1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2487, + "BBH": 0.3189, + "MATH Level 5": 0.0378, + "GPQA": 0.2718, + "MUSR": 0.3275, + "MMLU-PRO": 0.1595 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-7_2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_5e-7_2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.256, + "BBH": 0.3159, + "MATH Level 5": 0.0378, + "GPQA": 0.2768, + "MUSR": 0.3275, + "MMLU-PRO": 0.1562 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_7e-7-3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_7e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2499, + "BBH": 0.3156, + "MATH Level 5": 0.04, + "GPQA": 0.2701, + "MUSR": 0.3302, + "MMLU-PRO": 0.1556 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_7e-7_1ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_7e-7_1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2496, + "BBH": 0.3177, + "MATH Level 5": 0.0453, + "GPQA": 0.2626, + "MUSR": 0.3315, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_7e-7_2ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-2ep-MDPO_7e-7_2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2515, + "BBH": 0.3172, + "MATH Level 5": 0.0438, + "GPQA": 0.2701, + "MUSR": 0.3275, + "MMLU-PRO": 0.1553 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-3ep", + "name": "Qwen2.5-0.5B-SFT-2e-5-3ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2281, + "BBH": 0.324, + "MATH Level 5": 0.0453, + "GPQA": 0.2617, + "MUSR": 0.3301, + "MMLU-PRO": 0.1746 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep", + "name": "Qwen2.5-0.5B-SFT-2e-5-5ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2348, + "BBH": 0.3308, + "MATH Level 5": 0.0506, + "GPQA": 0.2643, + "MUSR": 0.3409, + "MMLU-PRO": 0.1695 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2526, + "BBH": 0.3238, + "MATH Level 5": 0.0393, + "GPQA": 0.2676, + "MUSR": 0.3528, + "MMLU-PRO": 0.1574 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam_1ep", + "name": "Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam_1ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2481, + "BBH": 0.3175, + "MATH Level 5": 0.0385, + "GPQA": 0.2626, + "MUSR": 0.3475, + "MMLU-PRO": 0.1597 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam_2ep", + "name": "Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_5e-7_3ep_0alp_0lam_2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2548, + "BBH": 0.3199, + "MATH Level 5": 0.0385, + "GPQA": 0.2651, + "MUSR": 0.3435, + "MMLU-PRO": 0.1562 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam", + "name": "Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2423, + "BBH": 0.3219, + "MATH Level 5": 0.034, + "GPQA": 0.2701, + "MUSR": 0.3515, + "MMLU-PRO": 0.1563 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam_1ep", + "name": "Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam_1ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2493, + "BBH": 0.3191, + "MATH Level 5": 0.0393, + "GPQA": 0.2685, + "MUSR": 0.3475, + "MMLU-PRO": 0.1592 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam_2ep", + "name": "Qwen2.5-0.5B-SFT-2e-5-5ep-MDPO_7e-7_3ep_0alp_0lam_2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2478, + "BBH": 0.3218, + "MATH Level 5": 0.0415, + "GPQA": 0.2693, + "MUSR": 0.3515, + "MMLU-PRO": 0.1556 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-5e-5", + "name": "Qwen2.5-0.5B-SFT-5e-5", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.201, + "BBH": 0.3109, + "MATH Level 5": 0.034, + "GPQA": 0.2676, + "MUSR": 0.3381, + "MMLU-PRO": 0.1672 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-5e-5-2ep", + "name": "Qwen2.5-0.5B-SFT-5e-5-2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2175, + "BBH": 0.318, + "MATH Level 5": 0.0378, + "GPQA": 0.2601, + "MUSR": 0.3368, + "MMLU-PRO": 0.1627 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-5e-5-3ep", + "name": "Qwen2.5-0.5B-SFT-5e-5-3ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2199, + "BBH": 0.3297, + "MATH Level 5": 0.0302, + "GPQA": 0.2534, + "MUSR": 0.3593, + "MMLU-PRO": 0.1651 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-5e-5-5ep", + "name": "Qwen2.5-0.5B-SFT-5e-5-5ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2077, + "BBH": 0.3276, + "MATH Level 5": 0.0272, + "GPQA": 0.2685, + "MUSR": 0.3766, + "MMLU-PRO": 0.1587 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-7e-5", + "name": "Qwen2.5-0.5B-SFT-7e-5", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2093, + "BBH": 0.3158, + "MATH Level 5": 0.0302, + "GPQA": 0.2567, + "MUSR": 0.3367, + "MMLU-PRO": 0.1622 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-7e-5-2ep", + "name": "Qwen2.5-0.5B-SFT-7e-5-2ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2156, + "BBH": 0.31, + "MATH Level 5": 0.0393, + "GPQA": 0.2424, + "MUSR": 0.3367, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-7e-5-3ep", + "name": "Qwen2.5-0.5B-SFT-7e-5-3ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2381, + "BBH": 0.3199, + "MATH Level 5": 0.0332, + "GPQA": 0.2366, + "MUSR": 0.3554, + "MMLU-PRO": 0.1522 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-7e-5-5ep", + "name": "Qwen2.5-0.5B-SFT-7e-5-5ep", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.212, + "BBH": 0.32, + "MATH Level 5": 0.0219, + "GPQA": 0.2458, + "MUSR": 0.3713, + "MMLU-PRO": 0.1628 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-DPO-1epoch_v1", + "name": "Qwen2.5-0.5B-SFT-DPO-1epoch_v1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2025, + "BBH": 0.3268, + "MATH Level 5": 0.0363, + "GPQA": 0.2727, + "MUSR": 0.3209, + "MMLU-PRO": 0.133 + } + }, + { + "model_id": "JayHyeon/Qwen2.5-0.5B-SFT-MDPO-1epoch_v1", + "name": "Qwen2.5-0.5B-SFT-MDPO-1epoch_v1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.1964, + "BBH": 0.3293, + "MATH Level 5": 0.0468, + "GPQA": 0.276, + "MUSR": 0.3262, + "MMLU-PRO": 0.1337 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_1e-6-3ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_1e-6-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2532, + "BBH": 0.314, + "MATH Level 5": 0.0491, + "GPQA": 0.2743, + "MUSR": 0.3315, + "MMLU-PRO": 0.1566 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_1e-7-3ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_1e-7-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.267, + "BBH": 0.3189, + "MATH Level 5": 0.0408, + "GPQA": 0.2668, + "MUSR": 0.3288, + "MMLU-PRO": 0.1562 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_3e-6-1ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_3e-6-1ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2481, + "BBH": 0.3261, + "MATH Level 5": 0.0438, + "GPQA": 0.2601, + "MUSR": 0.3368, + "MMLU-PRO": 0.1565 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_3e-6-2ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_3e-6-2ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2383, + "BBH": 0.3218, + "MATH Level 5": 0.0431, + "GPQA": 0.2794, + "MUSR": 0.3342, + "MMLU-PRO": 0.1503 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_3e-6-3ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_3e-6-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2471, + "BBH": 0.3224, + "MATH Level 5": 0.04, + "GPQA": 0.2701, + "MUSR": 0.3328, + "MMLU-PRO": 0.1533 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_3e-7-1ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_3e-7-1ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2447, + "BBH": 0.3181, + "MATH Level 5": 0.0438, + "GPQA": 0.2617, + "MUSR": 0.3341, + "MMLU-PRO": 0.1565 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_3e-7-2ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_3e-7-2ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2551, + "BBH": 0.3194, + "MATH Level 5": 0.0446, + "GPQA": 0.2617, + "MUSR": 0.3262, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_3e-7-3ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_3e-7-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2538, + "BBH": 0.3153, + "MATH Level 5": 0.0415, + "GPQA": 0.2676, + "MUSR": 0.3261, + "MMLU-PRO": 0.1583 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_5e-7-1ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_5e-7-1ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2402, + "BBH": 0.3168, + "MATH Level 5": 0.0378, + "GPQA": 0.2718, + "MUSR": 0.3328, + "MMLU-PRO": 0.1568 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_5e-7-2ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_5e-7-2ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2484, + "BBH": 0.3211, + "MATH Level 5": 0.0438, + "GPQA": 0.2701, + "MUSR": 0.3288, + "MMLU-PRO": 0.1573 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPOP_5e-7-3ep_0alp_5lam", + "name": "Qwen_0.5-DPOP_5e-7-3ep_0alp_5lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2578, + "BBH": 0.3203, + "MATH Level 5": 0.0423, + "GPQA": 0.271, + "MUSR": 0.3289, + "MMLU-PRO": 0.1583 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_1e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-DPO_1e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2316, + "BBH": 0.3258, + "MATH Level 5": 0.0529, + "GPQA": 0.2693, + "MUSR": 0.3221, + "MMLU-PRO": 0.158 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_1e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-DPO_1e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.236, + "BBH": 0.3225, + "MATH Level 5": 0.0438, + "GPQA": 0.271, + "MUSR": 0.3222, + "MMLU-PRO": 0.1596 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_3e-6-1ep_0alp_0lam", + "name": "Qwen_0.5-DPO_3e-6-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2337, + "BBH": 0.3132, + "MATH Level 5": 0.0347, + "GPQA": 0.2609, + "MUSR": 0.3235, + "MMLU-PRO": 0.1533 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_3e-6-2ep_0alp_0lam", + "name": "Qwen_0.5-DPO_3e-6-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2569, + "BBH": 0.3276, + "MATH Level 5": 0.0544, + "GPQA": 0.2718, + "MUSR": 0.3156, + "MMLU-PRO": 0.1565 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_3e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-DPO_3e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.246, + "BBH": 0.3267, + "MATH Level 5": 0.0431, + "GPQA": 0.2685, + "MUSR": 0.3209, + "MMLU-PRO": 0.1543 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_3e-7-1ep_0alp_0lam", + "name": "Qwen_0.5-DPO_3e-7-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2529, + "BBH": 0.3229, + "MATH Level 5": 0.0551, + "GPQA": 0.2676, + "MUSR": 0.3195, + "MMLU-PRO": 0.1597 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_3e-7-2ep_0alp_0lam", + "name": "Qwen_0.5-DPO_3e-7-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2505, + "BBH": 0.3256, + "MATH Level 5": 0.0476, + "GPQA": 0.2718, + "MUSR": 0.3195, + "MMLU-PRO": 0.1599 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_3e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-DPO_3e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2387, + "BBH": 0.3258, + "MATH Level 5": 0.0446, + "GPQA": 0.2743, + "MUSR": 0.3169, + "MMLU-PRO": 0.1589 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_5e-7-1ep_0alp_0lam", + "name": "Qwen_0.5-DPO_5e-7-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2532, + "BBH": 0.3218, + "MATH Level 5": 0.0634, + "GPQA": 0.2685, + "MUSR": 0.3209, + "MMLU-PRO": 0.1593 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_5e-7-2ep_0alp_0lam", + "name": "Qwen_0.5-DPO_5e-7-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2456, + "BBH": 0.3299, + "MATH Level 5": 0.0536, + "GPQA": 0.271, + "MUSR": 0.3181, + "MMLU-PRO": 0.1602 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-DPO_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-DPO_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2423, + "BBH": 0.3271, + "MATH Level 5": 0.0514, + "GPQA": 0.2743, + "MUSR": 0.3181, + "MMLU-PRO": 0.1595 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IPO_5e-7-1ep_0alp_0lam", + "name": "Qwen_0.5-IPO_5e-7-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2574, + "BBH": 0.3279, + "MATH Level 5": 0.0559, + "GPQA": 0.2693, + "MUSR": 0.3169, + "MMLU-PRO": 0.1651 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IPO_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-IPO_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.3072, + "BBH": 0.3264, + "MATH Level 5": 0.0582, + "GPQA": 0.2567, + "MUSR": 0.3156, + "MMLU-PRO": 0.1624 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_1e-6-3ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_1e-6-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2551, + "BBH": 0.3242, + "MATH Level 5": 0.0468, + "GPQA": 0.2668, + "MUSR": 0.3182, + "MMLU-PRO": 0.1574 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_1e-7-3ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_1e-7-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2636, + "BBH": 0.3198, + "MATH Level 5": 0.0514, + "GPQA": 0.276, + "MUSR": 0.3262, + "MMLU-PRO": 0.1586 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_3e-6-1ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_3e-6-1ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2323, + "BBH": 0.3255, + "MATH Level 5": 0.037, + "GPQA": 0.2508, + "MUSR": 0.3169, + "MMLU-PRO": 0.1612 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_3e-6-2ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_3e-6-2ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2414, + "BBH": 0.3314, + "MATH Level 5": 0.0347, + "GPQA": 0.2517, + "MUSR": 0.3342, + "MMLU-PRO": 0.1532 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_3e-6-3ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_3e-6-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2678, + "BBH": 0.3362, + "MATH Level 5": 0.0514, + "GPQA": 0.2542, + "MUSR": 0.3382, + "MMLU-PRO": 0.1561 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_3e-7-1ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_3e-7-1ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2561, + "BBH": 0.3231, + "MATH Level 5": 0.0536, + "GPQA": 0.2718, + "MUSR": 0.3196, + "MMLU-PRO": 0.1589 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_3e-7-3ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_3e-7-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2639, + "BBH": 0.3257, + "MATH Level 5": 0.0476, + "GPQA": 0.2701, + "MUSR": 0.3209, + "MMLU-PRO": 0.1587 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_5e-7-1ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_5e-7-1ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2518, + "BBH": 0.3214, + "MATH Level 5": 0.0574, + "GPQA": 0.2735, + "MUSR": 0.3169, + "MMLU-PRO": 0.1585 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_5e-7-2ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_5e-7-2ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2438, + "BBH": 0.3266, + "MATH Level 5": 0.0619, + "GPQA": 0.2727, + "MUSR": 0.3196, + "MMLU-PRO": 0.1554 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-IRPO_5e-7-3ep_1alp_0lam", + "name": "Qwen_0.5-IRPO_5e-7-3ep_1alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2465, + "BBH": 0.3246, + "MATH Level 5": 0.0529, + "GPQA": 0.2718, + "MUSR": 0.3182, + "MMLU-PRO": 0.1563 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.1_3e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.1_3e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2506, + "BBH": 0.3261, + "MATH Level 5": 0.0498, + "GPQA": 0.2819, + "MUSR": 0.3382, + "MMLU-PRO": 0.1522 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.1_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.1_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2457, + "BBH": 0.318, + "MATH Level 5": 0.0347, + "GPQA": 0.2634, + "MUSR": 0.3315, + "MMLU-PRO": 0.1566 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.3_3e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.3_3e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2454, + "BBH": 0.3216, + "MATH Level 5": 0.0506, + "GPQA": 0.2802, + "MUSR": 0.3382, + "MMLU-PRO": 0.1544 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.3_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.3_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2342, + "BBH": 0.3189, + "MATH Level 5": 0.04, + "GPQA": 0.2701, + "MUSR": 0.3302, + "MMLU-PRO": 0.158 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_1e-5-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_1e-5-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.232, + "BBH": 0.3234, + "MATH Level 5": 0.0393, + "GPQA": 0.2743, + "MUSR": 0.3369, + "MMLU-PRO": 0.1543 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_3e-7-1ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_3e-7-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2418, + "BBH": 0.3175, + "MATH Level 5": 0.0423, + "GPQA": 0.2626, + "MUSR": 0.3288, + "MMLU-PRO": 0.158 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_3e-7-2ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_3e-7-2ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2493, + "BBH": 0.3197, + "MATH Level 5": 0.0423, + "GPQA": 0.2701, + "MUSR": 0.3315, + "MMLU-PRO": 0.1571 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_3e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_3e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.252, + "BBH": 0.3198, + "MATH Level 5": 0.0423, + "GPQA": 0.2634, + "MUSR": 0.3262, + "MMLU-PRO": 0.1551 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_4e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_4e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.258, + "BBH": 0.3248, + "MATH Level 5": 0.0476, + "GPQA": 0.2752, + "MUSR": 0.3422, + "MMLU-PRO": 0.1539 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_6e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_6e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.232, + "BBH": 0.3265, + "MATH Level 5": 0.0385, + "GPQA": 0.271, + "MUSR": 0.3395, + "MMLU-PRO": 0.1537 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_7e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_7e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2488, + "BBH": 0.3273, + "MATH Level 5": 0.0461, + "GPQA": 0.2718, + "MUSR": 0.3342, + "MMLU-PRO": 0.1531 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.5_7e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.5_7e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2524, + "BBH": 0.313, + "MATH Level 5": 0.0446, + "GPQA": 0.271, + "MUSR": 0.3289, + "MMLU-PRO": 0.1564 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.7_3e-6-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.7_3e-6-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2514, + "BBH": 0.3221, + "MATH Level 5": 0.0438, + "GPQA": 0.2752, + "MUSR": 0.3315, + "MMLU-PRO": 0.1538 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.7_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.7_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2457, + "BBH": 0.318, + "MATH Level 5": 0.0385, + "GPQA": 0.2668, + "MUSR": 0.3275, + "MMLU-PRO": 0.1572 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-MDPO_0.9_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-MDPO_0.9_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2636, + "BBH": 0.3181, + "MATH Level 5": 0.0476, + "GPQA": 0.2659, + "MUSR": 0.3235, + "MMLU-PRO": 0.1574 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_3e-6-1ep_3vpo_const", + "name": "Qwen_0.5-VDPO_3e-6-1ep_3vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2483, + "BBH": 0.3174, + "MATH Level 5": 0.0378, + "GPQA": 0.2542, + "MUSR": 0.3328, + "MMLU-PRO": 0.1558 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_5e-7-1ep_0alp_0lam", + "name": "Qwen_0.5-VDPO_5e-7-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2518, + "BBH": 0.3218, + "MATH Level 5": 0.0529, + "GPQA": 0.2718, + "MUSR": 0.3235, + "MMLU-PRO": 0.1595 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_5e-7-1ep_10vpo_const", + "name": "Qwen_0.5-VDPO_5e-7-1ep_10vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2536, + "BBH": 0.3234, + "MATH Level 5": 0.0491, + "GPQA": 0.276, + "MUSR": 0.3236, + "MMLU-PRO": 0.1597 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_5e-7-1ep_1vpo_const", + "name": "Qwen_0.5-VDPO_5e-7-1ep_1vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2448, + "BBH": 0.324, + "MATH Level 5": 0.0604, + "GPQA": 0.2752, + "MUSR": 0.3249, + "MMLU-PRO": 0.1587 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_5e-7-1ep_3vpo_const", + "name": "Qwen_0.5-VDPO_5e-7-1ep_3vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2505, + "BBH": 0.3227, + "MATH Level 5": 0.0468, + "GPQA": 0.271, + "MUSR": 0.3209, + "MMLU-PRO": 0.1589 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-VDPO_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2472, + "BBH": 0.3255, + "MATH Level 5": 0.0498, + "GPQA": 0.2752, + "MUSR": 0.3208, + "MMLU-PRO": 0.1587 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_5e-7-3ep_1vpo_const", + "name": "Qwen_0.5-VDPO_5e-7-3ep_1vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2417, + "BBH": 0.3256, + "MATH Level 5": 0.0582, + "GPQA": 0.2727, + "MUSR": 0.3275, + "MMLU-PRO": 0.1562 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VDPO_5e-7-3ep_3vpo_const", + "name": "Qwen_0.5-VDPO_5e-7-3ep_3vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2527, + "BBH": 0.3235, + "MATH Level 5": 0.0536, + "GPQA": 0.2785, + "MUSR": 0.3235, + "MMLU-PRO": 0.158 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-1ep_0alp_0lam", + "name": "Qwen_0.5-VIPO_5e-7-1ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2669, + "BBH": 0.3314, + "MATH Level 5": 0.071, + "GPQA": 0.2676, + "MUSR": 0.3168, + "MMLU-PRO": 0.1634 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-1ep_10vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-1ep_10vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2702, + "BBH": 0.33, + "MATH Level 5": 0.074, + "GPQA": 0.2752, + "MUSR": 0.3208, + "MMLU-PRO": 0.1635 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-1ep_1vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-1ep_1vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.248, + "BBH": 0.3309, + "MATH Level 5": 0.068, + "GPQA": 0.2643, + "MUSR": 0.3208, + "MMLU-PRO": 0.1649 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-1ep_30vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-1ep_30vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2622, + "BBH": 0.3282, + "MATH Level 5": 0.074, + "GPQA": 0.2693, + "MUSR": 0.3221, + "MMLU-PRO": 0.1634 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-1ep_3vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-1ep_3vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2609, + "BBH": 0.3298, + "MATH Level 5": 0.065, + "GPQA": 0.2701, + "MUSR": 0.3168, + "MMLU-PRO": 0.1651 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-3ep_0alp_0lam", + "name": "Qwen_0.5-VIPO_5e-7-3ep_0alp_0lam", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.293, + "BBH": 0.322, + "MATH Level 5": 0.0627, + "GPQA": 0.2685, + "MUSR": 0.3116, + "MMLU-PRO": 0.1591 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-3ep_10vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-3ep_10vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2881, + "BBH": 0.3255, + "MATH Level 5": 0.0725, + "GPQA": 0.2752, + "MUSR": 0.3102, + "MMLU-PRO": 0.1582 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-3ep_1vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-3ep_1vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2887, + "BBH": 0.3237, + "MATH Level 5": 0.0748, + "GPQA": 0.2802, + "MUSR": 0.3142, + "MMLU-PRO": 0.1609 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-3ep_30vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-3ep_30vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2905, + "BBH": 0.3254, + "MATH Level 5": 0.077, + "GPQA": 0.2735, + "MUSR": 0.3129, + "MMLU-PRO": 0.1574 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-VIPO_5e-7-3ep_3vpo_const", + "name": "Qwen_0.5-VIPO_5e-7-3ep_3vpo_const", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2905, + "BBH": 0.3238, + "MATH Level 5": 0.0702, + "GPQA": 0.2735, + "MUSR": 0.3089, + "MMLU-PRO": 0.1592 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-cDPO_5e-7-3ep_0vpo_const_0.1", + "name": "Qwen_0.5-cDPO_5e-7-3ep_0vpo_const_0.1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2393, + "BBH": 0.3244, + "MATH Level 5": 0.0514, + "GPQA": 0.2777, + "MUSR": 0.3222, + "MMLU-PRO": 0.1573 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-cDPO_5e-7-3ep_0vpo_const_0.3", + "name": "Qwen_0.5-cDPO_5e-7-3ep_0vpo_const_0.3", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2475, + "BBH": 0.3209, + "MATH Level 5": 0.0461, + "GPQA": 0.281, + "MUSR": 0.3275, + "MMLU-PRO": 0.1567 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-rDPO_3e-6-1ep_0vpo_const_0.1", + "name": "Qwen_0.5-rDPO_3e-6-1ep_0vpo_const_0.1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2321, + "BBH": 0.3278, + "MATH Level 5": 0.0476, + "GPQA": 0.2576, + "MUSR": 0.3022, + "MMLU-PRO": 0.1496 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-rDPO_5e-7-3ep_0vpo_const_0.1", + "name": "Qwen_0.5-rDPO_5e-7-3ep_0vpo_const_0.1", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2542, + "BBH": 0.3253, + "MATH Level 5": 0.0529, + "GPQA": 0.271, + "MUSR": 0.3181, + "MMLU-PRO": 0.1609 + } + }, + { + "model_id": "JayHyeon/Qwen_0.5-rDPO_5e-7-3ep_0vpo_const_0.3", + "name": "Qwen_0.5-rDPO_5e-7-3ep_0vpo_const_0.3", + "developer": "JayHyeon", + "scores": { + "IFEval": 0.2739, + "BBH": 0.3245, + "MATH Level 5": 0.0461, + "GPQA": 0.2508, + "MUSR": 0.3089, + "MMLU-PRO": 0.1597 + } + }, + { + "model_id": "Jimmy19991222/Llama-3-Instruct-8B-SimPO-v0.2", + "name": "Llama-3-Instruct-8B-SimPO-v0.2", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.654, + "BBH": 0.4984, + "MATH Level 5": 0.0619, + "GPQA": 0.3146, + "MUSR": 0.4013, + "MMLU-PRO": 0.3686 + } + }, + { + "model_id": "Jimmy19991222/llama-3-8b-instruct-gapo-v2-bert-f1-beta10-gamma0.3-lr1.0e-6-1minus-rerun", + "name": "llama-3-8b-instruct-gapo-v2-bert-f1-beta10-gamma0.3-lr1.0e-6-1minus-rerun", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.6717, + "BBH": 0.488, + "MATH Level 5": 0.0604, + "GPQA": 0.2945, + "MUSR": 0.4041, + "MMLU-PRO": 0.3634 + } + }, + { + "model_id": "Jimmy19991222/llama-3-8b-instruct-gapo-v2-bert_f1-beta10-gamma0.3-lr1.0e-6-scale-log", + "name": "llama-3-8b-instruct-gapo-v2-bert_f1-beta10-gamma0.3-lr1.0e-6-scale-log", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.6556, + "BBH": 0.4935, + "MATH Level 5": 0.0544, + "GPQA": 0.3045, + "MUSR": 0.4, + "MMLU-PRO": 0.3658 + } + }, + { + "model_id": "Jimmy19991222/llama-3-8b-instruct-gapo-v2-bert_p-beta10-gamma0.3-lr1.0e-6-scale-log", + "name": "llama-3-8b-instruct-gapo-v2-bert_p-beta10-gamma0.3-lr1.0e-6-scale-log", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.6315, + "BBH": 0.4916, + "MATH Level 5": 0.065, + "GPQA": 0.2861, + "MUSR": 0.3935, + "MMLU-PRO": 0.3611 + } + }, + { + "model_id": "Jimmy19991222/llama-3-8b-instruct-gapo-v2-bleu-beta0.1-no-length-scale-gamma0.4", + "name": "llama-3-8b-instruct-gapo-v2-bleu-beta0.1-no-length-scale-gamma0.4", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.6285, + "BBH": 0.4986, + "MATH Level 5": 0.0514, + "GPQA": 0.2928, + "MUSR": 0.4014, + "MMLU-PRO": 0.3545 + } + }, + { + "model_id": "Jimmy19991222/llama-3-8b-instruct-gapo-v2-rouge2-beta10-1minus-gamma0.3-rerun", + "name": "llama-3-8b-instruct-gapo-v2-rouge2-beta10-1minus-gamma0.3-rerun", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.6678, + "BBH": 0.494, + "MATH Level 5": 0.0612, + "GPQA": 0.3062, + "MUSR": 0.3987, + "MMLU-PRO": 0.3658 + } + }, + { + "model_id": "Jimmy19991222/llama-3-8b-instruct-gapo-v2-rouge2-beta10-gamma0.3-lr1.0e-6-scale-log", + "name": "llama-3-8b-instruct-gapo-v2-rouge2-beta10-gamma0.3-lr1.0e-6-scale-log", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.6605, + "BBH": 0.4916, + "MATH Level 5": 0.0657, + "GPQA": 0.3037, + "MUSR": 0.4, + "MMLU-PRO": 0.3664 + } + }, + { + "model_id": "Jimmy19991222/llama-3-8b-instruct-gapo-v2-rougeL-beta10-gamma0.3-lr1.0e-6-scale-log", + "name": "llama-3-8b-instruct-gapo-v2-rougeL-beta10-gamma0.3-lr1.0e-6-scale-log", + "developer": "Jimmy19991222", + "scores": { + "IFEval": 0.6492, + "BBH": 0.4952, + "MATH Level 5": 0.0642, + "GPQA": 0.302, + "MUSR": 0.3961, + "MMLU-PRO": 0.3711 + } + }, + { + "model_id": "Joseph717171/Hermes-3-Llama-3.1-8B_TIES_with_Base_Embeds_Initialized_to_Special_Instruct_Toks_dtypeF32", + "name": "Hermes-3-Llama-3.1-8B_TIES_with_Base_Embeds_Initialized_to_Special_Instruct_Toks_dtypeF32", + "developer": "Joseph717171", + "scores": { + "IFEval": 0.6185, + "BBH": 0.5177, + "MATH Level 5": 0.0514, + "GPQA": 0.2827, + "MUSR": 0.4369, + "MMLU-PRO": 0.3144 + } + }, + { + "model_id": "Joseph717171/Llama-3.1-SuperNova-8B-Lite_TIES_with_Base", + "name": "Llama-3.1-SuperNova-8B-Lite_TIES_with_Base", + "developer": "Joseph717171", + "scores": { + "IFEval": 0.8096, + "BBH": 0.5147, + "MATH Level 5": 0.1835, + "GPQA": 0.3096, + "MUSR": 0.411, + "MMLU-PRO": 0.388 + } + }, + { + "model_id": "Josephgflowers/Cinder-Phi-2-V1-F16-gguf", + "name": "Cinder-Phi-2-V1-F16-gguf", + "developer": "Josephgflowers", + "scores": { + "IFEval": 0.2357, + "BBH": 0.4397, + "MATH Level 5": 0.0242, + "GPQA": 0.2819, + "MUSR": 0.3435, + "MMLU-PRO": 0.2161 + } + }, + { + "model_id": "Josephgflowers/Differential-Attention-Liquid-Metal-Tinyllama", + "name": "Differential-Attention-Liquid-Metal-Tinyllama", + "developer": "Josephgflowers", + "scores": { + "IFEval": 0.2227, + "BBH": 0.2926, + "MATH Level 5": 0.0325, + "GPQA": 0.2508, + "MUSR": 0.3356, + "MMLU-PRO": 0.1214 + } + }, + { + "model_id": "Josephgflowers/TinyLlama-Cinder-Agent-v1", + "name": "TinyLlama-Cinder-Agent-v1", + "developer": "Josephgflowers", + "scores": { + "IFEval": 0.267, + "BBH": 0.3116, + "MATH Level 5": 0.0347, + "GPQA": 0.2441, + "MUSR": 0.3395, + "MMLU-PRO": 0.1161 + } + }, + { + "model_id": "Josephgflowers/TinyLlama-v1.1-Cinders-World", + "name": "TinyLlama-v1.1-Cinders-World", + "developer": "Josephgflowers", + "scores": { + "IFEval": 0.2469, + "BBH": 0.2998, + "MATH Level 5": 0.0347, + "GPQA": 0.2441, + "MUSR": 0.3356, + "MMLU-PRO": 0.1198 + } + }, + { + "model_id": "Josephgflowers/TinyLlama_v1.1_math_code-world-test-1", + "name": "TinyLlama_v1.1_math_code-world-test-1", + "developer": "Josephgflowers", + "scores": { + "IFEval": 0.0078, + "BBH": 0.3146, + "MATH Level 5": 0.0196, + "GPQA": 0.2341, + "MUSR": 0.3499, + "MMLU-PRO": 0.1132 + } + }, + { + "model_id": "Josephgflowers/Tinyllama-STEM-Cinder-Agent-v1", + "name": "Tinyllama-STEM-Cinder-Agent-v1", + "developer": "Josephgflowers", + "scores": { + "IFEval": 0.2126, + "BBH": 0.3084, + "MATH Level 5": 0.0672, + "GPQA": 0.2349, + "MUSR": 0.3341, + "MMLU-PRO": 0.1086 + } + }, + { + "model_id": "Josephgflowers/Tinyllama-r1", + "name": "Tinyllama-r1", + "developer": "Josephgflowers", + "scores": { + "IFEval": 0.2119, + "BBH": 0.3015, + "MATH Level 5": 0.0325, + "GPQA": 0.2567, + "MUSR": 0.3315, + "MMLU-PRO": 0.1134 + } + }, + { + "model_id": "JungZoona/T3Q-Qwen2.5-14B-Instruct-1M-e3", + "name": "T3Q-Qwen2.5-14B-Instruct-1M-e3", + "developer": "JungZoona", + "scores": { + "IFEval": 0.7324, + "BBH": 0.7586, + "MATH Level 5": 0.2863, + "GPQA": 0.4169, + "MUSR": 0.5911, + "MMLU-PRO": 0.5884 + } + }, + { + "model_id": "JungZoona/T3Q-qwen2.5-14b-v1.0-e3", + "name": "T3Q-qwen2.5-14b-v1.0-e3", + "developer": "JungZoona", + "scores": { + "IFEval": 0.7324, + "BBH": 0.7586, + "MATH Level 5": 0.2863, + "GPQA": 0.4169, + "MUSR": 0.5911, + "MMLU-PRO": 0.5884 + } + }, + { + "model_id": "Junhoee/Qwen-Megumin", + "name": "Qwen-Megumin", + "developer": "Junhoee", + "scores": { + "IFEval": 0.7141, + "BBH": 0.5285, + "MATH Level 5": 0.4902, + "GPQA": 0.2961, + "MUSR": 0.398, + "MMLU-PRO": 0.4199 + } + }, + { + "model_id": "KSU-HW-SEC/Llama3-70b-SVA-FT-1415", + "name": "Llama3-70b-SVA-FT-1415", + "developer": "KSU-HW-SEC", + "scores": { + "IFEval": 0.618, + "BBH": 0.665, + "MATH Level 5": 0.2198, + "GPQA": 0.375, + "MUSR": 0.4565, + "MMLU-PRO": 0.5243 + } + }, + { + "model_id": "KSU-HW-SEC/Llama3-70b-SVA-FT-500", + "name": "Llama3-70b-SVA-FT-500", + "developer": "KSU-HW-SEC", + "scores": { + "IFEval": 0.6105, + "BBH": 0.6692, + "MATH Level 5": 0.2137, + "GPQA": 0.3809, + "MUSR": 0.4511, + "MMLU-PRO": 0.5227 + } + }, + { + "model_id": "KSU-HW-SEC/Llama3-70b-SVA-FT-final", + "name": "Llama3-70b-SVA-FT-final", + "developer": "KSU-HW-SEC", + "scores": { + "IFEval": 0.6165, + "BBH": 0.665, + "MATH Level 5": 0.2198, + "GPQA": 0.375, + "MUSR": 0.4565, + "MMLU-PRO": 0.5243 + } + }, + { + "model_id": "KSU-HW-SEC/Llama3.1-70b-SVA-FT-1000step", + "name": "Llama3.1-70b-SVA-FT-1000step", + "developer": "KSU-HW-SEC", + "scores": { + "IFEval": 0.7238, + "BBH": 0.6903, + "MATH Level 5": 0.321, + "GPQA": 0.396, + "MUSR": 0.4592, + "MMLU-PRO": 0.5252 + } + }, + { + "model_id": "Khetterman/DarkAtom-12B-v3", + "name": "DarkAtom-12B-v3", + "developer": "Khetterman", + "scores": { + "IFEval": 0.6173, + "BBH": 0.5154, + "MATH Level 5": 0.111, + "GPQA": 0.2978, + "MUSR": 0.4468, + "MMLU-PRO": 0.3546 + } + }, + { + "model_id": "Khetterman/Kosmos-8B-v1", + "name": "Kosmos-8B-v1", + "developer": "Khetterman", + "scores": { + "IFEval": 0.4129, + "BBH": 0.5234, + "MATH Level 5": 0.0989, + "GPQA": 0.2987, + "MUSR": 0.3919, + "MMLU-PRO": 0.3669 + } + }, + { + "model_id": "Kimargin/GPT-NEO-1.3B-wiki", + "name": "GPT-NEO-1.3B-wiki", + "developer": "Kimargin", + "scores": { + "IFEval": 0.1921, + "BBH": 0.3026, + "MATH Level 5": 0.0144, + "GPQA": 0.245, + "MUSR": 0.3883, + "MMLU-PRO": 0.1099 + } + }, + { + "model_id": "KingNish/Qwen2.5-0.5b-Test-ft", + "name": "Qwen2.5-0.5b-Test-ft", + "developer": "KingNish", + "scores": { + "IFEval": 0.2671, + "BBH": 0.3232, + "MATH Level 5": 0.0355, + "GPQA": 0.2634, + "MUSR": 0.3421, + "MMLU-PRO": 0.1689 + } + }, + { + "model_id": "KingNish/Reasoning-0.5b", + "name": "Reasoning-0.5b", + "developer": "KingNish", + "scores": { + "IFEval": 0.2174, + "BBH": 0.3354, + "MATH Level 5": 0.0219, + "GPQA": 0.2676, + "MUSR": 0.3513, + "MMLU-PRO": 0.1641 + } + }, + { + "model_id": "KingNish/Reasoning-Llama-3b-v0.1", + "name": "Reasoning-Llama-3b-v0.1", + "developer": "KingNish", + "scores": { + "IFEval": 0.6225, + "BBH": 0.4343, + "MATH Level 5": 0.1299, + "GPQA": 0.2592, + "MUSR": 0.3168, + "MMLU-PRO": 0.3029 + } + }, + { + "model_id": "KingNish/qwen-1b-continued", + "name": "qwen-1b-continued", + "developer": "KingNish", + "scores": { + "IFEval": 0.1255, + "BBH": 0.2991, + "MATH Level 5": 0.0091, + "GPQA": 0.2676, + "MUSR": 0.3859, + "MMLU-PRO": 0.1261 + } + }, + { + "model_id": "KingNish/qwen-1b-continued-v2", + "name": "qwen-1b-continued-v2", + "developer": "KingNish", + "scores": { + "IFEval": 0.1579, + "BBH": 0.3119, + "MATH Level 5": 0.0106, + "GPQA": 0.25, + "MUSR": 0.3393, + "MMLU-PRO": 0.1193 + } + }, + { + "model_id": "KingNish/qwen-1b-continued-v2.1", + "name": "qwen-1b-continued-v2.1", + "developer": "KingNish", + "scores": { + "IFEval": 0.1127, + "BBH": 0.3042, + "MATH Level 5": 0.0091, + "GPQA": 0.2676, + "MUSR": 0.4154, + "MMLU-PRO": 0.1278 + } + }, + { + "model_id": "KingNish/qwen-1b-continued-v2.2", + "name": "qwen-1b-continued-v2.2", + "developer": "KingNish", + "scores": { + "IFEval": 0.1413, + "BBH": 0.3059, + "MATH Level 5": 0.0151, + "GPQA": 0.2567, + "MUSR": 0.3513, + "MMLU-PRO": 0.1262 + } + }, + { + "model_id": "Kquant03/CognitiveFusion2-4x7B-BF16", + "name": "CognitiveFusion2-4x7B-BF16", + "developer": "Kquant03", + "scores": { + "IFEval": 0.3567, + "BBH": 0.4108, + "MATH Level 5": 0.0574, + "GPQA": 0.2861, + "MUSR": 0.4146, + "MMLU-PRO": 0.2793 + } + }, + { + "model_id": "Kquant03/L3-Pneuma-8B", + "name": "L3-Pneuma-8B", + "developer": "Kquant03", + "scores": { + "IFEval": 0.2374, + "BBH": 0.4955, + "MATH Level 5": 0.0506, + "GPQA": 0.307, + "MUSR": 0.4172, + "MMLU-PRO": 0.3184 + } + }, + { + "model_id": "Krystalan/DRT-o1-14B", + "name": "DRT-o1-14B", + "developer": "Krystalan", + "scores": { + "IFEval": 0.4068, + "BBH": 0.6379, + "MATH Level 5": 0.4826, + "GPQA": 0.3523, + "MUSR": 0.4795, + "MMLU-PRO": 0.5179 + } + }, + { + "model_id": "Krystalan/DRT-o1-7B", + "name": "DRT-o1-7B", + "developer": "Krystalan", + "scores": { + "IFEval": 0.3928, + "BBH": 0.5468, + "MATH Level 5": 0.4479, + "GPQA": 0.3213, + "MUSR": 0.5087, + "MMLU-PRO": 0.4151 + } + }, + { + "model_id": "Kukedlc/NeuralExperiment-7b-MagicCoder-v7.5", + "name": "NeuralExperiment-7b-MagicCoder-v7.5", + "developer": "Kukedlc", + "scores": { + "IFEval": 0.4553, + "BBH": 0.3988, + "MATH Level 5": 0.0665, + "GPQA": 0.2961, + "MUSR": 0.4282, + "MMLU-PRO": 0.2824 + } + }, + { + "model_id": "Kukedlc/NeuralLLaMa-3-8b-DT-v0.1", + "name": "NeuralLLaMa-3-8b-DT-v0.1", + "developer": "Kukedlc", + "scores": { + "IFEval": 0.4371, + "BBH": 0.4987, + "MATH Level 5": 0.0808, + "GPQA": 0.3029, + "MUSR": 0.4071, + "MMLU-PRO": 0.3792 + } + }, + { + "model_id": "Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.3", + "name": "NeuralLLaMa-3-8b-ORPO-v0.3", + "developer": "Kukedlc", + "scores": { + "IFEval": 0.5276, + "BBH": 0.4557, + "MATH Level 5": 0.0483, + "GPQA": 0.2391, + "MUSR": 0.37, + "MMLU-PRO": 0.3057 + } + }, + { + "model_id": "Kukedlc/NeuralSynthesis-7B-v0.1", + "name": "NeuralSynthesis-7B-v0.1", + "developer": "Kukedlc", + "scores": { + "IFEval": 0.4185, + "BBH": 0.5145, + "MATH Level 5": 0.0634, + "GPQA": 0.281, + "MUSR": 0.4333, + "MMLU-PRO": 0.3049 + } + }, + { + "model_id": "Kukedlc/NeuralSynthesis-7B-v0.3", + "name": "NeuralSynthesis-7B-v0.3", + "developer": "Kukedlc", + "scores": { + "IFEval": 0.4078, + "BBH": 0.5138, + "MATH Level 5": 0.0778, + "GPQA": 0.2802, + "MUSR": 0.4346, + "MMLU-PRO": 0.305 + } + }, + { + "model_id": "Kukedlc/NeuralSynthesis-7b-v0.4-slerp", + "name": "NeuralSynthesis-7b-v0.4-slerp", + "developer": "Kukedlc", + "scores": { + "IFEval": 0.3947, + "BBH": 0.5143, + "MATH Level 5": 0.0627, + "GPQA": 0.2777, + "MUSR": 0.4332, + "MMLU-PRO": 0.3043 + } + }, + { + "model_id": "Kukedlc/Qwen-2.5-7b-Spanish-o1-CoT", + "name": "Qwen-2.5-7b-Spanish-o1-CoT", + "developer": "Kukedlc", + "scores": { + "IFEval": 0.421, + "BBH": 0.5602, + "MATH Level 5": 0.2727, + "GPQA": 0.3205, + "MUSR": 0.4777, + "MMLU-PRO": 0.4363 + } + }, + { + "model_id": "Kumar955/Hemanth-llm", + "name": "Hemanth-llm", + "developer": "Kumar955", + "scores": { + "IFEval": 0.5045, + "BBH": 0.5225, + "MATH Level 5": 0.0702, + "GPQA": 0.2827, + "MUSR": 0.4486, + "MMLU-PRO": 0.3113 + } + }, + { + "model_id": "L-RAGE/3_PRYMMAL-ECE-7B-SLERP-V1", + "name": "3_PRYMMAL-ECE-7B-SLERP-V1", + "developer": "L-RAGE", + "scores": { + "IFEval": 0.2742, + "BBH": 0.4228, + "MATH Level 5": 0.108, + "GPQA": 0.2819, + "MUSR": 0.3841, + "MMLU-PRO": 0.2925 + } + }, + { + "model_id": "LEESM/llama-2-7b-hf-lora-oki100p", + "name": "llama-2-7b-hf-lora-oki100p", + "developer": "LEESM", + "scores": { + "IFEval": 0.2513, + "BBH": 0.3492, + "MATH Level 5": 0.0166, + "GPQA": 0.2693, + "MUSR": 0.3687, + "MMLU-PRO": 0.1856 + } + }, + { + "model_id": "LEESM/llama-2-7b-hf-lora-oki10p", + "name": "llama-2-7b-hf-lora-oki10p", + "developer": "LEESM", + "scores": { + "IFEval": 0.227, + "BBH": 0.3531, + "MATH Level 5": 0.0166, + "GPQA": 0.2542, + "MUSR": 0.3475, + "MMLU-PRO": 0.1679 + } + }, + { + "model_id": "LEESM/llama-3-8b-bnb-4b-kowiki231101", + "name": "llama-3-8b-bnb-4b-kowiki231101", + "developer": "LEESM", + "scores": { + "IFEval": 0.1685, + "BBH": 0.4131, + "MATH Level 5": 0.0136, + "GPQA": 0.271, + "MUSR": 0.3551, + "MMLU-PRO": 0.2425 + } + }, + { + "model_id": "LEESM/llama-3-Korean-Bllossom-8B-trexlab-oki10p", + "name": "llama-3-Korean-Bllossom-8B-trexlab-oki10p", + "developer": "LEESM", + "scores": { + "IFEval": 0.2137, + "BBH": 0.4343, + "MATH Level 5": 0.0468, + "GPQA": 0.2752, + "MUSR": 0.3869, + "MMLU-PRO": 0.3177 + } + }, + { + "model_id": "LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct", + "name": "EXAONE-3.0-7.8B-Instruct", + "developer": "LGAI-EXAONE", + "scores": { + "IFEval": 0.7193, + "BBH": 0.4174, + "MATH Level 5": 0.3044, + "GPQA": 0.2659, + "MUSR": 0.3661, + "MMLU-PRO": 0.3577 + } + }, + { + "model_id": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct", + "name": "EXAONE-3.5-2.4B-Instruct", + "developer": "LGAI-EXAONE", + "scores": { + "IFEval": 0.795, + "BBH": 0.4092, + "MATH Level 5": 0.3678, + "GPQA": 0.2659, + "MUSR": 0.3661, + "MMLU-PRO": 0.328 + } + }, + { + "model_id": "LGAI-EXAONE/EXAONE-3.5-32B-Instruct", + "name": "EXAONE-3.5-32B-Instruct", + "developer": "LGAI-EXAONE", + "scores": { + "IFEval": 0.8392, + "BBH": 0.5761, + "MATH Level 5": 0.5128, + "GPQA": 0.2878, + "MUSR": 0.3807, + "MMLU-PRO": 0.4637 + } + }, + { + "model_id": "LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct", + "name": "EXAONE-3.5-7.8B-Instruct", + "developer": "LGAI-EXAONE", + "scores": { + "IFEval": 0.8136, + "BBH": 0.4728, + "MATH Level 5": 0.4751, + "GPQA": 0.2576, + "MUSR": 0.3779, + "MMLU-PRO": 0.4133 + } + }, + { + "model_id": "LLM360/K2", + "name": "K2", + "developer": "LLM360", + "scores": { + "IFEval": 0.2252, + "BBH": 0.4972, + "MATH Level 5": 0.0272, + "GPQA": 0.2768, + "MUSR": 0.398, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "LLM360/K2-Chat", + "name": "K2-Chat", + "developer": "LLM360", + "scores": { + "IFEval": 0.5152, + "BBH": 0.5358, + "MATH Level 5": 0.1035, + "GPQA": 0.3062, + "MUSR": 0.457, + "MMLU-PRO": 0.3371 + } + }, + { + "model_id": "LLM4Binary/llm4decompile-1.3b-v2", + "name": "llm4decompile-1.3b-v2", + "developer": "LLM4Binary", + "scores": { + "IFEval": 0.2268, + "BBH": 0.3272, + "MATH Level 5": 0.0128, + "GPQA": 0.2357, + "MUSR": 0.4072, + "MMLU-PRO": 0.1209 + } + }, + { + "model_id": "Lambent/qwen2.5-reinstruct-alternate-lumen-14B", + "name": "qwen2.5-reinstruct-alternate-lumen-14B", + "developer": "Lambent", + "scores": { + "IFEval": 0.4794, + "BBH": 0.6459, + "MATH Level 5": 0.4622, + "GPQA": 0.3767, + "MUSR": 0.477, + "MMLU-PRO": 0.5388 + } + }, + { + "model_id": "Langboat/Mengzi3-8B-Chat", + "name": "Mengzi3-8B-Chat", + "developer": "Langboat", + "scores": { + "IFEval": 0.514, + "BBH": 0.4684, + "MATH Level 5": 0.0906, + "GPQA": 0.2743, + "MUSR": 0.4078, + "MMLU-PRO": 0.3142 + } + }, + { + "model_id": "Lawnakk/BBA100", + "name": "BBA100", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.2076, + "BBH": 0.2826, + "MATH Level 5": 0.0098, + "GPQA": 0.2441, + "MUSR": 0.402, + "MMLU-PRO": 0.1122 + } + }, + { + "model_id": "Lawnakk/BBALAW1", + "name": "BBALAW1", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.1905, + "BBH": 0.2872, + "MATH Level 5": 0.0098, + "GPQA": 0.2433, + "MUSR": 0.4153, + "MMLU-PRO": 0.1121 + } + }, + { + "model_id": "Lawnakk/BBALAW1.0", + "name": "BBALAW1.0", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.1351, + "BBH": 0.2828, + "MATH Level 5": 0.0, + "GPQA": 0.2559, + "MUSR": 0.3526, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "Lawnakk/BBALAW1.2", + "name": "BBALAW1.2", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.1354, + "BBH": 0.2811, + "MATH Level 5": 0.0, + "GPQA": 0.2643, + "MUSR": 0.3579, + "MMLU-PRO": 0.1105 + } + }, + { + "model_id": "Lawnakk/BBALAW1.3", + "name": "BBALAW1.3", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.1354, + "BBH": 0.2827, + "MATH Level 5": 0.0, + "GPQA": 0.2609, + "MUSR": 0.3619, + "MMLU-PRO": 0.1094 + } + }, + { + "model_id": "Lawnakk/BBALAW1.6", + "name": "BBALAW1.6", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.5245, + "BBH": 0.5554, + "MATH Level 5": 0.3603, + "GPQA": 0.3238, + "MUSR": 0.4368, + "MMLU-PRO": 0.4507 + } + }, + { + "model_id": "Lawnakk/BBALAW1.61", + "name": "BBALAW1.61", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.5771, + "BBH": 0.5549, + "MATH Level 5": 0.3663, + "GPQA": 0.3171, + "MUSR": 0.4355, + "MMLU-PRO": 0.4471 + } + }, + { + "model_id": "Lawnakk/BBALAW1.62", + "name": "BBALAW1.62", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.5046, + "BBH": 0.5581, + "MATH Level 5": 0.2825, + "GPQA": 0.3196, + "MUSR": 0.4343, + "MMLU-PRO": 0.4545 + } + }, + { + "model_id": "Lawnakk/BBALAW1.63", + "name": "BBALAW1.63", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.4407, + "BBH": 0.5541, + "MATH Level 5": 0.3701, + "GPQA": 0.3121, + "MUSR": 0.4303, + "MMLU-PRO": 0.4471 + } + }, + { + "model_id": "Lawnakk/BBALAW1.64", + "name": "BBALAW1.64", + "developer": "Lawnakk", + "scores": { + "IFEval": 0.1395, + "BBH": 0.2779, + "MATH Level 5": 0.0, + "GPQA": 0.2483, + "MUSR": 0.3447, + "MMLU-PRO": 0.1115 + } + }, + { + "model_id": "LenguajeNaturalAI/leniachat-gemma-2b-v0", + "name": "leniachat-gemma-2b-v0", + "developer": "LenguajeNaturalAI", + "scores": { + "IFEval": 0.215, + "BBH": 0.3074, + "MATH Level 5": 0.0113, + "GPQA": 0.2659, + "MUSR": 0.3659, + "MMLU-PRO": 0.117 + } + }, + { + "model_id": "LenguajeNaturalAI/leniachat-qwen2-1.5B-v0", + "name": "leniachat-qwen2-1.5B-v0", + "developer": "LenguajeNaturalAI", + "scores": { + "IFEval": 0.2221, + "BBH": 0.3684, + "MATH Level 5": 0.0128, + "GPQA": 0.2617, + "MUSR": 0.375, + "MMLU-PRO": 0.188 + } + }, + { + "model_id": "LeroyDyer/CheckPoint_A", + "name": "CheckPoint_A", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4513, + "BBH": 0.4748, + "MATH Level 5": 0.0589, + "GPQA": 0.2836, + "MUSR": 0.4231, + "MMLU-PRO": 0.288 + } + }, + { + "model_id": "LeroyDyer/CheckPoint_B", + "name": "CheckPoint_B", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.444, + "BBH": 0.478, + "MATH Level 5": 0.0718, + "GPQA": 0.2903, + "MUSR": 0.3898, + "MMLU-PRO": 0.2907 + } + }, + { + "model_id": "LeroyDyer/CheckPoint_C", + "name": "CheckPoint_C", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3477, + "BBH": 0.4586, + "MATH Level 5": 0.0551, + "GPQA": 0.271, + "MUSR": 0.4346, + "MMLU-PRO": 0.3021 + } + }, + { + "model_id": "LeroyDyer/CheckPoint_R1", + "name": "CheckPoint_R1", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.1728, + "BBH": 0.4225, + "MATH Level 5": 0.0431, + "GPQA": 0.2743, + "MUSR": 0.4031, + "MMLU-PRO": 0.2205 + } + }, + { + "model_id": "LeroyDyer/LCARS_AI_001", + "name": "LCARS_AI_001", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3109, + "BBH": 0.4258, + "MATH Level 5": 0.0234, + "GPQA": 0.2634, + "MUSR": 0.4384, + "MMLU-PRO": 0.267 + } + }, + { + "model_id": "LeroyDyer/LCARS_AI_1x4_003_SuperAI", + "name": "LCARS_AI_1x4_003_SuperAI", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4111, + "BBH": 0.492, + "MATH Level 5": 0.0574, + "GPQA": 0.2827, + "MUSR": 0.4506, + "MMLU-PRO": 0.2972 + } + }, + { + "model_id": "LeroyDyer/LCARS_AI_StarTrek_Computer", + "name": "LCARS_AI_StarTrek_Computer", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3583, + "BBH": 0.4446, + "MATH Level 5": 0.0408, + "GPQA": 0.2676, + "MUSR": 0.395, + "MMLU-PRO": 0.2458 + } + }, + { + "model_id": "LeroyDyer/LCARS_TOP_SCORE", + "name": "LCARS_TOP_SCORE", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4371, + "BBH": 0.5127, + "MATH Level 5": 0.0672, + "GPQA": 0.2861, + "MUSR": 0.4293, + "MMLU-PRO": 0.3031 + } + }, + { + "model_id": "LeroyDyer/Mixtral_AI_SwahiliTron_7b", + "name": "Mixtral_AI_SwahiliTron_7b", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.1534, + "BBH": 0.3055, + "MATH Level 5": 0.0136, + "GPQA": 0.2651, + "MUSR": 0.342, + "MMLU-PRO": 0.1208 + } + }, + { + "model_id": "LeroyDyer/SpydazWebAI_Human_AGI", + "name": "SpydazWebAI_Human_AGI", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3388, + "BBH": 0.3375, + "MATH Level 5": 0.0144, + "GPQA": 0.2827, + "MUSR": 0.3966, + "MMLU-PRO": 0.1479 + } + }, + { + "model_id": "LeroyDyer/SpydazWebAI_Human_AGI_001", + "name": "SpydazWebAI_Human_AGI_001", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3118, + "BBH": 0.3433, + "MATH Level 5": 0.0196, + "GPQA": 0.2987, + "MUSR": 0.3994, + "MMLU-PRO": 0.1426 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_CyberTron_Ultra_7b", + "name": "SpydazWeb_AI_CyberTron_Ultra_7b", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.1556, + "BBH": 0.4811, + "MATH Level 5": 0.0136, + "GPQA": 0.2928, + "MUSR": 0.4136, + "MMLU-PRO": 0.2866 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAGI_001_M2", + "name": "SpydazWeb_AI_HumanAGI_001_M2", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.394, + "BBH": 0.4888, + "MATH Level 5": 0.0385, + "GPQA": 0.2894, + "MUSR": 0.4503, + "MMLU-PRO": 0.3005 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAGI_002", + "name": "SpydazWeb_AI_HumanAGI_002", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4088, + "BBH": 0.5044, + "MATH Level 5": 0.0665, + "GPQA": 0.2869, + "MUSR": 0.4865, + "MMLU-PRO": 0.3059 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_001", + "name": "SpydazWeb_AI_HumanAI_001", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2252, + "BBH": 0.3344, + "MATH Level 5": 0.0166, + "GPQA": 0.2886, + "MUSR": 0.386, + "MMLU-PRO": 0.1271 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_006", + "name": "SpydazWeb_AI_HumanAI_006", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.143, + "BBH": 0.3302, + "MATH Level 5": 0.0106, + "GPQA": 0.2802, + "MUSR": 0.3568, + "MMLU-PRO": 0.1135 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_007", + "name": "SpydazWeb_AI_HumanAI_007", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3352, + "BBH": 0.3416, + "MATH Level 5": 0.0227, + "GPQA": 0.2886, + "MUSR": 0.4096, + "MMLU-PRO": 0.1352 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_009_CHAT", + "name": "SpydazWeb_AI_HumanAI_009_CHAT", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2973, + "BBH": 0.3307, + "MATH Level 5": 0.0166, + "GPQA": 0.281, + "MUSR": 0.4138, + "MMLU-PRO": 0.1433 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_010_CHAT", + "name": "SpydazWeb_AI_HumanAI_010_CHAT", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2507, + "BBH": 0.3336, + "MATH Level 5": 0.0181, + "GPQA": 0.2592, + "MUSR": 0.4137, + "MMLU-PRO": 0.143 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_011_INSTRUCT", + "name": "SpydazWeb_AI_HumanAI_011_INSTRUCT", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3149, + "BBH": 0.3523, + "MATH Level 5": 0.0144, + "GPQA": 0.2794, + "MUSR": 0.3831, + "MMLU-PRO": 0.1595 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_011_INSTRUCT_ML", + "name": "SpydazWeb_AI_HumanAI_011_INSTRUCT_ML", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3752, + "BBH": 0.3984, + "MATH Level 5": 0.0257, + "GPQA": 0.2928, + "MUSR": 0.4239, + "MMLU-PRO": 0.2019 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_011_INSTRUCT_ML_r1", + "name": "SpydazWeb_AI_HumanAI_011_INSTRUCT_ML_r1", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.405, + "BBH": 0.4858, + "MATH Level 5": 0.0551, + "GPQA": 0.2928, + "MUSR": 0.3921, + "MMLU-PRO": 0.2956 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_012_INSTRUCT_IA", + "name": "SpydazWeb_AI_HumanAI_012_INSTRUCT_IA", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3036, + "BBH": 0.4575, + "MATH Level 5": 0.0446, + "GPQA": 0.3012, + "MUSR": 0.4253, + "MMLU-PRO": 0.2329 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_012_INSTRUCT_MX", + "name": "SpydazWeb_AI_HumanAI_012_INSTRUCT_MX", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3066, + "BBH": 0.3158, + "MATH Level 5": 0.0151, + "GPQA": 0.2911, + "MUSR": 0.3444, + "MMLU-PRO": 0.1107 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_012_INSTRUCT_XA", + "name": "SpydazWeb_AI_HumanAI_012_INSTRUCT_XA", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3579, + "BBH": 0.4477, + "MATH Level 5": 0.0423, + "GPQA": 0.3096, + "MUSR": 0.4134, + "MMLU-PRO": 0.2376 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_RP", + "name": "SpydazWeb_AI_HumanAI_RP", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2541, + "BBH": 0.3323, + "MATH Level 5": 0.0128, + "GPQA": 0.2752, + "MUSR": 0.3883, + "MMLU-PRO": 0.1324 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_AI_HumanAI_TextVision", + "name": "SpydazWeb_AI_HumanAI_TextVision", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3063, + "BBH": 0.3354, + "MATH Level 5": 0.0144, + "GPQA": 0.2919, + "MUSR": 0.3938, + "MMLU-PRO": 0.1387 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_HumanAI_M1", + "name": "SpydazWeb_HumanAI_M1", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.3582, + "BBH": 0.3563, + "MATH Level 5": 0.0249, + "GPQA": 0.2676, + "MUSR": 0.3671, + "MMLU-PRO": 0.1663 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_HumanAI_M2", + "name": "SpydazWeb_HumanAI_M2", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.375, + "BBH": 0.3931, + "MATH Level 5": 0.0287, + "GPQA": 0.2794, + "MUSR": 0.3751, + "MMLU-PRO": 0.201 + } + }, + { + "model_id": "LeroyDyer/SpydazWeb_HumanAI_M3", + "name": "SpydazWeb_HumanAI_M3", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.1579, + "BBH": 0.3127, + "MATH Level 5": 0.0091, + "GPQA": 0.271, + "MUSR": 0.3914, + "MMLU-PRO": 0.1149 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_12", + "name": "_Spydaz_Web_AI_12", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2765, + "BBH": 0.3163, + "MATH Level 5": 0.0136, + "GPQA": 0.2685, + "MUSR": 0.3582, + "MMLU-PRO": 0.1137 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_14", + "name": "_Spydaz_Web_AI_14", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.1812, + "BBH": 0.2989, + "MATH Level 5": 0.0121, + "GPQA": 0.2659, + "MUSR": 0.3395, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_001", + "name": "_Spydaz_Web_AI_AGI_R1_001", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4505, + "BBH": 0.4609, + "MATH Level 5": 0.0634, + "GPQA": 0.2676, + "MUSR": 0.4256, + "MMLU-PRO": 0.2734 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_002", + "name": "_Spydaz_Web_AI_AGI_R1_002", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5307, + "BBH": 0.4683, + "MATH Level 5": 0.0582, + "GPQA": 0.2685, + "MUSR": 0.4255, + "MMLU-PRO": 0.2894 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_MUSR", + "name": "_Spydaz_Web_AI_AGI_R1_MUSR", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4786, + "BBH": 0.4672, + "MATH Level 5": 0.0604, + "GPQA": 0.2844, + "MUSR": 0.4869, + "MMLU-PRO": 0.2828 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_MasterCoder", + "name": "_Spydaz_Web_AI_AGI_R1_MasterCoder", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4143, + "BBH": 0.4689, + "MATH Level 5": 0.0612, + "GPQA": 0.276, + "MUSR": 0.472, + "MMLU-PRO": 0.2719 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Math_001", + "name": "_Spydaz_Web_AI_AGI_R1_Math_001", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4571, + "BBH": 0.4818, + "MATH Level 5": 0.0695, + "GPQA": 0.2768, + "MUSR": 0.4778, + "MMLU-PRO": 0.2681 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Math_003", + "name": "_Spydaz_Web_AI_AGI_R1_Math_003", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.62, + "BBH": 0.4756, + "MATH Level 5": 0.0695, + "GPQA": 0.281, + "MUSR": 0.4202, + "MMLU-PRO": 0.2999 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Math_AdvancedStudent", + "name": "_Spydaz_Web_AI_AGI_R1_Math_AdvancedStudent", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5951, + "BBH": 0.4927, + "MATH Level 5": 0.0544, + "GPQA": 0.2919, + "MUSR": 0.5198, + "MMLU-PRO": 0.3 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Math_Student", + "name": "_Spydaz_Web_AI_AGI_R1_Math_Student", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5736, + "BBH": 0.4881, + "MATH Level 5": 0.0514, + "GPQA": 0.2903, + "MUSR": 0.5098, + "MMLU-PRO": 0.2927 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Math_Teacher", + "name": "_Spydaz_Web_AI_AGI_R1_Math_Teacher", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5772, + "BBH": 0.4805, + "MATH Level 5": 0.0544, + "GPQA": 0.2861, + "MUSR": 0.5222, + "MMLU-PRO": 0.2956 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_OmG_001", + "name": "_Spydaz_Web_AI_AGI_R1_OmG_001", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5818, + "BBH": 0.4908, + "MATH Level 5": 0.0506, + "GPQA": 0.3003, + "MUSR": 0.4486, + "MMLU-PRO": 0.2906 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_OmG_002", + "name": "_Spydaz_Web_AI_AGI_R1_OmG_002", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5462, + "BBH": 0.4655, + "MATH Level 5": 0.0498, + "GPQA": 0.2785, + "MUSR": 0.4511, + "MMLU-PRO": 0.2867 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_OmG_Coder", + "name": "_Spydaz_Web_AI_AGI_R1_OmG_Coder", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4924, + "BBH": 0.4638, + "MATH Level 5": 0.0544, + "GPQA": 0.2735, + "MUSR": 0.5625, + "MMLU-PRO": 0.289 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_OmG_Math", + "name": "_Spydaz_Web_AI_AGI_R1_OmG_Math", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5033, + "BBH": 0.4677, + "MATH Level 5": 0.0476, + "GPQA": 0.2827, + "MUSR": 0.4326, + "MMLU-PRO": 0.2913 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_OmG_MathMaster", + "name": "_Spydaz_Web_AI_AGI_R1_OmG_MathMaster", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5558, + "BBH": 0.4742, + "MATH Level 5": 0.0536, + "GPQA": 0.2878, + "MUSR": 0.451, + "MMLU-PRO": 0.2672 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Student_Coder", + "name": "_Spydaz_Web_AI_AGI_R1_Student_Coder", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.545, + "BBH": 0.4651, + "MATH Level 5": 0.0657, + "GPQA": 0.2844, + "MUSR": 0.4388, + "MMLU-PRO": 0.2768 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Teacher_Coder", + "name": "_Spydaz_Web_AI_AGI_R1_Teacher_Coder", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5082, + "BBH": 0.4797, + "MATH Level 5": 0.065, + "GPQA": 0.2911, + "MUSR": 0.4338, + "MMLU-PRO": 0.2845 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_Top_Student", + "name": "_Spydaz_Web_AI_AGI_R1_Top_Student", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.604, + "BBH": 0.4988, + "MATH Level 5": 0.0725, + "GPQA": 0.2727, + "MUSR": 0.5398, + "MMLU-PRO": 0.3024 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_X1", + "name": "_Spydaz_Web_AI_AGI_R1_X1", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4273, + "BBH": 0.4759, + "MATH Level 5": 0.0566, + "GPQA": 0.2601, + "MUSR": 0.4232, + "MMLU-PRO": 0.2891 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_R1_X2", + "name": "_Spydaz_Web_AI_AGI_R1_X2", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5434, + "BBH": 0.4786, + "MATH Level 5": 0.0612, + "GPQA": 0.2978, + "MUSR": 0.4695, + "MMLU-PRO": 0.2921 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_AGI_RP_R1", + "name": "_Spydaz_Web_AI_AGI_RP_R1", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.5426, + "BBH": 0.4701, + "MATH Level 5": 0.0604, + "GPQA": 0.2693, + "MUSR": 0.4201, + "MMLU-PRO": 0.2894 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_BIBLE_002", + "name": "_Spydaz_Web_AI_BIBLE_002", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2195, + "BBH": 0.3289, + "MATH Level 5": 0.0174, + "GPQA": 0.2844, + "MUSR": 0.3407, + "MMLU-PRO": 0.1368 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_ChatML_002", + "name": "_Spydaz_Web_AI_ChatML_002", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2412, + "BBH": 0.3106, + "MATH Level 5": 0.0113, + "GPQA": 0.2576, + "MUSR": 0.3623, + "MMLU-PRO": 0.1095 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_ChatQA", + "name": "_Spydaz_Web_AI_ChatQA", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.1415, + "BBH": 0.3236, + "MATH Level 5": 0.0098, + "GPQA": 0.2659, + "MUSR": 0.3447, + "MMLU-PRO": 0.1475 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_ChatQA_003", + "name": "_Spydaz_Web_AI_ChatQA_003", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.2209, + "BBH": 0.3172, + "MATH Level 5": 0.0106, + "GPQA": 0.271, + "MUSR": 0.3818, + "MMLU-PRO": 0.1133 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_TEMP_", + "name": "_Spydaz_Web_AI_TEMP_", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4795, + "BBH": 0.4957, + "MATH Level 5": 0.1239, + "GPQA": 0.2794, + "MUSR": 0.4218, + "MMLU-PRO": 0.3121 + } + }, + { + "model_id": "LeroyDyer/_Spydaz_Web_AI_Top_Teacher_", + "name": "_Spydaz_Web_AI_Top_Teacher_", + "developer": "LeroyDyer", + "scores": { + "IFEval": 0.4404, + "BBH": 0.4891, + "MATH Level 5": 0.1156, + "GPQA": 0.2777, + "MUSR": 0.4366, + "MMLU-PRO": 0.315 + } + }, + { + "model_id": "LightningRodLabs/Flashlight-v1.0", + "name": "Flashlight-v1.0", + "developer": "LightningRodLabs", + "scores": { + "IFEval": 0.6745, + "BBH": 0.6877, + "MATH Level 5": 0.497, + "GPQA": 0.3423, + "MUSR": 0.4101, + "MMLU-PRO": 0.5402 + } + }, + { + "model_id": "LightningRodLabs/Flashlight-v1.1", + "name": "Flashlight-v1.1", + "developer": "LightningRodLabs", + "scores": { + "IFEval": 0.6721, + "BBH": 0.6901, + "MATH Level 5": 0.5325, + "GPQA": 0.3398, + "MUSR": 0.4048, + "MMLU-PRO": 0.5416 + } + }, + { + "model_id": "LightningRodLabs/Flashlight-v1.2", + "name": "Flashlight-v1.2", + "developer": "LightningRodLabs", + "scores": { + "IFEval": 0.436, + "BBH": 0.3265, + "MATH Level 5": 0.1556, + "GPQA": 0.2357, + "MUSR": 0.4554, + "MMLU-PRO": 0.2485 + } + }, + { + "model_id": "Lil-R/2_PRYMMAL-ECE-2B-SLERP-V1", + "name": "2_PRYMMAL-ECE-2B-SLERP-V1", + "developer": "Lil-R", + "scores": { + "IFEval": 0.5823, + "BBH": 0.4287, + "MATH Level 5": 0.0914, + "GPQA": 0.3062, + "MUSR": 0.4375, + "MMLU-PRO": 0.2678 + } + }, + { + "model_id": "Lil-R/2_PRYMMAL-ECE-2B-SLERP-V2", + "name": "2_PRYMMAL-ECE-2B-SLERP-V2", + "developer": "Lil-R", + "scores": { + "IFEval": 0.5543, + "BBH": 0.4376, + "MATH Level 5": 0.0944, + "GPQA": 0.2978, + "MUSR": 0.4482, + "MMLU-PRO": 0.2744 + } + }, + { + "model_id": "Lil-R/2_PRYMMAL-ECE-7B-SLERP", + "name": "2_PRYMMAL-ECE-7B-SLERP", + "developer": "Lil-R", + "scores": { + "IFEval": 0.5577, + "BBH": 0.5557, + "MATH Level 5": 0.3633, + "GPQA": 0.3104, + "MUSR": 0.4396, + "MMLU-PRO": 0.4507 + } + }, + { + "model_id": "Lil-R/2_PRYMMAL-ECE-7B-SLERP-V1", + "name": "2_PRYMMAL-ECE-7B-SLERP-V1", + "developer": "Lil-R", + "scores": { + "IFEval": 0.1073, + "BBH": 0.3053, + "MATH Level 5": 0.0008, + "GPQA": 0.2508, + "MUSR": 0.3911, + "MMLU-PRO": 0.1124 + } + }, + { + "model_id": "Lil-R/2_PRYMMAL-ECE-7B-SLERP-V2", + "name": "2_PRYMMAL-ECE-7B-SLERP-V2", + "developer": "Lil-R", + "scores": { + "IFEval": 0.1073, + "BBH": 0.3053, + "MATH Level 5": 0.0008, + "GPQA": 0.2508, + "MUSR": 0.3911, + "MMLU-PRO": 0.1124 + } + }, + { + "model_id": "Lil-R/2_PRYMMAL-ECE-7B-SLERP-V3", + "name": "2_PRYMMAL-ECE-7B-SLERP-V3", + "developer": "Lil-R", + "scores": { + "IFEval": 0.2235, + "BBH": 0.3578, + "MATH Level 5": 0.006, + "GPQA": 0.2567, + "MUSR": 0.4107, + "MMLU-PRO": 0.1817 + } + }, + { + "model_id": "Lil-R/PRYMMAL-ECE-1B-SLERP-V1", + "name": "PRYMMAL-ECE-1B-SLERP-V1", + "developer": "Lil-R", + "scores": { + "IFEval": 0.2874, + "BBH": 0.419, + "MATH Level 5": 0.1035, + "GPQA": 0.276, + "MUSR": 0.3974, + "MMLU-PRO": 0.2926 + } + }, + { + "model_id": "Lil-R/PRYMMAL-ECE-7B-SLERP-V8", + "name": "PRYMMAL-ECE-7B-SLERP-V8", + "developer": "Lil-R", + "scores": { + "IFEval": 0.1258, + "BBH": 0.2955, + "MATH Level 5": 0.0098, + "GPQA": 0.25, + "MUSR": 0.3631, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "LilRg/10PRYMMAL-3B-slerp", + "name": "10PRYMMAL-3B-slerp", + "developer": "LilRg", + "scores": { + "IFEval": 0.1946, + "BBH": 0.532, + "MATH Level 5": 0.1495, + "GPQA": 0.3213, + "MUSR": 0.4529, + "MMLU-PRO": 0.3881 + } + }, + { + "model_id": "LilRg/ECE-1B-merge-PRYMMAL", + "name": "ECE-1B-merge-PRYMMAL", + "developer": "LilRg", + "scores": { + "IFEval": 0.2712, + "BBH": 0.4235, + "MATH Level 5": 0.1012, + "GPQA": 0.281, + "MUSR": 0.3801, + "MMLU-PRO": 0.2906 + } + }, + { + "model_id": "LilRg/ECE_Finetunning", + "name": "ECE_Finetunning", + "developer": "LilRg", + "scores": { + "IFEval": 0.0445, + "BBH": 0.4732, + "MATH Level 5": 0.0453, + "GPQA": 0.2827, + "MUSR": 0.3839, + "MMLU-PRO": 0.3191 + } + }, + { + "model_id": "LilRg/PRYMMAL-6B-slerp", + "name": "PRYMMAL-6B-slerp", + "developer": "LilRg", + "scores": { + "IFEval": 0.1153, + "BBH": 0.2868, + "MATH Level 5": 0.0, + "GPQA": 0.2458, + "MUSR": 0.3698, + "MMLU-PRO": 0.1108 + } + }, + { + "model_id": "LilRg/PRYMMAL-ECE-7B-SLERP-V3", + "name": "PRYMMAL-ECE-7B-SLERP-V3", + "developer": "LilRg", + "scores": { + "IFEval": 0.1243, + "BBH": 0.2957, + "MATH Level 5": 0.0098, + "GPQA": 0.2567, + "MUSR": 0.3671, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "LilRg/PRYMMAL-ECE-7B-SLERP-V4", + "name": "PRYMMAL-ECE-7B-SLERP-V4", + "developer": "LilRg", + "scores": { + "IFEval": 0.1249, + "BBH": 0.2957, + "MATH Level 5": 0.0098, + "GPQA": 0.2567, + "MUSR": 0.3671, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "LilRg/PRYMMAL-ECE-7B-SLERP-V5", + "name": "PRYMMAL-ECE-7B-SLERP-V5", + "developer": "LilRg", + "scores": { + "IFEval": 0.1249, + "BBH": 0.2957, + "MATH Level 5": 0.0098, + "GPQA": 0.2567, + "MUSR": 0.3671, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "LilRg/PRYMMAL-ECE-7B-SLERP-V6", + "name": "PRYMMAL-ECE-7B-SLERP-V6", + "developer": "LilRg", + "scores": { + "IFEval": 0.1243, + "BBH": 0.2957, + "MATH Level 5": 0.0098, + "GPQA": 0.2567, + "MUSR": 0.3671, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "LilRg/PRYMMAL-ECE-7B-SLERP-V7", + "name": "PRYMMAL-ECE-7B-SLERP-V7", + "developer": "LilRg", + "scores": { + "IFEval": 0.1249, + "BBH": 0.2957, + "MATH Level 5": 0.0098, + "GPQA": 0.2567, + "MUSR": 0.3671, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "LilRg/PRYMMAL-slerp-Merge", + "name": "PRYMMAL-slerp-Merge", + "developer": "LilRg", + "scores": { + "IFEval": 0.3044, + "BBH": 0.5364, + "MATH Level 5": 0.1616, + "GPQA": 0.3205, + "MUSR": 0.4635, + "MMLU-PRO": 0.3863 + } + }, + { + "model_id": "LimYeri/CodeMind-Llama3-8B-unsloth_v2-merged", + "name": "CodeMind-Llama3-8B-unsloth_v2-merged", + "developer": "LimYeri", + "scores": { + "IFEval": 0.6946, + "BBH": 0.486, + "MATH Level 5": 0.0665, + "GPQA": 0.2651, + "MUSR": 0.3316, + "MMLU-PRO": 0.3506 + } + }, + { + "model_id": "LimYeri/CodeMind-Llama3-8B-unsloth_v3-merged", + "name": "CodeMind-Llama3-8B-unsloth_v3-merged", + "developer": "LimYeri", + "scores": { + "IFEval": 0.6763, + "BBH": 0.4908, + "MATH Level 5": 0.068, + "GPQA": 0.2584, + "MUSR": 0.3356, + "MMLU-PRO": 0.3496 + } + }, + { + "model_id": "LimYeri/CodeMind-Llama3-8B-unsloth_v4-one-DPO-merged", + "name": "CodeMind-Llama3-8B-unsloth_v4-one-DPO-merged", + "developer": "LimYeri", + "scores": { + "IFEval": 0.6492, + "BBH": 0.4853, + "MATH Level 5": 0.068, + "GPQA": 0.2685, + "MUSR": 0.3608, + "MMLU-PRO": 0.3354 + } + }, + { + "model_id": "LimYeri/CodeMind-Llama3-8B-unsloth_v4-one-merged", + "name": "CodeMind-Llama3-8B-unsloth_v4-one-merged", + "developer": "LimYeri", + "scores": { + "IFEval": 0.3211, + "BBH": 0.4739, + "MATH Level 5": 0.0551, + "GPQA": 0.3096, + "MUSR": 0.4069, + "MMLU-PRO": 0.3353 + } + }, + { + "model_id": "LimYeri/CodeMind-Llama3.1-8B-unsloth-merged", + "name": "CodeMind-Llama3.1-8B-unsloth-merged", + "developer": "LimYeri", + "scores": { + "IFEval": 0.649, + "BBH": 0.4695, + "MATH Level 5": 0.1088, + "GPQA": 0.2643, + "MUSR": 0.3752, + "MMLU-PRO": 0.334 + } + }, + { + "model_id": "Locutusque/CollectiveLM-Falcon-3-7B", + "name": "CollectiveLM-Falcon-3-7B", + "developer": "Locutusque", + "scores": { + "IFEval": 0.3918, + "BBH": 0.5105, + "MATH Level 5": 0.2183, + "GPQA": 0.3255, + "MUSR": 0.3887, + "MMLU-PRO": 0.3599 + } + }, + { + "model_id": "Locutusque/Hercules-6.0-Llama-3.1-8B", + "name": "Hercules-6.0-Llama-3.1-8B", + "developer": "Locutusque", + "scores": { + "IFEval": 0.663, + "BBH": 0.4813, + "MATH Level 5": 0.1669, + "GPQA": 0.2643, + "MUSR": 0.3621, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "Locutusque/Hercules-6.1-Llama-3.1-8B", + "name": "Hercules-6.1-Llama-3.1-8B", + "developer": "Locutusque", + "scores": { + "IFEval": 0.6007, + "BBH": 0.4656, + "MATH Level 5": 0.176, + "GPQA": 0.2609, + "MUSR": 0.3553, + "MMLU-PRO": 0.3669 + } + }, + { + "model_id": "Locutusque/Llama-3-NeuralHercules-5.0-8B", + "name": "Llama-3-NeuralHercules-5.0-8B", + "developer": "Locutusque", + "scores": { + "IFEval": 0.4489, + "BBH": 0.394, + "MATH Level 5": 0.0431, + "GPQA": 0.2685, + "MUSR": 0.3881, + "MMLU-PRO": 0.2933 + } + }, + { + "model_id": "Locutusque/Llama-3-Yggdrasil-2.0-8B", + "name": "Llama-3-Yggdrasil-2.0-8B", + "developer": "Locutusque", + "scores": { + "IFEval": 0.5371, + "BBH": 0.4772, + "MATH Level 5": 0.0831, + "GPQA": 0.2626, + "MUSR": 0.3977, + "MMLU-PRO": 0.3167 + } + }, + { + "model_id": "Locutusque/TinyMistral-248M-v2.5", + "name": "TinyMistral-248M-v2.5", + "developer": "Locutusque", + "scores": { + "IFEval": 0.1336, + "BBH": 0.3039, + "MATH Level 5": 0.0098, + "GPQA": 0.2508, + "MUSR": 0.3782, + "MMLU-PRO": 0.1135 + } + }, + { + "model_id": "Luni/StarDust-12b-v1", + "name": "StarDust-12b-v1", + "developer": "Luni", + "scores": { + "IFEval": 0.5459, + "BBH": 0.5366, + "MATH Level 5": 0.0763, + "GPQA": 0.276, + "MUSR": 0.4324, + "MMLU-PRO": 0.3412 + } + }, + { + "model_id": "Luni/StarDust-12b-v2", + "name": "StarDust-12b-v2", + "developer": "Luni", + "scores": { + "IFEval": 0.5629, + "BBH": 0.5419, + "MATH Level 5": 0.0687, + "GPQA": 0.2936, + "MUSR": 0.4338, + "MMLU-PRO": 0.3439 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v3", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v3", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7049, + "BBH": 0.6478, + "MATH Level 5": 0.4162, + "GPQA": 0.3817, + "MUSR": 0.4808, + "MMLU-PRO": 0.5394 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v4", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v4", + "developer": "Lunzima", + "scores": { + "IFEval": 0.6943, + "BBH": 0.642, + "MATH Level 5": 0.3467, + "GPQA": 0.3716, + "MUSR": 0.4769, + "MMLU-PRO": 0.5252 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v5", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v5", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7485, + "BBH": 0.6467, + "MATH Level 5": 0.4358, + "GPQA": 0.3624, + "MUSR": 0.4473, + "MMLU-PRO": 0.514 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v6", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v6", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7043, + "BBH": 0.6458, + "MATH Level 5": 0.3958, + "GPQA": 0.3775, + "MUSR": 0.4768, + "MMLU-PRO": 0.5392 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v6-cpt", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v6-cpt", + "developer": "Lunzima", + "scores": { + "IFEval": 0.4663, + "BBH": 0.6215, + "MATH Level 5": 0.3316, + "GPQA": 0.3758, + "MUSR": 0.4937, + "MMLU-PRO": 0.5204 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v7", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v7", + "developer": "Lunzima", + "scores": { + "IFEval": 0.6794, + "BBH": 0.6531, + "MATH Level 5": 0.4101, + "GPQA": 0.3792, + "MUSR": 0.4834, + "MMLU-PRO": 0.5376 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v7-rebase", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v7-rebase", + "developer": "Lunzima", + "scores": { + "IFEval": 0.6931, + "BBH": 0.6423, + "MATH Level 5": 0.3406, + "GPQA": 0.375, + "MUSR": 0.4888, + "MMLU-PRO": 0.5277 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v8", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v8", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7875, + "BBH": 0.6419, + "MATH Level 5": 0.5559, + "GPQA": 0.3356, + "MUSR": 0.4394, + "MMLU-PRO": 0.5206 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v8.5", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v8.5", + "developer": "Lunzima", + "scores": { + "IFEval": 0.5929, + "BBH": 0.6451, + "MATH Level 5": 0.3656, + "GPQA": 0.38, + "MUSR": 0.477, + "MMLU-PRO": 0.529 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v8.6", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v8.6", + "developer": "Lunzima", + "scores": { + "IFEval": 0.5919, + "BBH": 0.6457, + "MATH Level 5": 0.4071, + "GPQA": 0.3842, + "MUSR": 0.4953, + "MMLU-PRO": 0.54 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v8.7", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v8.7", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7875, + "BBH": 0.6483, + "MATH Level 5": 0.5408, + "GPQA": 0.3515, + "MUSR": 0.4381, + "MMLU-PRO": 0.5242 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v8.8", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v8.8", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7028, + "BBH": 0.6566, + "MATH Level 5": 0.4237, + "GPQA": 0.3758, + "MUSR": 0.4912, + "MMLU-PRO": 0.5323 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v8.9", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v8.9", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7993, + "BBH": 0.6483, + "MATH Level 5": 0.537, + "GPQA": 0.3297, + "MUSR": 0.4328, + "MMLU-PRO": 0.5199 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v9", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v9", + "developer": "Lunzima", + "scores": { + "IFEval": 0.5235, + "BBH": 0.6546, + "MATH Level 5": 0.4366, + "GPQA": 0.3884, + "MUSR": 0.4806, + "MMLU-PRO": 0.5422 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v9-stock", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v9-stock", + "developer": "Lunzima", + "scores": { + "IFEval": 0.6514, + "BBH": 0.6571, + "MATH Level 5": 0.4184, + "GPQA": 0.3842, + "MUSR": 0.482, + "MMLU-PRO": 0.5412 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v9.1", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v9.1", + "developer": "Lunzima", + "scores": { + "IFEval": 0.8003, + "BBH": 0.6555, + "MATH Level 5": 0.5468, + "GPQA": 0.3431, + "MUSR": 0.4354, + "MMLU-PRO": 0.5251 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-MegaFusion-v9.2", + "name": "NQLSG-Qwen2.5-14B-MegaFusion-v9.2", + "developer": "Lunzima", + "scores": { + "IFEval": 0.7862, + "BBH": 0.6538, + "MATH Level 5": 0.5332, + "GPQA": 0.3557, + "MUSR": 0.4381, + "MMLU-PRO": 0.5283 + } + }, + { + "model_id": "Lunzima/NQLSG-Qwen2.5-14B-OriginalFusion", + "name": "NQLSG-Qwen2.5-14B-OriginalFusion", + "developer": "Lunzima", + "scores": { + "IFEval": 0.6142, + "BBH": 0.6592, + "MATH Level 5": 0.4275, + "GPQA": 0.3809, + "MUSR": 0.5122, + "MMLU-PRO": 0.5239 + } + }, + { + "model_id": "Lyte/Llama-3.1-8B-Instruct-Reasoner-1o1_v0.3", + "name": "Llama-3.1-8B-Instruct-Reasoner-1o1_v0.3", + "developer": "Lyte", + "scores": { + "IFEval": 0.7098, + "BBH": 0.495, + "MATH Level 5": 0.1903, + "GPQA": 0.2701, + "MUSR": 0.3461, + "MMLU-PRO": 0.3618 + } + }, + { + "model_id": "Lyte/Llama-3.2-1B-Instruct-COT-RL-Expriement1-EP04", + "name": "Llama-3.2-1B-Instruct-COT-RL-Expriement1-EP04", + "developer": "Lyte", + "scores": { + "IFEval": 0.5774, + "BBH": 0.3515, + "MATH Level 5": 0.0801, + "GPQA": 0.2601, + "MUSR": 0.3236, + "MMLU-PRO": 0.1843 + } + }, + { + "model_id": "Lyte/Llama-3.2-3B-Overthinker", + "name": "Llama-3.2-3B-Overthinker", + "developer": "Lyte", + "scores": { + "IFEval": 0.6408, + "BBH": 0.432, + "MATH Level 5": 0.1563, + "GPQA": 0.2592, + "MUSR": 0.3419, + "MMLU-PRO": 0.2985 + } + }, + { + "model_id": "M4-ai/TinyMistral-248M-v3", + "name": "TinyMistral-248M-v3", + "developer": "M4-ai", + "scores": { + "IFEval": 0.1639, + "BBH": 0.2885, + "MATH Level 5": 0.0045, + "GPQA": 0.2408, + "MUSR": 0.3793, + "MMLU-PRO": 0.1132 + } + }, + { + "model_id": "MEscriva/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis", + "name": "ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis", + "developer": "MEscriva", + "scores": { + "IFEval": 0.0866, + "BBH": 0.3057, + "MATH Level 5": 0.0106, + "GPQA": 0.2517, + "MUSR": 0.4017, + "MMLU-PRO": 0.1154 + } + }, + { + "model_id": "MLP-KTLim/llama-3-Korean-Bllossom-8B", + "name": "llama-3-Korean-Bllossom-8B", + "developer": "MLP-KTLim", + "scores": { + "IFEval": 0.5113, + "BBH": 0.49, + "MATH Level 5": 0.102, + "GPQA": 0.2626, + "MUSR": 0.3675, + "MMLU-PRO": 0.3594 + } + }, + { + "model_id": "MTSAIR/Cotype-Nano", + "name": "Cotype-Nano", + "developer": "MTSAIR", + "scores": { + "IFEval": 0.3748, + "BBH": 0.3865, + "MATH Level 5": 0.0974, + "GPQA": 0.2701, + "MUSR": 0.3289, + "MMLU-PRO": 0.2477 + } + }, + { + "model_id": "MTSAIR/MultiVerse_70B", + "name": "MultiVerse_70B", + "developer": "MTSAIR", + "scores": { + "IFEval": 0.5249, + "BBH": 0.6183, + "MATH Level 5": 0.1926, + "GPQA": 0.354, + "MUSR": 0.474, + "MMLU-PRO": 0.486 + } + }, + { + "model_id": "Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.1", + "name": "Llama-3-8B-Magpie-Align-SFT-v0.1", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.4361, + "BBH": 0.4615, + "MATH Level 5": 0.0574, + "GPQA": 0.2626, + "MUSR": 0.3277, + "MMLU-PRO": 0.2863 + } + }, + { + "model_id": "Magpie-Align/Llama-3-8B-Magpie-Align-SFT-v0.3", + "name": "Llama-3-8B-Magpie-Align-SFT-v0.3", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.5064, + "BBH": 0.4572, + "MATH Level 5": 0.0733, + "GPQA": 0.2659, + "MUSR": 0.3424, + "MMLU-PRO": 0.2902 + } + }, + { + "model_id": "Magpie-Align/Llama-3-8B-Magpie-Align-v0.1", + "name": "Llama-3-8B-Magpie-Align-v0.1", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.4027, + "BBH": 0.4789, + "MATH Level 5": 0.0461, + "GPQA": 0.2768, + "MUSR": 0.3087, + "MMLU-PRO": 0.3001 + } + }, + { + "model_id": "Magpie-Align/Llama-3-8B-Magpie-Align-v0.3", + "name": "Llama-3-8B-Magpie-Align-v0.3", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.4497, + "BBH": 0.457, + "MATH Level 5": 0.0566, + "GPQA": 0.2651, + "MUSR": 0.3406, + "MMLU-PRO": 0.3134 + } + }, + { + "model_id": "Magpie-Align/Llama-3.1-8B-Magpie-Align-SFT-v0.1", + "name": "Llama-3.1-8B-Magpie-Align-SFT-v0.1", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.4782, + "BBH": 0.4764, + "MATH Level 5": 0.0899, + "GPQA": 0.2609, + "MUSR": 0.3397, + "MMLU-PRO": 0.2943 + } + }, + { + "model_id": "Magpie-Align/Llama-3.1-8B-Magpie-Align-v0.1", + "name": "Llama-3.1-8B-Magpie-Align-v0.1", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.4458, + "BBH": 0.4622, + "MATH Level 5": 0.0665, + "GPQA": 0.2634, + "MUSR": 0.3141, + "MMLU-PRO": 0.3262 + } + }, + { + "model_id": "Magpie-Align/MagpieLM-8B-Chat-v0.1", + "name": "MagpieLM-8B-Chat-v0.1", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.3701, + "BBH": 0.4172, + "MATH Level 5": 0.0612, + "GPQA": 0.2617, + "MUSR": 0.3501, + "MMLU-PRO": 0.3195 + } + }, + { + "model_id": "Magpie-Align/MagpieLM-8B-SFT-v0.1", + "name": "MagpieLM-8B-SFT-v0.1", + "developer": "Magpie-Align", + "scores": { + "IFEval": 0.4721, + "BBH": 0.4553, + "MATH Level 5": 0.0755, + "GPQA": 0.2676, + "MUSR": 0.3649, + "MMLU-PRO": 0.299 + } + }, + { + "model_id": "MagusCorp/grpo_lora_enem_llama3_7b", + "name": "grpo_lora_enem_llama3_7b", + "developer": "MagusCorp", + "scores": { + "IFEval": 0.4724, + "BBH": 0.4801, + "MATH Level 5": 0.1216, + "GPQA": 0.3096, + "MUSR": 0.3971, + "MMLU-PRO": 0.3574 + } + }, + { + "model_id": "ManoloPueblo/ContentCuisine_1-7B-slerp", + "name": "ContentCuisine_1-7B-slerp", + "developer": "ManoloPueblo", + "scores": { + "IFEval": 0.3907, + "BBH": 0.5188, + "MATH Level 5": 0.0733, + "GPQA": 0.3029, + "MUSR": 0.4672, + "MMLU-PRO": 0.3054 + } + }, + { + "model_id": "ManoloPueblo/LLM_MERGE_CC2", + "name": "LLM_MERGE_CC2", + "developer": "ManoloPueblo", + "scores": { + "IFEval": 0.3853, + "BBH": 0.5209, + "MATH Level 5": 0.0642, + "GPQA": 0.3045, + "MUSR": 0.4593, + "MMLU-PRO": 0.3032 + } + }, + { + "model_id": "ManoloPueblo/LLM_MERGE_CC3", + "name": "LLM_MERGE_CC3", + "developer": "ManoloPueblo", + "scores": { + "IFEval": 0.3959, + "BBH": 0.5246, + "MATH Level 5": 0.0793, + "GPQA": 0.3096, + "MUSR": 0.4672, + "MMLU-PRO": 0.3156 + } + }, + { + "model_id": "MarinaraSpaghetti/NemoReRemix-12B", + "name": "NemoReRemix-12B", + "developer": "MarinaraSpaghetti", + "scores": { + "IFEval": 0.3343, + "BBH": 0.5537, + "MATH Level 5": 0.0906, + "GPQA": 0.318, + "MUSR": 0.4501, + "MMLU-PRO": 0.3598 + } + }, + { + "model_id": "MarinaraSpaghetti/Nemomix-v4.0-12B", + "name": "Nemomix-v4.0-12B", + "developer": "MarinaraSpaghetti", + "scores": { + "IFEval": 0.5575, + "BBH": 0.5275, + "MATH Level 5": 0.108, + "GPQA": 0.2919, + "MUSR": 0.4244, + "MMLU-PRO": 0.3613 + } + }, + { + "model_id": "Marsouuu/MiniMathExpert-2_61B-ECE-PRYMMAL-Martial", + "name": "MiniMathExpert-2_61B-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.2548, + "BBH": 0.3953, + "MATH Level 5": 0.074, + "GPQA": 0.2752, + "MUSR": 0.4083, + "MMLU-PRO": 0.2274 + } + }, + { + "model_id": "Marsouuu/MiniQwenMathExpert-ECE-PRYMMAL-Martial", + "name": "MiniQwenMathExpert-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.2795, + "BBH": 0.423, + "MATH Level 5": 0.114, + "GPQA": 0.2819, + "MUSR": 0.3867, + "MMLU-PRO": 0.2922 + } + }, + { + "model_id": "Marsouuu/MistralBase-4x7B-MoE-ECE-PRYMMAL-Martial", + "name": "MistralBase-4x7B-MoE-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.1697, + "BBH": 0.3464, + "MATH Level 5": 0.0144, + "GPQA": 0.2592, + "MUSR": 0.3991, + "MMLU-PRO": 0.1379 + } + }, + { + "model_id": "Marsouuu/general3B-ECE-PRYMMAL-Martial", + "name": "general3B-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.2722, + "BBH": 0.5394, + "MATH Level 5": 0.1548, + "GPQA": 0.3196, + "MUSR": 0.4701, + "MMLU-PRO": 0.3876 + } + }, + { + "model_id": "Marsouuu/general3Bv2-ECE-PRYMMAL-Martial", + "name": "general3Bv2-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.5693, + "BBH": 0.5637, + "MATH Level 5": 0.3671, + "GPQA": 0.3104, + "MUSR": 0.4396, + "MMLU-PRO": 0.4498 + } + }, + { + "model_id": "Marsouuu/lareneg1_78B-ECE-PRYMMAL-Martial", + "name": "lareneg1_78B-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.2795, + "BBH": 0.423, + "MATH Level 5": 0.114, + "GPQA": 0.2819, + "MUSR": 0.3867, + "MMLU-PRO": 0.2922 + } + }, + { + "model_id": "Marsouuu/lareneg3B-ECE-PRYMMAL-Martial", + "name": "lareneg3B-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.3303, + "BBH": 0.5453, + "MATH Level 5": 0.1518, + "GPQA": 0.3247, + "MUSR": 0.4725, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "Marsouuu/lareneg3Bv2-ECE-PRYMMAL-Martial", + "name": "lareneg3Bv2-ECE-PRYMMAL-Martial", + "developer": "Marsouuu", + "scores": { + "IFEval": 0.5753, + "BBH": 0.5623, + "MATH Level 5": 0.3656, + "GPQA": 0.3196, + "MUSR": 0.4369, + "MMLU-PRO": 0.4511 + } + }, + { + "model_id": "MaziyarPanahi/Calme-4x7B-MoE-v0.1", + "name": "Calme-4x7B-MoE-v0.1", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.4315, + "BBH": 0.5103, + "MATH Level 5": 0.0801, + "GPQA": 0.2819, + "MUSR": 0.4199, + "MMLU-PRO": 0.3057 + } + }, + { + "model_id": "MaziyarPanahi/Calme-4x7B-MoE-v0.2", + "name": "Calme-4x7B-MoE-v0.2", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.4294, + "BBH": 0.5111, + "MATH Level 5": 0.074, + "GPQA": 0.2794, + "MUSR": 0.4318, + "MMLU-PRO": 0.3058 + } + }, + { + "model_id": "MaziyarPanahi/Llama-3-70B-Instruct-v0.1", + "name": "Llama-3-70B-Instruct-v0.1", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.4714, + "BBH": 0.5366, + "MATH Level 5": 0.1805, + "GPQA": 0.2844, + "MUSR": 0.4433, + "MMLU-PRO": 0.4618 + } + }, + { + "model_id": "MaziyarPanahi/Llama-3-8B-Instruct-v0.10", + "name": "Llama-3-8B-Instruct-v0.10", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.7667, + "BBH": 0.4924, + "MATH Level 5": 0.0574, + "GPQA": 0.3087, + "MUSR": 0.4214, + "MMLU-PRO": 0.3862 + } + }, + { + "model_id": "MaziyarPanahi/Llama-3-8B-Instruct-v0.8", + "name": "Llama-3-8B-Instruct-v0.8", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.7528, + "BBH": 0.4963, + "MATH Level 5": 0.0778, + "GPQA": 0.3054, + "MUSR": 0.4202, + "MMLU-PRO": 0.3853 + } + }, + { + "model_id": "MaziyarPanahi/Llama-3-8B-Instruct-v0.9", + "name": "Llama-3-8B-Instruct-v0.9", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.763, + "BBH": 0.4936, + "MATH Level 5": 0.0733, + "GPQA": 0.3079, + "MUSR": 0.4148, + "MMLU-PRO": 0.3846 + } + }, + { + "model_id": "MaziyarPanahi/Qwen1.5-MoE-A2.7B-Wikihow", + "name": "Qwen1.5-MoE-A2.7B-Wikihow", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.2954, + "BBH": 0.392, + "MATH Level 5": 0.0823, + "GPQA": 0.2752, + "MUSR": 0.3502, + "MMLU-PRO": 0.238 + } + }, + { + "model_id": "MaziyarPanahi/Qwen2-7B-Instruct-v0.1", + "name": "Qwen2-7B-Instruct-v0.1", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.3352, + "BBH": 0.5123, + "MATH Level 5": 0.2213, + "GPQA": 0.2852, + "MUSR": 0.4435, + "MMLU-PRO": 0.3857 + } + }, + { + "model_id": "MaziyarPanahi/Qwen2-7B-Instruct-v0.8", + "name": "Qwen2-7B-Instruct-v0.8", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.2775, + "BBH": 0.4637, + "MATH Level 5": 0.1767, + "GPQA": 0.2936, + "MUSR": 0.4293, + "MMLU-PRO": 0.3566 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.1-llama3.1-70b", + "name": "calme-2.1-llama3.1-70b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8434, + "BBH": 0.6448, + "MATH Level 5": 0.4101, + "GPQA": 0.328, + "MUSR": 0.438, + "MMLU-PRO": 0.5283 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.1-phi3-4b", + "name": "calme-2.1-phi3-4b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.5525, + "BBH": 0.5595, + "MATH Level 5": 0.1314, + "GPQA": 0.3297, + "MUSR": 0.4015, + "MMLU-PRO": 0.3746 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.1-phi3.5-4b", + "name": "calme-2.1-phi3.5-4b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.5659, + "BBH": 0.5484, + "MATH Level 5": 0.2039, + "GPQA": 0.344, + "MUSR": 0.3995, + "MMLU-PRO": 0.3935 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.1-qwen2-72b", + "name": "calme-2.1-qwen2-72b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8163, + "BBH": 0.6966, + "MATH Level 5": 0.4079, + "GPQA": 0.3809, + "MUSR": 0.4732, + "MMLU-PRO": 0.5415 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.1-qwen2-7b", + "name": "calme-2.1-qwen2-7b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.3816, + "BBH": 0.5046, + "MATH Level 5": 0.2311, + "GPQA": 0.2894, + "MUSR": 0.4437, + "MMLU-PRO": 0.3693 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.1-qwen2.5-72b", + "name": "calme-2.1-qwen2.5-72b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8662, + "BBH": 0.7262, + "MATH Level 5": 0.5914, + "GPQA": 0.3633, + "MUSR": 0.4298, + "MMLU-PRO": 0.5619 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.1-rys-78b", + "name": "calme-2.1-rys-78b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8136, + "BBH": 0.7098, + "MATH Level 5": 0.3943, + "GPQA": 0.3943, + "MUSR": 0.4693, + "MMLU-PRO": 0.5444 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.2-llama3-70b", + "name": "calme-2.2-llama3-70b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8208, + "BBH": 0.6435, + "MATH Level 5": 0.2394, + "GPQA": 0.3414, + "MUSR": 0.4446, + "MMLU-PRO": 0.5207 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.2-llama3.1-70b", + "name": "calme-2.2-llama3.1-70b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8593, + "BBH": 0.6793, + "MATH Level 5": 0.4366, + "GPQA": 0.3247, + "MUSR": 0.4542, + "MMLU-PRO": 0.5415 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.2-phi3-4b", + "name": "calme-2.2-phi3-4b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.5069, + "BBH": 0.553, + "MATH Level 5": 0.145, + "GPQA": 0.3213, + "MUSR": 0.3976, + "MMLU-PRO": 0.3814 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.2-qwen2-72b", + "name": "calme-2.2-qwen2-72b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8008, + "BBH": 0.694, + "MATH Level 5": 0.4532, + "GPQA": 0.3742, + "MUSR": 0.4508, + "MMLU-PRO": 0.5435 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.2-qwen2-7b", + "name": "calme-2.2-qwen2-7b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.3597, + "BBH": 0.5215, + "MATH Level 5": 0.2145, + "GPQA": 0.2911, + "MUSR": 0.4358, + "MMLU-PRO": 0.3899 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.2-qwen2.5-72b", + "name": "calme-2.2-qwen2.5-72b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8477, + "BBH": 0.7276, + "MATH Level 5": 0.5891, + "GPQA": 0.3591, + "MUSR": 0.4207, + "MMLU-PRO": 0.5618 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.2-rys-78b", + "name": "calme-2.2-rys-78b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.7986, + "BBH": 0.7081, + "MATH Level 5": 0.4071, + "GPQA": 0.4069, + "MUSR": 0.4536, + "MMLU-PRO": 0.5386 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.3-llama3-70b", + "name": "calme-2.3-llama3-70b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.801, + "BBH": 0.6399, + "MATH Level 5": 0.2326, + "GPQA": 0.3381, + "MUSR": 0.4261, + "MMLU-PRO": 0.5204 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.3-llama3.1-70b", + "name": "calme-2.3-llama3.1-70b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8605, + "BBH": 0.6872, + "MATH Level 5": 0.3927, + "GPQA": 0.344, + "MUSR": 0.4568, + "MMLU-PRO": 0.5363 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.3-phi3-4b", + "name": "calme-2.3-phi3-4b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.4926, + "BBH": 0.5538, + "MATH Level 5": 0.1473, + "GPQA": 0.318, + "MUSR": 0.3988, + "MMLU-PRO": 0.3828 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.3-qwen2-72b", + "name": "calme-2.3-qwen2-72b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.385, + "BBH": 0.6576, + "MATH Level 5": 0.3172, + "GPQA": 0.3716, + "MUSR": 0.4112, + "MMLU-PRO": 0.5419 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.3-qwen2-7b", + "name": "calme-2.3-qwen2-7b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.3825, + "BBH": 0.5064, + "MATH Level 5": 0.2069, + "GPQA": 0.297, + "MUSR": 0.4422, + "MMLU-PRO": 0.3611 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.3-rys-78b", + "name": "calme-2.3-rys-78b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8066, + "BBH": 0.7108, + "MATH Level 5": 0.398, + "GPQA": 0.4044, + "MUSR": 0.4549, + "MMLU-PRO": 0.5475 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.4-llama3-70b", + "name": "calme-2.4-llama3-70b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.5027, + "BBH": 0.6418, + "MATH Level 5": 0.2447, + "GPQA": 0.3398, + "MUSR": 0.4288, + "MMLU-PRO": 0.5204 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.4-qwen2-7b", + "name": "calme-2.4-qwen2-7b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.33, + "BBH": 0.5101, + "MATH Level 5": 0.2032, + "GPQA": 0.2836, + "MUSR": 0.4453, + "MMLU-PRO": 0.3977 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.4-rys-78b", + "name": "calme-2.4-rys-78b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8011, + "BBH": 0.728, + "MATH Level 5": 0.4071, + "GPQA": 0.4027, + "MUSR": 0.5771, + "MMLU-PRO": 0.7002 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.5-qwen2-7b", + "name": "calme-2.5-qwen2-7b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.3145, + "BBH": 0.4887, + "MATH Level 5": 0.2258, + "GPQA": 0.3104, + "MUSR": 0.4565, + "MMLU-PRO": 0.3682 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.6-qwen2-7b", + "name": "calme-2.6-qwen2-7b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.3443, + "BBH": 0.493, + "MATH Level 5": 0.1216, + "GPQA": 0.2844, + "MUSR": 0.4586, + "MMLU-PRO": 0.3732 + } + }, + { + "model_id": "MaziyarPanahi/calme-2.7-qwen2-7b", + "name": "calme-2.7-qwen2-7b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.3592, + "BBH": 0.4883, + "MATH Level 5": 0.1382, + "GPQA": 0.2911, + "MUSR": 0.4824, + "MMLU-PRO": 0.3705 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.1-baguette-3b", + "name": "calme-3.1-baguette-3b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.6234, + "BBH": 0.4683, + "MATH Level 5": 0.256, + "GPQA": 0.2861, + "MUSR": 0.4008, + "MMLU-PRO": 0.3399 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.1-instruct-3b", + "name": "calme-3.1-instruct-3b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.4336, + "BBH": 0.4813, + "MATH Level 5": 0.1775, + "GPQA": 0.2861, + "MUSR": 0.3952, + "MMLU-PRO": 0.3557 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.1-instruct-78b", + "name": "calme-3.1-instruct-78b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8136, + "BBH": 0.7305, + "MATH Level 5": 0.3927, + "GPQA": 0.396, + "MUSR": 0.5891, + "MMLU-PRO": 0.7185 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.1-llamaloi-3b", + "name": "calme-3.1-llamaloi-3b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.7375, + "BBH": 0.4587, + "MATH Level 5": 0.173, + "GPQA": 0.281, + "MUSR": 0.3515, + "MMLU-PRO": 0.3205 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.2-baguette-3b", + "name": "calme-3.2-baguette-3b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.6338, + "BBH": 0.4709, + "MATH Level 5": 0.2825, + "GPQA": 0.2945, + "MUSR": 0.4021, + "MMLU-PRO": 0.3338 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.2-instruct-3b", + "name": "calme-3.2-instruct-3b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.5533, + "BBH": 0.4866, + "MATH Level 5": 0.2168, + "GPQA": 0.2836, + "MUSR": 0.4047, + "MMLU-PRO": 0.3653 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.2-instruct-78b", + "name": "calme-3.2-instruct-78b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.8063, + "BBH": 0.7319, + "MATH Level 5": 0.4033, + "GPQA": 0.4027, + "MUSR": 0.6024, + "MMLU-PRO": 0.7303 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.3-baguette-3b", + "name": "calme-3.3-baguette-3b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.636, + "BBH": 0.4678, + "MATH Level 5": 0.3807, + "GPQA": 0.2802, + "MUSR": 0.3928, + "MMLU-PRO": 0.3342 + } + }, + { + "model_id": "MaziyarPanahi/calme-3.3-instruct-3b", + "name": "calme-3.3-instruct-3b", + "developer": "MaziyarPanahi", + "scores": { + "IFEval": 0.6423, + "BBH": 0.4693, + "MATH Level 5": 0.3739, + "GPQA": 0.2827, + "MUSR": 0.4074, + "MMLU-PRO": 0.3305 + } + }, + { + "model_id": "Minami-su/Amara-o1-7B-Qwen", + "name": "Amara-o1-7B-Qwen", + "developer": "Minami-su", + "scores": { + "IFEval": 0.739, + "BBH": 0.5199, + "MATH Level 5": 0.5181, + "GPQA": 0.2936, + "MUSR": 0.4007, + "MMLU-PRO": 0.4083 + } + }, + { + "model_id": "Minami-su/Amara-o2-7B-Qwen", + "name": "Amara-o2-7B-Qwen", + "developer": "Minami-su", + "scores": { + "IFEval": 0.7147, + "BBH": 0.5173, + "MATH Level 5": 0.4086, + "GPQA": 0.2634, + "MUSR": 0.3781, + "MMLU-PRO": 0.4165 + } + }, + { + "model_id": "Minami-su/test-7B-00", + "name": "test-7B-00", + "developer": "Minami-su", + "scores": { + "IFEval": 0.669, + "BBH": 0.4466, + "MATH Level 5": 0.4517, + "GPQA": 0.3029, + "MUSR": 0.4126, + "MMLU-PRO": 0.3588 + } + }, + { + "model_id": "Minami-su/test-7B-01", + "name": "test-7B-01", + "developer": "Minami-su", + "scores": { + "IFEval": 0.6736, + "BBH": 0.4422, + "MATH Level 5": 0.4554, + "GPQA": 0.307, + "MUSR": 0.4153, + "MMLU-PRO": 0.3536 + } + }, + { + "model_id": "Minami-su/test-v2-7B-00", + "name": "test-v2-7B-00", + "developer": "Minami-su", + "scores": { + "IFEval": 0.6747, + "BBH": 0.4416, + "MATH Level 5": 0.4418, + "GPQA": 0.2919, + "MUSR": 0.4154, + "MMLU-PRO": 0.3472 + } + }, + { + "model_id": "ModelCloud/Llama-3.2-1B-Instruct-gptqmodel-4bit-vortex-v1", + "name": "Llama-3.2-1B-Instruct-gptqmodel-4bit-vortex-v1", + "developer": "ModelCloud", + "scores": { + "IFEval": 0.5269, + "BBH": 0.3253, + "MATH Level 5": 0.0604, + "GPQA": 0.2534, + "MUSR": 0.3249, + "MMLU-PRO": 0.1764 + } + }, + { + "model_id": "ModelSpace/GemmaX2-28-9B-v0.1", + "name": "GemmaX2-28-9B-v0.1", + "developer": "ModelSpace", + "scores": { + "IFEval": 0.0039, + "BBH": 0.3687, + "MATH Level 5": 0.0272, + "GPQA": 0.2768, + "MUSR": 0.3537, + "MMLU-PRO": 0.2231 + } + }, + { + "model_id": "MoonRide/Llama-3.2-3B-Khelavaster", + "name": "Llama-3.2-3B-Khelavaster", + "developer": "MoonRide", + "scores": { + "IFEval": 0.4925, + "BBH": 0.4516, + "MATH Level 5": 0.1616, + "GPQA": 0.2777, + "MUSR": 0.3699, + "MMLU-PRO": 0.3122 + } + }, + { + "model_id": "Mostafa8Mehrabi/llama-3.2-1b-Insomnia-ChatBot-merged", + "name": "llama-3.2-1b-Insomnia-ChatBot-merged", + "developer": "Mostafa8Mehrabi", + "scores": { + "IFEval": 0.1321, + "BBH": 0.3004, + "MATH Level 5": 0.0076, + "GPQA": 0.2366, + "MUSR": 0.3382, + "MMLU-PRO": 0.1131 + } + }, + { + "model_id": "MrRobotoAI/MrRoboto-ProLong-8b-v4i", + "name": "MrRoboto-ProLong-8b-v4i", + "developer": "MrRobotoAI", + "scores": { + "IFEval": 0.3835, + "BBH": 0.4585, + "MATH Level 5": 0.0551, + "GPQA": 0.2894, + "MUSR": 0.4014, + "MMLU-PRO": 0.3068 + } + }, + { + "model_id": "MrRobotoAI/MrRoboto-ProLongBASE-pt8-unaligned-8b", + "name": "MrRoboto-ProLongBASE-pt8-unaligned-8b", + "developer": "MrRobotoAI", + "scores": { + "IFEval": 0.3475, + "BBH": 0.4515, + "MATH Level 5": 0.0423, + "GPQA": 0.281, + "MUSR": 0.4279, + "MMLU-PRO": 0.2566 + } + }, + { + "model_id": "MultivexAI/Gladiator-Mini-Exp-1211-3B", + "name": "Gladiator-Mini-Exp-1211-3B", + "developer": "MultivexAI", + "scores": { + "IFEval": 0.6876, + "BBH": 0.4484, + "MATH Level 5": 0.1375, + "GPQA": 0.2727, + "MUSR": 0.326, + "MMLU-PRO": 0.3152 + } + }, + { + "model_id": "MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct", + "name": "Gladiator-Mini-Exp-1221-3B-Instruct", + "developer": "MultivexAI", + "scores": { + "IFEval": 0.6079, + "BBH": 0.437, + "MATH Level 5": 0.1352, + "GPQA": 0.2634, + "MUSR": 0.3115, + "MMLU-PRO": 0.3049 + } + }, + { + "model_id": "MultivexAI/Gladiator-Mini-Exp-1221-3B-Instruct-V2", + "name": "Gladiator-Mini-Exp-1221-3B-Instruct-V2", + "developer": "MultivexAI", + "scores": { + "IFEval": 0.6215, + "BBH": 0.4389, + "MATH Level 5": 0.1412, + "GPQA": 0.2634, + "MUSR": 0.3008, + "MMLU-PRO": 0.3025 + } + }, + { + "model_id": "MultivexAI/Gladiator-Mini-Exp-1222-3B-Instruct", + "name": "Gladiator-Mini-Exp-1222-3B-Instruct", + "developer": "MultivexAI", + "scores": { + "IFEval": 0.6163, + "BBH": 0.4373, + "MATH Level 5": 0.1412, + "GPQA": 0.2634, + "MUSR": 0.3128, + "MMLU-PRO": 0.3017 + } + }, + { + "model_id": "MultivexAI/Phi-3.5-Mini-Instruct-MultiVex-v0.25-GGUF", + "name": "Phi-3.5-Mini-Instruct-MultiVex-v0.25-GGUF", + "developer": "MultivexAI", + "scores": { + "IFEval": 0.144, + "BBH": 0.2908, + "MATH Level 5": 0.006, + "GPQA": 0.255, + "MUSR": 0.3642, + "MMLU-PRO": 0.1109 + } + }, + { + "model_id": "Mxode/NanoLM-0.3B-Instruct-v1", + "name": "NanoLM-0.3B-Instruct-v1", + "developer": "Mxode", + "scores": { + "IFEval": 0.1537, + "BBH": 0.3028, + "MATH Level 5": 0.0144, + "GPQA": 0.2718, + "MUSR": 0.4155, + "MMLU-PRO": 0.1105 + } + }, + { + "model_id": "Mxode/NanoLM-0.3B-Instruct-v1.1", + "name": "NanoLM-0.3B-Instruct-v1.1", + "developer": "Mxode", + "scores": { + "IFEval": 0.1783, + "BBH": 0.3014, + "MATH Level 5": 0.0136, + "GPQA": 0.25, + "MUSR": 0.4273, + "MMLU-PRO": 0.1121 + } + }, + { + "model_id": "Mxode/NanoLM-0.3B-Instruct-v2", + "name": "NanoLM-0.3B-Instruct-v2", + "developer": "Mxode", + "scores": { + "IFEval": 0.1668, + "BBH": 0.2921, + "MATH Level 5": 0.0068, + "GPQA": 0.2609, + "MUSR": 0.3955, + "MMLU-PRO": 0.1134 + } + }, + { + "model_id": "Mxode/NanoLM-1B-Instruct-v1.1", + "name": "NanoLM-1B-Instruct-v1.1", + "developer": "Mxode", + "scores": { + "IFEval": 0.2395, + "BBH": 0.3184, + "MATH Level 5": 0.0363, + "GPQA": 0.2634, + "MUSR": 0.3433, + "MMLU-PRO": 0.1215 + } + }, + { + "model_id": "Mxode/NanoLM-1B-Instruct-v2", + "name": "NanoLM-1B-Instruct-v2", + "developer": "Mxode", + "scores": { + "IFEval": 0.263, + "BBH": 0.3123, + "MATH Level 5": 0.0415, + "GPQA": 0.2634, + "MUSR": 0.3552, + "MMLU-PRO": 0.1238 + } + }, + { + "model_id": "NAPS-ai/naps-gemma-2-27b-v-0.1.0", + "name": "naps-gemma-2-27b-v-0.1.0", + "developer": "NAPS-ai", + "scores": { + "IFEval": 0.0, + "BBH": 0.2912, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3575, + "MMLU-PRO": 0.1168 + } + }, + { + "model_id": "NAPS-ai/naps-gemma-2-27b-v0.1.0", + "name": "naps-gemma-2-27b-v0.1.0", + "developer": "NAPS-ai", + "scores": { + "IFEval": 0.0, + "BBH": 0.2912, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3575, + "MMLU-PRO": 0.1168 + } + }, + { + "model_id": "NAPS-ai/naps-llama-3_1-8b-instruct-v0.3", + "name": "naps-llama-3_1-8b-instruct-v0.3", + "developer": "NAPS-ai", + "scores": { + "IFEval": 0.5391, + "BBH": 0.4901, + "MATH Level 5": 0.1903, + "GPQA": 0.2995, + "MUSR": 0.3787, + "MMLU-PRO": 0.3398 + } + }, + { + "model_id": "NAPS-ai/naps-llama-3_1-8b-instruct-v0.4", + "name": "naps-llama-3_1-8b-instruct-v0.4", + "developer": "NAPS-ai", + "scores": { + "IFEval": 0.7344, + "BBH": 0.4862, + "MATH Level 5": 0.1964, + "GPQA": 0.2794, + "MUSR": 0.4421, + "MMLU-PRO": 0.3475 + } + }, + { + "model_id": "NAPS-ai/naps-llama-3_1-instruct-v0.5.0", + "name": "naps-llama-3_1-instruct-v0.5.0", + "developer": "NAPS-ai", + "scores": { + "IFEval": 0.502, + "BBH": 0.4148, + "MATH Level 5": 0.0363, + "GPQA": 0.2685, + "MUSR": 0.3713, + "MMLU-PRO": 0.2614 + } + }, + { + "model_id": "NAPS-ai/naps-llama-3_1_instruct-v0.6.0", + "name": "naps-llama-3_1_instruct-v0.6.0", + "developer": "NAPS-ai", + "scores": { + "IFEval": 0.328, + "BBH": 0.4528, + "MATH Level 5": 0.0642, + "GPQA": 0.2819, + "MUSR": 0.3739, + "MMLU-PRO": 0.3241 + } + }, + { + "model_id": "NAPS-ai/naps-llama3.1-70B-v0.2-fp16", + "name": "naps-llama3.1-70B-v0.2-fp16", + "developer": "NAPS-ai", + "scores": { + "IFEval": 0.1845, + "BBH": 0.3041, + "MATH Level 5": 0.0, + "GPQA": 0.2391, + "MUSR": 0.3486, + "MMLU-PRO": 0.1099 + } + }, + { + "model_id": "NCSOFT/Llama-VARCO-8B-Instruct", + "name": "Llama-VARCO-8B-Instruct", + "developer": "NCSOFT", + "scores": { + "IFEval": 0.447, + "BBH": 0.5023, + "MATH Level 5": 0.1065, + "GPQA": 0.297, + "MUSR": 0.3841, + "MMLU-PRO": 0.319 + } + }, + { + "model_id": "NJS26/NJS_777", + "name": "NJS_777", + "developer": "NJS26", + "scores": { + "IFEval": 0.1881, + "BBH": 0.2178, + "MATH Level 5": 0.0, + "GPQA": 0.2064, + "MUSR": 0.3538, + "MMLU-PRO": 0.1163 + } + }, + { + "model_id": "NLPark/AnFeng_v3.1-Avocet", + "name": "AnFeng_v3.1-Avocet", + "developer": "NLPark", + "scores": { + "IFEval": 0.5096, + "BBH": 0.5829, + "MATH Level 5": 0.1594, + "GPQA": 0.3247, + "MUSR": 0.4476, + "MMLU-PRO": 0.4438 + } + }, + { + "model_id": "NLPark/B-and-W_Flycatcher-3AD1E", + "name": "B-and-W_Flycatcher-3AD1E", + "developer": "NLPark", + "scores": { + "IFEval": 0.4908, + "BBH": 0.6065, + "MATH Level 5": 0.2379, + "GPQA": 0.3305, + "MUSR": 0.4423, + "MMLU-PRO": 0.4741 + } + }, + { + "model_id": "NLPark/Shi-Ci-Robin-Test_3AD80", + "name": "Shi-Ci-Robin-Test_3AD80", + "developer": "NLPark", + "scores": { + "IFEval": 0.7227, + "BBH": 0.6705, + "MATH Level 5": 0.3157, + "GPQA": 0.3599, + "MUSR": 0.4696, + "MMLU-PRO": 0.5121 + } + }, + { + "model_id": "NTQAI/NxMobileLM-1.5B-SFT", + "name": "NxMobileLM-1.5B-SFT", + "developer": "NTQAI", + "scores": { + "IFEval": 0.6392, + "BBH": 0.3957, + "MATH Level 5": 0.0846, + "GPQA": 0.2592, + "MUSR": 0.3555, + "MMLU-PRO": 0.2817 + } + }, + { + "model_id": "NTQAI/Nxcode-CQ-7B-orpo", + "name": "Nxcode-CQ-7B-orpo", + "developer": "NTQAI", + "scores": { + "IFEval": 0.4007, + "BBH": 0.4143, + "MATH Level 5": 0.0219, + "GPQA": 0.2542, + "MUSR": 0.394, + "MMLU-PRO": 0.1612 + } + }, + { + "model_id": "NYTK/PULI-GPTrio", + "name": "PULI-GPTrio", + "developer": "NYTK", + "scores": { + "IFEval": 0.218, + "BBH": 0.306, + "MATH Level 5": 0.0121, + "GPQA": 0.2659, + "MUSR": 0.3819, + "MMLU-PRO": 0.1137 + } + }, + { + "model_id": "NYTK/PULI-LlumiX-32K", + "name": "PULI-LlumiX-32K", + "developer": "NYTK", + "scores": { + "IFEval": 0.17, + "BBH": 0.3189, + "MATH Level 5": 0.0128, + "GPQA": 0.2534, + "MUSR": 0.3964, + "MMLU-PRO": 0.1681 + } + }, + { + "model_id": "Naveenpoliasetty/llama3-8B-V2", + "name": "llama3-8B-V2", + "developer": "Naveenpoliasetty", + "scores": { + "IFEval": 0.4123, + "BBH": 0.5189, + "MATH Level 5": 0.0785, + "GPQA": 0.2903, + "MUSR": 0.4081, + "MMLU-PRO": 0.3738 + } + }, + { + "model_id": "NbAiLab/nb-llama-3.1-8B-Instruct", + "name": "nb-llama-3.1-8B-Instruct", + "developer": "NbAiLab", + "scores": { + "IFEval": 0.3625, + "BBH": 0.3247, + "MATH Level 5": 0.0227, + "GPQA": 0.2735, + "MUSR": 0.3208, + "MMLU-PRO": 0.1197 + } + }, + { + "model_id": "NbAiLab/nb-llama-3.1-8B-sft", + "name": "nb-llama-3.1-8B-sft", + "developer": "NbAiLab", + "scores": { + "IFEval": 0.3616, + "BBH": 0.3282, + "MATH Level 5": 0.0219, + "GPQA": 0.2542, + "MUSR": 0.3287, + "MMLU-PRO": 0.1222 + } + }, + { + "model_id": "Nekochu/Llama-3.1-8B-German-ORPO", + "name": "Llama-3.1-8B-German-ORPO", + "developer": "Nekochu", + "scores": { + "IFEval": 0.4611, + "BBH": 0.4983, + "MATH Level 5": 0.1171, + "GPQA": 0.3163, + "MUSR": 0.4647, + "MMLU-PRO": 0.3393 + } + }, + { + "model_id": "Nekochu/Llama-3.1-8B-french-DPO", + "name": "Llama-3.1-8B-french-DPO", + "developer": "Nekochu", + "scores": { + "IFEval": 0.4656, + "BBH": 0.5111, + "MATH Level 5": 0.0974, + "GPQA": 0.2911, + "MUSR": 0.4216, + "MMLU-PRO": 0.3414 + } + }, + { + "model_id": "Nekochu/Luminia-13B-v3", + "name": "Luminia-13B-v3", + "developer": "Nekochu", + "scores": { + "IFEval": 0.2523, + "BBH": 0.4112, + "MATH Level 5": 0.0181, + "GPQA": 0.2701, + "MUSR": 0.3983, + "MMLU-PRO": 0.2215 + } + }, + { + "model_id": "Nekochu/Luminia-8B-RP", + "name": "Luminia-8B-RP", + "developer": "Nekochu", + "scores": { + "IFEval": 0.5574, + "BBH": 0.5218, + "MATH Level 5": 0.136, + "GPQA": 0.297, + "MUSR": 0.3998, + "MMLU-PRO": 0.3631 + } + }, + { + "model_id": "NeverSleep/Lumimaid-v0.2-12B", + "name": "Lumimaid-v0.2-12B", + "developer": "NeverSleep", + "scores": { + "IFEval": 0.1099, + "BBH": 0.5396, + "MATH Level 5": 0.0566, + "GPQA": 0.3146, + "MUSR": 0.4821, + "MMLU-PRO": 0.3511 + } + }, + { + "model_id": "NeverSleep/Lumimaid-v0.2-8B", + "name": "Lumimaid-v0.2-8B", + "developer": "NeverSleep", + "scores": { + "IFEval": 0.5038, + "BBH": 0.5238, + "MATH Level 5": 0.1435, + "GPQA": 0.3112, + "MUSR": 0.4303, + "MMLU-PRO": 0.3636 + } + }, + { + "model_id": "Nexesenex/Dolphin3.0-Llama3.1-1B-abliterated", + "name": "Dolphin3.0-Llama3.1-1B-abliterated", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5312, + "BBH": 0.3241, + "MATH Level 5": 0.0385, + "GPQA": 0.2408, + "MUSR": 0.3237, + "MMLU-PRO": 0.1373 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DeepDive_3_Prev_v1.0", + "name": "Llama_3.1_8b_DeepDive_3_Prev_v1.0", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.6809, + "BBH": 0.5155, + "MATH Level 5": 0.1866, + "GPQA": 0.2911, + "MUSR": 0.3666, + "MMLU-PRO": 0.3438 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DeepDive_3_R1_Prev_v1.0", + "name": "Llama_3.1_8b_DeepDive_3_R1_Prev_v1.0", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7101, + "BBH": 0.512, + "MATH Level 5": 0.1926, + "GPQA": 0.3003, + "MUSR": 0.3758, + "MMLU-PRO": 0.3441 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DobHerWild_R1_v1.1R", + "name": "Llama_3.1_8b_DobHerWild_R1_v1.1R", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.76, + "BBH": 0.5257, + "MATH Level 5": 0.2319, + "GPQA": 0.2995, + "MUSR": 0.3852, + "MMLU-PRO": 0.3688 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DoberWild_v2.01", + "name": "Llama_3.1_8b_DoberWild_v2.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7996, + "BBH": 0.5251, + "MATH Level 5": 0.2002, + "GPQA": 0.3029, + "MUSR": 0.4012, + "MMLU-PRO": 0.3791 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DoberWild_v2.02", + "name": "Llama_3.1_8b_DoberWild_v2.02", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7746, + "BBH": 0.5313, + "MATH Level 5": 0.1994, + "GPQA": 0.2945, + "MUSR": 0.3946, + "MMLU-PRO": 0.3764 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DoberWild_v2.03", + "name": "Llama_3.1_8b_DoberWild_v2.03", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7764, + "BBH": 0.5294, + "MATH Level 5": 0.2077, + "GPQA": 0.3045, + "MUSR": 0.3906, + "MMLU-PRO": 0.3722 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DodoWild_v2.01", + "name": "Llama_3.1_8b_DodoWild_v2.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7978, + "BBH": 0.5253, + "MATH Level 5": 0.1986, + "GPQA": 0.3037, + "MUSR": 0.409, + "MMLU-PRO": 0.3738 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DodoWild_v2.02", + "name": "Llama_3.1_8b_DodoWild_v2.02", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.8017, + "BBH": 0.5262, + "MATH Level 5": 0.2273, + "GPQA": 0.3045, + "MUSR": 0.3971, + "MMLU-PRO": 0.3761 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DodoWild_v2.03", + "name": "Llama_3.1_8b_DodoWild_v2.03", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7941, + "BBH": 0.5308, + "MATH Level 5": 0.2221, + "GPQA": 0.3079, + "MUSR": 0.3959, + "MMLU-PRO": 0.3786 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_DodoWild_v2.10", + "name": "Llama_3.1_8b_DodoWild_v2.10", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.8054, + "BBH": 0.5278, + "MATH Level 5": 0.1971, + "GPQA": 0.2961, + "MUSR": 0.4157, + "MMLU-PRO": 0.3855 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Dolermed_R1_V1.01", + "name": "Llama_3.1_8b_Dolermed_R1_V1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7534, + "BBH": 0.5312, + "MATH Level 5": 0.2017, + "GPQA": 0.3054, + "MUSR": 0.3747, + "MMLU-PRO": 0.3733 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Dolermed_R1_V1.03", + "name": "Llama_3.1_8b_Dolermed_R1_V1.03", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7564, + "BBH": 0.5316, + "MATH Level 5": 0.2092, + "GPQA": 0.318, + "MUSR": 0.38, + "MMLU-PRO": 0.372 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Dolermed_V1.01", + "name": "Llama_3.1_8b_Dolermed_V1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5087, + "BBH": 0.5194, + "MATH Level 5": 0.1344, + "GPQA": 0.2945, + "MUSR": 0.3945, + "MMLU-PRO": 0.357 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Dolerstormed_V1.04", + "name": "Llama_3.1_8b_Dolerstormed_V1.04", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7889, + "BBH": 0.5195, + "MATH Level 5": 0.1926, + "GPQA": 0.3221, + "MUSR": 0.403, + "MMLU-PRO": 0.3889 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Hermedash_R1_V1.04", + "name": "Llama_3.1_8b_Hermedash_R1_V1.04", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7872, + "BBH": 0.5192, + "MATH Level 5": 0.1866, + "GPQA": 0.323, + "MUSR": 0.4111, + "MMLU-PRO": 0.3882 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Hermedive_R1_V1.01", + "name": "Llama_3.1_8b_Hermedive_R1_V1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5001, + "BBH": 0.5171, + "MATH Level 5": 0.1775, + "GPQA": 0.2827, + "MUSR": 0.4008, + "MMLU-PRO": 0.3427 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Hermedive_R1_V1.03", + "name": "Llama_3.1_8b_Hermedive_R1_V1.03", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.6648, + "BBH": 0.5141, + "MATH Level 5": 0.1858, + "GPQA": 0.2978, + "MUSR": 0.3613, + "MMLU-PRO": 0.3488 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Hermedive_V1.01", + "name": "Llama_3.1_8b_Hermedive_V1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5062, + "BBH": 0.4918, + "MATH Level 5": 0.1647, + "GPQA": 0.2894, + "MUSR": 0.3697, + "MMLU-PRO": 0.3551 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Mediver_V1.01", + "name": "Llama_3.1_8b_Mediver_V1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.1885, + "BBH": 0.4415, + "MATH Level 5": 0.0015, + "GPQA": 0.2777, + "MUSR": 0.3898, + "MMLU-PRO": 0.2994 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Medusa_v1.01", + "name": "Llama_3.1_8b_Medusa_v1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7685, + "BBH": 0.5018, + "MATH Level 5": 0.1465, + "GPQA": 0.2919, + "MUSR": 0.4067, + "MMLU-PRO": 0.3531 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Smarteaz_0.2_R1", + "name": "Llama_3.1_8b_Smarteaz_0.2_R1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.6346, + "BBH": 0.5113, + "MATH Level 5": 0.2606, + "GPQA": 0.3003, + "MUSR": 0.4188, + "MMLU-PRO": 0.3645 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Smarteaz_V1.01", + "name": "Llama_3.1_8b_Smarteaz_V1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.8151, + "BBH": 0.5241, + "MATH Level 5": 0.2341, + "GPQA": 0.3096, + "MUSR": 0.3789, + "MMLU-PRO": 0.3736 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Stormeder_v1.04", + "name": "Llama_3.1_8b_Stormeder_v1.04", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.7853, + "BBH": 0.5207, + "MATH Level 5": 0.185, + "GPQA": 0.3205, + "MUSR": 0.3949, + "MMLU-PRO": 0.3852 + } + }, + { + "model_id": "Nexesenex/Llama_3.1_8b_Typhoon_v1.03", + "name": "Llama_3.1_8b_Typhoon_v1.03", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.8078, + "BBH": 0.5314, + "MATH Level 5": 0.2273, + "GPQA": 0.307, + "MUSR": 0.3815, + "MMLU-PRO": 0.3842 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_AquaSyn_0.1", + "name": "Llama_3.2_1b_AquaSyn_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.2741, + "BBH": 0.3284, + "MATH Level 5": 0.0219, + "GPQA": 0.2483, + "MUSR": 0.346, + "MMLU-PRO": 0.1378 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_AquaSyn_0.11", + "name": "Llama_3.2_1b_AquaSyn_0.11", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.2431, + "BBH": 0.3112, + "MATH Level 5": 0.0234, + "GPQA": 0.2651, + "MUSR": 0.3368, + "MMLU-PRO": 0.1116 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_Dolto_0.1", + "name": "Llama_3.2_1b_Dolto_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5434, + "BBH": 0.335, + "MATH Level 5": 0.037, + "GPQA": 0.2374, + "MUSR": 0.3421, + "MMLU-PRO": 0.1364 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_Odyssea_V1", + "name": "Llama_3.2_1b_Odyssea_V1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.2553, + "BBH": 0.301, + "MATH Level 5": 0.0144, + "GPQA": 0.2584, + "MUSR": 0.3394, + "MMLU-PRO": 0.1153 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_Odyssea_V1.01", + "name": "Llama_3.2_1b_Odyssea_V1.01", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.2495, + "BBH": 0.3045, + "MATH Level 5": 0.0174, + "GPQA": 0.2559, + "MUSR": 0.342, + "MMLU-PRO": 0.1152 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_OpenTree_R1_0.1", + "name": "Llama_3.2_1b_OpenTree_R1_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5366, + "BBH": 0.328, + "MATH Level 5": 0.0476, + "GPQA": 0.2525, + "MUSR": 0.3131, + "MMLU-PRO": 0.1675 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_OrcaSun_V1", + "name": "Llama_3.2_1b_OrcaSun_V1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5949, + "BBH": 0.355, + "MATH Level 5": 0.0597, + "GPQA": 0.2366, + "MUSR": 0.338, + "MMLU-PRO": 0.1904 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_RandomLego_RP_R1_0.1", + "name": "Llama_3.2_1b_RandomLego_RP_R1_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5543, + "BBH": 0.3428, + "MATH Level 5": 0.0566, + "GPQA": 0.25, + "MUSR": 0.3249, + "MMLU-PRO": 0.1563 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_SunOrca_V1", + "name": "Llama_3.2_1b_SunOrca_V1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.543, + "BBH": 0.3431, + "MATH Level 5": 0.0672, + "GPQA": 0.2743, + "MUSR": 0.3262, + "MMLU-PRO": 0.1884 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_Sydonia_0.1", + "name": "Llama_3.2_1b_Sydonia_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.2197, + "BBH": 0.3121, + "MATH Level 5": 0.0204, + "GPQA": 0.2282, + "MUSR": 0.3382, + "MMLU-PRO": 0.1224 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_Syneridol_0.2", + "name": "Llama_3.2_1b_Syneridol_0.2", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.2157, + "BBH": 0.3139, + "MATH Level 5": 0.0219, + "GPQA": 0.2349, + "MUSR": 0.3343, + "MMLU-PRO": 0.1227 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_Synopsys_0.1", + "name": "Llama_3.2_1b_Synopsys_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.1764, + "BBH": 0.3162, + "MATH Level 5": 0.0166, + "GPQA": 0.2391, + "MUSR": 0.3461, + "MMLU-PRO": 0.1231 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_1b_Synopsys_0.11", + "name": "Llama_3.2_1b_Synopsys_0.11", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.2842, + "BBH": 0.3102, + "MATH Level 5": 0.0128, + "GPQA": 0.2626, + "MUSR": 0.3513, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_3b_Kermes_v1", + "name": "Llama_3.2_3b_Kermes_v1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.4852, + "BBH": 0.441, + "MATH Level 5": 0.031, + "GPQA": 0.2735, + "MUSR": 0.407, + "MMLU-PRO": 0.2547 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_3b_Kermes_v2", + "name": "Llama_3.2_3b_Kermes_v2", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5754, + "BBH": 0.4455, + "MATH Level 5": 0.0544, + "GPQA": 0.2651, + "MUSR": 0.3778, + "MMLU-PRO": 0.2734 + } + }, + { + "model_id": "Nexesenex/Llama_3.2_3b_Kermes_v2.1", + "name": "Llama_3.2_3b_Kermes_v2.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.5584, + "BBH": 0.4464, + "MATH Level 5": 0.0521, + "GPQA": 0.2794, + "MUSR": 0.3964, + "MMLU-PRO": 0.2692 + } + }, + { + "model_id": "Nexesenex/Nemotron_W_4b_Halo_0.1", + "name": "Nemotron_W_4b_Halo_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.3627, + "BBH": 0.4135, + "MATH Level 5": 0.0423, + "GPQA": 0.2802, + "MUSR": 0.4165, + "MMLU-PRO": 0.2505 + } + }, + { + "model_id": "Nexesenex/Nemotron_W_4b_MagLight_0.1", + "name": "Nemotron_W_4b_MagLight_0.1", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.423, + "BBH": 0.4231, + "MATH Level 5": 0.04, + "GPQA": 0.2836, + "MUSR": 0.4112, + "MMLU-PRO": 0.2545 + } + }, + { + "model_id": "Nexesenex/Qwen_2.5_3b_Smarteaz_0.01a", + "name": "Qwen_2.5_3b_Smarteaz_0.01a", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.4012, + "BBH": 0.4637, + "MATH Level 5": 0.1805, + "GPQA": 0.2777, + "MUSR": 0.432, + "MMLU-PRO": 0.286 + } + }, + { + "model_id": "Nexesenex/pankajmathur_orca_mini_v9_6_1B-instruct-Abliterated-LPL", + "name": "pankajmathur_orca_mini_v9_6_1B-instruct-Abliterated-LPL", + "developer": "Nexesenex", + "scores": { + "IFEval": 0.589, + "BBH": 0.3562, + "MATH Level 5": 0.0748, + "GPQA": 0.2668, + "MUSR": 0.3396, + "MMLU-PRO": 0.1803 + } + }, + { + "model_id": "Nexusflow/NexusRaven-V2-13B", + "name": "NexusRaven-V2-13B", + "developer": "Nexusflow", + "scores": { + "IFEval": 0.1791, + "BBH": 0.3949, + "MATH Level 5": 0.0295, + "GPQA": 0.2601, + "MUSR": 0.3737, + "MMLU-PRO": 0.1872 + } + }, + { + "model_id": "NikolaSigmoid/AceMath-1.5B-Instruct-1epoch", + "name": "AceMath-1.5B-Instruct-1epoch", + "developer": "NikolaSigmoid", + "scores": { + "IFEval": 0.2849, + "BBH": 0.4263, + "MATH Level 5": 0.3051, + "GPQA": 0.2777, + "MUSR": 0.3925, + "MMLU-PRO": 0.2376 + } + }, + { + "model_id": "NikolaSigmoid/AceMath-1.5B-Instruct-dolphin-r1-200", + "name": "AceMath-1.5B-Instruct-dolphin-r1-200", + "developer": "NikolaSigmoid", + "scores": { + "IFEval": 0.1808, + "BBH": 0.2815, + "MATH Level 5": 0.0, + "GPQA": 0.2559, + "MUSR": 0.375, + "MMLU-PRO": 0.1143 + } + }, + { + "model_id": "NikolaSigmoid/DeepSeek-R1-Distill-Qwen-1.5B-500", + "name": "DeepSeek-R1-Distill-Qwen-1.5B-500", + "developer": "NikolaSigmoid", + "scores": { + "IFEval": 0.1749, + "BBH": 0.2602, + "MATH Level 5": 0.0, + "GPQA": 0.2458, + "MUSR": 0.338, + "MMLU-PRO": 0.1125 + } + }, + { + "model_id": "NikolaSigmoid/acemath-200", + "name": "acemath-200", + "developer": "NikolaSigmoid", + "scores": { + "IFEval": 0.2849, + "BBH": 0.4263, + "MATH Level 5": 0.3051, + "GPQA": 0.2777, + "MUSR": 0.3925, + "MMLU-PRO": 0.2376 + } + }, + { + "model_id": "NikolaSigmoid/phi-4-14b", + "name": "phi-4-14b", + "developer": "NikolaSigmoid", + "scores": { + "IFEval": 0.0561, + "BBH": 0.6695, + "MATH Level 5": 0.2938, + "GPQA": 0.4035, + "MUSR": 0.5047, + "MMLU-PRO": 0.5278 + } + }, + { + "model_id": "NikolaSigmoid/phi-4-1steps", + "name": "phi-4-1steps", + "developer": "NikolaSigmoid", + "scores": { + "IFEval": 0.0528, + "BBH": 0.6707, + "MATH Level 5": 0.2983, + "GPQA": 0.4018, + "MUSR": 0.5021, + "MMLU-PRO": 0.5273 + } + }, + { + "model_id": "NikolaSigmoid/phi-4-300steps", + "name": "phi-4-300steps", + "developer": "NikolaSigmoid", + "scores": { + "IFEval": 0.0561, + "BBH": 0.6701, + "MATH Level 5": 0.2946, + "GPQA": 0.4052, + "MUSR": 0.5034, + "MMLU-PRO": 0.5288 + } + }, + { + "model_id": "Nitral-AI/Captain-Eris-BMO_Violent-GRPO-v0.420", + "name": "Captain-Eris-BMO_Violent-GRPO-v0.420", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.6313, + "BBH": 0.5079, + "MATH Level 5": 0.1314, + "GPQA": 0.3096, + "MUSR": 0.4228, + "MMLU-PRO": 0.3596 + } + }, + { + "model_id": "Nitral-AI/Captain-Eris_BMO-Violent-12B", + "name": "Captain-Eris_BMO-Violent-12B", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.6152, + "BBH": 0.5104, + "MATH Level 5": 0.1367, + "GPQA": 0.3096, + "MUSR": 0.4255, + "MMLU-PRO": 0.3571 + } + }, + { + "model_id": "Nitral-AI/Captain-Eris_Violet-GRPO-v0.420", + "name": "Captain-Eris_Violet-GRPO-v0.420", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.6262, + "BBH": 0.5159, + "MATH Level 5": 0.108, + "GPQA": 0.2987, + "MUSR": 0.4279, + "MMLU-PRO": 0.3535 + } + }, + { + "model_id": "Nitral-AI/Captain-Eris_Violet-V0.420-12B", + "name": "Captain-Eris_Violet-V0.420-12B", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.4339, + "BBH": 0.5478, + "MATH Level 5": 0.1073, + "GPQA": 0.3112, + "MUSR": 0.4331, + "MMLU-PRO": 0.3723 + } + }, + { + "model_id": "Nitral-AI/Captain_BMO-12B", + "name": "Captain_BMO-12B", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.4751, + "BBH": 0.5286, + "MATH Level 5": 0.1397, + "GPQA": 0.3196, + "MUSR": 0.3748, + "MMLU-PRO": 0.3569 + } + }, + { + "model_id": "Nitral-AI/Hathor_Stable-v0.2-L3-8B", + "name": "Hathor_Stable-v0.2-L3-8B", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.7175, + "BBH": 0.5286, + "MATH Level 5": 0.105, + "GPQA": 0.2869, + "MUSR": 0.3781, + "MMLU-PRO": 0.3696 + } + }, + { + "model_id": "Nitral-AI/Hathor_Tahsin-L3-8B-v0.85", + "name": "Hathor_Tahsin-L3-8B-v0.85", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.711, + "BBH": 0.5279, + "MATH Level 5": 0.1005, + "GPQA": 0.2852, + "MUSR": 0.3647, + "MMLU-PRO": 0.372 + } + }, + { + "model_id": "Nitral-AI/Nera_Noctis-12B", + "name": "Nera_Noctis-12B", + "developer": "Nitral-AI", + "scores": { + "IFEval": 0.4562, + "BBH": 0.5194, + "MATH Level 5": 0.0876, + "GPQA": 0.2634, + "MUSR": 0.3979, + "MMLU-PRO": 0.3468 + } + }, + { + "model_id": "Nohobby/MS-Schisandra-22B-v0.1", + "name": "MS-Schisandra-22B-v0.1", + "developer": "Nohobby", + "scores": { + "IFEval": 0.6331, + "BBH": 0.579, + "MATH Level 5": 0.2228, + "GPQA": 0.3322, + "MUSR": 0.3928, + "MMLU-PRO": 0.4096 + } + }, + { + "model_id": "Nohobby/MS-Schisandra-22B-v0.2", + "name": "MS-Schisandra-22B-v0.2", + "developer": "Nohobby", + "scores": { + "IFEval": 0.6383, + "BBH": 0.5841, + "MATH Level 5": 0.2032, + "GPQA": 0.3356, + "MUSR": 0.4075, + "MMLU-PRO": 0.4136 + } + }, + { + "model_id": "Norquinal/Alpha", + "name": "Alpha", + "developer": "Norquinal", + "scores": { + "IFEval": 0.2803, + "BBH": 0.3374, + "MATH Level 5": 0.0574, + "GPQA": 0.2651, + "MUSR": 0.3631, + "MMLU-PRO": 0.3003 + } + }, + { + "model_id": "Norquinal/Bravo", + "name": "Bravo", + "developer": "Norquinal", + "scores": { + "IFEval": 0.3025, + "BBH": 0.3558, + "MATH Level 5": 0.0574, + "GPQA": 0.2819, + "MUSR": 0.3869, + "MMLU-PRO": 0.3127 + } + }, + { + "model_id": "Norquinal/Charlie", + "name": "Charlie", + "developer": "Norquinal", + "scores": { + "IFEval": 0.3061, + "BBH": 0.3515, + "MATH Level 5": 0.0582, + "GPQA": 0.271, + "MUSR": 0.3737, + "MMLU-PRO": 0.3093 + } + }, + { + "model_id": "Norquinal/Delta", + "name": "Delta", + "developer": "Norquinal", + "scores": { + "IFEval": 0.2538, + "BBH": 0.3435, + "MATH Level 5": 0.0612, + "GPQA": 0.2609, + "MUSR": 0.3777, + "MMLU-PRO": 0.2959 + } + }, + { + "model_id": "Norquinal/Echo", + "name": "Echo", + "developer": "Norquinal", + "scores": { + "IFEval": 0.3158, + "BBH": 0.353, + "MATH Level 5": 0.0574, + "GPQA": 0.2794, + "MUSR": 0.3804, + "MMLU-PRO": 0.3095 + } + }, + { + "model_id": "Norquinal/Foxtrot", + "name": "Foxtrot", + "developer": "Norquinal", + "scores": { + "IFEval": 0.3012, + "BBH": 0.3558, + "MATH Level 5": 0.0582, + "GPQA": 0.2869, + "MUSR": 0.3804, + "MMLU-PRO": 0.305 + } + }, + { + "model_id": "Norquinal/Golf", + "name": "Golf", + "developer": "Norquinal", + "scores": { + "IFEval": 0.3534, + "BBH": 0.3533, + "MATH Level 5": 0.0536, + "GPQA": 0.2903, + "MUSR": 0.338, + "MMLU-PRO": 0.3056 + } + }, + { + "model_id": "Norquinal/Hotel", + "name": "Hotel", + "developer": "Norquinal", + "scores": { + "IFEval": 0.3215, + "BBH": 0.3679, + "MATH Level 5": 0.0529, + "GPQA": 0.2794, + "MUSR": 0.3288, + "MMLU-PRO": 0.3157 + } + }, + { + "model_id": "NotASI/FineTome-Llama3.2-1B-0929", + "name": "FineTome-Llama3.2-1B-0929", + "developer": "NotASI", + "scores": { + "IFEval": 0.3991, + "BBH": 0.3246, + "MATH Level 5": 0.0363, + "GPQA": 0.2727, + "MUSR": 0.3488, + "MMLU-PRO": 0.1429 + } + }, + { + "model_id": "NotASI/FineTome-Llama3.2-3B-1002", + "name": "FineTome-Llama3.2-3B-1002", + "developer": "NotASI", + "scores": { + "IFEval": 0.5474, + "BBH": 0.4319, + "MATH Level 5": 0.0627, + "GPQA": 0.2508, + "MUSR": 0.3685, + "MMLU-PRO": 0.2437 + } + }, + { + "model_id": "NotASI/FineTome-v1.5-Llama3.2-1B-1007", + "name": "FineTome-v1.5-Llama3.2-1B-1007", + "developer": "NotASI", + "scores": { + "IFEval": 0.3924, + "BBH": 0.3241, + "MATH Level 5": 0.0317, + "GPQA": 0.25, + "MUSR": 0.3475, + "MMLU-PRO": 0.1427 + } + }, + { + "model_id": "NotASI/FineTome-v1.5-Llama3.2-3B-1007", + "name": "FineTome-v1.5-Llama3.2-3B-1007", + "developer": "NotASI", + "scores": { + "IFEval": 0.5508, + "BBH": 0.4312, + "MATH Level 5": 0.0642, + "GPQA": 0.2617, + "MUSR": 0.3645, + "MMLU-PRO": 0.2448 + } + }, + { + "model_id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", + "name": "DeepHermes-3-Mistral-24B-Preview", + "developer": "NousResearch", + "scores": { + "IFEval": 0.4536, + "BBH": 0.6488, + "MATH Level 5": 0.2576, + "GPQA": 0.37, + "MUSR": 0.4503, + "MMLU-PRO": 0.459 + } + }, + { + "model_id": "NousResearch/Hermes-2-Pro-Llama-3-8B", + "name": "Hermes-2-Pro-Llama-3-8B", + "developer": "NousResearch", + "scores": { + "IFEval": 0.5362, + "BBH": 0.5071, + "MATH Level 5": 0.0838, + "GPQA": 0.2928, + "MUSR": 0.4262, + "MMLU-PRO": 0.3052 + } + }, + { + "model_id": "NousResearch/Hermes-2-Pro-Mistral-7B", + "name": "Hermes-2-Pro-Mistral-7B", + "developer": "NousResearch", + "scores": { + "IFEval": 0.5668, + "BBH": 0.4995, + "MATH Level 5": 0.0604, + "GPQA": 0.2735, + "MUSR": 0.4376, + "MMLU-PRO": 0.2946 + } + }, + { + "model_id": "NousResearch/Hermes-2-Theta-Llama-3-8B", + "name": "Hermes-2-Theta-Llama-3-8B", + "developer": "NousResearch", + "scores": { + "IFEval": 0.6518, + "BBH": 0.5207, + "MATH Level 5": 0.0967, + "GPQA": 0.3037, + "MUSR": 0.3949, + "MMLU-PRO": 0.3369 + } + }, + { + "model_id": "NousResearch/Hermes-3-Llama-3.1-70B", + "name": "Hermes-3-Llama-3.1-70B", + "developer": "NousResearch", + "scores": { + "IFEval": 0.7661, + "BBH": 0.6756, + "MATH Level 5": 0.21, + "GPQA": 0.3616, + "MUSR": 0.4949, + "MMLU-PRO": 0.4727 + } + }, + { + "model_id": "NousResearch/Hermes-3-Llama-3.1-8B", + "name": "Hermes-3-Llama-3.1-8B", + "developer": "NousResearch", + "scores": { + "IFEval": 0.617, + "BBH": 0.5177, + "MATH Level 5": 0.0476, + "GPQA": 0.2978, + "MUSR": 0.4369, + "MMLU-PRO": 0.3139 + } + }, + { + "model_id": "NousResearch/Hermes-3-Llama-3.2-3B", + "name": "Hermes-3-Llama-3.2-3B", + "developer": "NousResearch", + "scores": { + "IFEval": 0.3825, + "BBH": 0.4352, + "MATH Level 5": 0.0393, + "GPQA": 0.2752, + "MUSR": 0.403, + "MMLU-PRO": 0.2544 + } + }, + { + "model_id": "NousResearch/Nous-Hermes-2-Mistral-7B-DPO", + "name": "Nous-Hermes-2-Mistral-7B-DPO", + "developer": "NousResearch", + "scores": { + "IFEval": 0.5763, + "BBH": 0.4853, + "MATH Level 5": 0.0476, + "GPQA": 0.2928, + "MUSR": 0.4, + "MMLU-PRO": 0.3015 + } + }, + { + "model_id": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO", + "name": "Nous-Hermes-2-Mixtral-8x7B-DPO", + "developer": "NousResearch", + "scores": { + "IFEval": 0.5897, + "BBH": 0.5539, + "MATH Level 5": 0.1224, + "GPQA": 0.3213, + "MUSR": 0.4595, + "MMLU-PRO": 0.3666 + } + }, + { + "model_id": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT", + "name": "Nous-Hermes-2-Mixtral-8x7B-SFT", + "developer": "NousResearch", + "scores": { + "IFEval": 0.5731, + "BBH": 0.5058, + "MATH Level 5": 0.0211, + "GPQA": 0.302, + "MUSR": 0.4214, + "MMLU-PRO": 0.3066 + } + }, + { + "model_id": "NousResearch/Nous-Hermes-2-SOLAR-10.7B", + "name": "Nous-Hermes-2-SOLAR-10.7B", + "developer": "NousResearch", + "scores": { + "IFEval": 0.5279, + "BBH": 0.5414, + "MATH Level 5": 0.0574, + "GPQA": 0.2936, + "MUSR": 0.4373, + "MMLU-PRO": 0.3458 + } + }, + { + "model_id": "NousResearch/Nous-Hermes-llama-2-7b", + "name": "Nous-Hermes-llama-2-7b", + "developer": "NousResearch", + "scores": { + "IFEval": 0.1729, + "BBH": 0.3824, + "MATH Level 5": 0.0091, + "GPQA": 0.2634, + "MUSR": 0.4257, + "MMLU-PRO": 0.194 + } + }, + { + "model_id": "NousResearch/Yarn-Llama-2-13b-128k", + "name": "Yarn-Llama-2-13b-128k", + "developer": "NousResearch", + "scores": { + "IFEval": 0.1655, + "BBH": 0.3827, + "MATH Level 5": 0.0174, + "GPQA": 0.2584, + "MUSR": 0.3458, + "MMLU-PRO": 0.232 + } + }, + { + "model_id": "NousResearch/Yarn-Llama-2-7b-128k", + "name": "Yarn-Llama-2-7b-128k", + "developer": "NousResearch", + "scores": { + "IFEval": 0.1485, + "BBH": 0.3248, + "MATH Level 5": 0.0151, + "GPQA": 0.2601, + "MUSR": 0.3967, + "MMLU-PRO": 0.1791 + } + }, + { + "model_id": "NousResearch/Yarn-Llama-2-7b-64k", + "name": "Yarn-Llama-2-7b-64k", + "developer": "NousResearch", + "scores": { + "IFEval": 0.17, + "BBH": 0.3326, + "MATH Level 5": 0.0159, + "GPQA": 0.2643, + "MUSR": 0.3939, + "MMLU-PRO": 0.1799 + } + }, + { + "model_id": "NousResearch/Yarn-Mistral-7b-128k", + "name": "Yarn-Mistral-7b-128k", + "developer": "NousResearch", + "scores": { + "IFEval": 0.1934, + "BBH": 0.4314, + "MATH Level 5": 0.0317, + "GPQA": 0.2987, + "MUSR": 0.4071, + "MMLU-PRO": 0.2893 + } + }, + { + "model_id": "NousResearch/Yarn-Mistral-7b-64k", + "name": "Yarn-Mistral-7b-64k", + "developer": "NousResearch", + "scores": { + "IFEval": 0.208, + "BBH": 0.4293, + "MATH Level 5": 0.037, + "GPQA": 0.2903, + "MUSR": 0.4124, + "MMLU-PRO": 0.2914 + } + }, + { + "model_id": "NousResearch/Yarn-Solar-10b-32k", + "name": "Yarn-Solar-10b-32k", + "developer": "NousResearch", + "scores": { + "IFEval": 0.1942, + "BBH": 0.4987, + "MATH Level 5": 0.0302, + "GPQA": 0.3029, + "MUSR": 0.4146, + "MMLU-PRO": 0.3272 + } + }, + { + "model_id": "NousResearch/Yarn-Solar-10b-64k", + "name": "Yarn-Solar-10b-64k", + "developer": "NousResearch", + "scores": { + "IFEval": 0.1989, + "BBH": 0.4922, + "MATH Level 5": 0.0287, + "GPQA": 0.302, + "MUSR": 0.4014, + "MMLU-PRO": 0.3148 + } + }, + { + "model_id": "Novaciano/ASTAROTH-3.2-1B", + "name": "ASTAROTH-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5613, + "BBH": 0.3543, + "MATH Level 5": 0.0733, + "GPQA": 0.2559, + "MUSR": 0.3142, + "MMLU-PRO": 0.1909 + } + }, + { + "model_id": "Novaciano/BLAST_PROCESSING-3.2-1B", + "name": "BLAST_PROCESSING-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.3922, + "BBH": 0.346, + "MATH Level 5": 0.0748, + "GPQA": 0.2659, + "MUSR": 0.3351, + "MMLU-PRO": 0.1941 + } + }, + { + "model_id": "Novaciano/Cerberus-3.2-1B", + "name": "Cerberus-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5017, + "BBH": 0.4165, + "MATH Level 5": 0.0582, + "GPQA": 0.2584, + "MUSR": 0.3289, + "MMLU-PRO": 0.1663 + } + }, + { + "model_id": "Novaciano/Cultist-3.2-1B", + "name": "Cultist-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5295, + "BBH": 0.3399, + "MATH Level 5": 0.0589, + "GPQA": 0.2609, + "MUSR": 0.333, + "MMLU-PRO": 0.1714 + } + }, + { + "model_id": "Novaciano/FuseChat-3.2-1B-GRPO_Creative_RP", + "name": "FuseChat-3.2-1B-GRPO_Creative_RP", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5598, + "BBH": 0.3488, + "MATH Level 5": 0.0801, + "GPQA": 0.2559, + "MUSR": 0.3329, + "MMLU-PRO": 0.1735 + } + }, + { + "model_id": "Novaciano/Fusetrix-3.2-1B-GRPO_RP_Creative", + "name": "Fusetrix-3.2-1B-GRPO_RP_Creative", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5366, + "BBH": 0.3435, + "MATH Level 5": 0.1148, + "GPQA": 0.25, + "MUSR": 0.3209, + "MMLU-PRO": 0.1758 + } + }, + { + "model_id": "Novaciano/Fusetrix-Dolphin-3.2-1B-GRPO_Creative_RP", + "name": "Fusetrix-Dolphin-3.2-1B-GRPO_Creative_RP", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5343, + "BBH": 0.3502, + "MATH Level 5": 0.105, + "GPQA": 0.2685, + "MUSR": 0.3183, + "MMLU-PRO": 0.1823 + } + }, + { + "model_id": "Novaciano/HarmfulProject-3.2-1B", + "name": "HarmfulProject-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.3874, + "BBH": 0.3274, + "MATH Level 5": 0.0476, + "GPQA": 0.2668, + "MUSR": 0.3419, + "MMLU-PRO": 0.1823 + } + }, + { + "model_id": "Novaciano/LEWD-Mental-Cultist-3.2-1B", + "name": "LEWD-Mental-Cultist-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5309, + "BBH": 0.3513, + "MATH Level 5": 0.0529, + "GPQA": 0.2567, + "MUSR": 0.3223, + "MMLU-PRO": 0.1769 + } + }, + { + "model_id": "Novaciano/La_Mejor_Mezcla-3.2-1B", + "name": "La_Mejor_Mezcla-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.551, + "BBH": 0.3488, + "MATH Level 5": 0.0899, + "GPQA": 0.2576, + "MUSR": 0.3196, + "MMLU-PRO": 0.1829 + } + }, + { + "model_id": "Novaciano/Sigil-Of-Satan-3.2-1B", + "name": "Sigil-Of-Satan-3.2-1B", + "developer": "Novaciano", + "scores": { + "IFEval": 0.5494, + "BBH": 0.3546, + "MATH Level 5": 0.0544, + "GPQA": 0.2609, + "MUSR": 0.3276, + "MMLU-PRO": 0.1855 + } + }, + { + "model_id": "NucleusAI/nucleus-22B-token-500B", + "name": "nucleus-22B-token-500B", + "developer": "NucleusAI", + "scores": { + "IFEval": 0.0257, + "BBH": 0.292, + "MATH Level 5": 0.0, + "GPQA": 0.25, + "MUSR": 0.3511, + "MMLU-PRO": 0.1162 + } + }, + { + "model_id": "NyxKrage/Microsoft_Phi-4", + "name": "Microsoft_Phi-4", + "developer": "NyxKrage", + "scores": { + "IFEval": 0.0585, + "BBH": 0.6691, + "MATH Level 5": 0.2991, + "GPQA": 0.406, + "MUSR": 0.5034, + "MMLU-PRO": 0.5287 + } + }, + { + "model_id": "OEvortex/Emotional-llama-8B", + "name": "Emotional-llama-8B", + "developer": "OEvortex", + "scores": { + "IFEval": 0.3516, + "BBH": 0.4839, + "MATH Level 5": 0.0816, + "GPQA": 0.2945, + "MUSR": 0.3659, + "MMLU-PRO": 0.3535 + } + }, + { + "model_id": "OEvortex/HelpingAI-15B", + "name": "HelpingAI-15B", + "developer": "OEvortex", + "scores": { + "IFEval": 0.203, + "BBH": 0.2936, + "MATH Level 5": 0.0, + "GPQA": 0.2576, + "MUSR": 0.3619, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "OEvortex/HelpingAI-3B-reloaded", + "name": "HelpingAI-3B-reloaded", + "developer": "OEvortex", + "scores": { + "IFEval": 0.4647, + "BBH": 0.4129, + "MATH Level 5": 0.0136, + "GPQA": 0.2634, + "MUSR": 0.3524, + "MMLU-PRO": 0.2595 + } + }, + { + "model_id": "OEvortex/HelpingAI2-9B", + "name": "HelpingAI2-9B", + "developer": "OEvortex", + "scores": { + "IFEval": 0.4413, + "BBH": 0.4845, + "MATH Level 5": 0.0589, + "GPQA": 0.2584, + "MUSR": 0.3711, + "MMLU-PRO": 0.29 + } + }, + { + "model_id": "OEvortex/HelpingAI2.5-10B", + "name": "HelpingAI2.5-10B", + "developer": "OEvortex", + "scores": { + "IFEval": 0.3277, + "BBH": 0.4496, + "MATH Level 5": 0.0204, + "GPQA": 0.2693, + "MUSR": 0.3738, + "MMLU-PRO": 0.2575 + } + }, + { + "model_id": "OliveiraJLT/Sagui-7B-Instruct-v0.1", + "name": "Sagui-7B-Instruct-v0.1", + "developer": "OliveiraJLT", + "scores": { + "IFEval": 0.2892, + "BBH": 0.3111, + "MATH Level 5": 0.0151, + "GPQA": 0.2424, + "MUSR": 0.4191, + "MMLU-PRO": 0.1485 + } + }, + { + "model_id": "Omkar1102/code-yi", + "name": "code-yi", + "developer": "Omkar1102", + "scores": { + "IFEval": 0.2148, + "BBH": 0.276, + "MATH Level 5": 0.0, + "GPQA": 0.2508, + "MUSR": 0.3802, + "MMLU-PRO": 0.1126 + } + }, + { + "model_id": "OmnicromsBrain/NeuralStar_FusionWriter_4x7b", + "name": "NeuralStar_FusionWriter_4x7b", + "developer": "OmnicromsBrain", + "scores": { + "IFEval": 0.5964, + "BBH": 0.4776, + "MATH Level 5": 0.0491, + "GPQA": 0.2785, + "MUSR": 0.4019, + "MMLU-PRO": 0.2606 + } + }, + { + "model_id": "OnlyCheeini/greesychat-turbo", + "name": "greesychat-turbo", + "developer": "OnlyCheeini", + "scores": { + "IFEval": 0.0233, + "BBH": 0.3092, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3314, + "MMLU-PRO": 0.1138 + } + }, + { + "model_id": "Open-Orca/Mistral-7B-OpenOrca", + "name": "Mistral-7B-OpenOrca", + "developer": "Open-Orca", + "scores": { + "IFEval": 0.4978, + "BBH": 0.4768, + "MATH Level 5": 0.0355, + "GPQA": 0.2718, + "MUSR": 0.3858, + "MMLU-PRO": 0.2653 + } + }, + { + "model_id": "OpenAssistant/oasst-sft-1-pythia-12b", + "name": "oasst-sft-1-pythia-12b", + "developer": "OpenAssistant", + "scores": { + "IFEval": 0.1055, + "BBH": 0.3147, + "MATH Level 5": 0.0151, + "GPQA": 0.2576, + "MUSR": 0.3327, + "MMLU-PRO": 0.1113 + } + }, + { + "model_id": "OpenBuddy/openbuddy-falcon3-10b-v24.2-131k", + "name": "openbuddy-falcon3-10b-v24.2-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.5086, + "BBH": 0.6004, + "MATH Level 5": 0.213, + "GPQA": 0.2995, + "MUSR": 0.4186, + "MMLU-PRO": 0.3834 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3-70b-v21.2-32k", + "name": "openbuddy-llama3-70b-v21.2-32k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.701, + "BBH": 0.6507, + "MATH Level 5": 0.2032, + "GPQA": 0.3423, + "MUSR": 0.458, + "MMLU-PRO": 0.4832 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3-8b-v21.1-8k", + "name": "openbuddy-llama3-8b-v21.1-8k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.557, + "BBH": 0.4788, + "MATH Level 5": 0.0431, + "GPQA": 0.271, + "MUSR": 0.3988, + "MMLU-PRO": 0.2955 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3-8b-v21.2-32k", + "name": "openbuddy-llama3-8b-v21.2-32k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.6192, + "BBH": 0.4856, + "MATH Level 5": 0.0785, + "GPQA": 0.2794, + "MUSR": 0.3779, + "MMLU-PRO": 0.3299 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3.1-70b-v22.1-131k", + "name": "openbuddy-llama3.1-70b-v22.1-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.7333, + "BBH": 0.6698, + "MATH Level 5": 0.395, + "GPQA": 0.375, + "MUSR": 0.463, + "MMLU-PRO": 0.5304 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3.1-8b-v22.2-131k", + "name": "openbuddy-llama3.1-8b-v22.2-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.6657, + "BBH": 0.5007, + "MATH Level 5": 0.1148, + "GPQA": 0.2794, + "MUSR": 0.4081, + "MMLU-PRO": 0.331 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3.1-8b-v22.3-131k", + "name": "openbuddy-llama3.1-8b-v22.3-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.5997, + "BBH": 0.5066, + "MATH Level 5": 0.1208, + "GPQA": 0.2794, + "MUSR": 0.4015, + "MMLU-PRO": 0.3277 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3.2-1b-v23.1-131k", + "name": "openbuddy-llama3.2-1b-v23.1-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.359, + "BBH": 0.3267, + "MATH Level 5": 0.0249, + "GPQA": 0.2584, + "MUSR": 0.3342, + "MMLU-PRO": 0.184 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3.2-3b-v23.2-131k", + "name": "openbuddy-llama3.2-3b-v23.2-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.4319, + "BBH": 0.4073, + "MATH Level 5": 0.0264, + "GPQA": 0.276, + "MUSR": 0.3263, + "MMLU-PRO": 0.2479 + } + }, + { + "model_id": "OpenBuddy/openbuddy-llama3.3-70b-v24.1-131k", + "name": "openbuddy-llama3.3-70b-v24.1-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.8121, + "BBH": 0.6858, + "MATH Level 5": 0.4411, + "GPQA": 0.4346, + "MUSR": 0.4869, + "MMLU-PRO": 0.5327 + } + }, + { + "model_id": "OpenBuddy/openbuddy-mixtral-7bx8-v18.1-32k", + "name": "openbuddy-mixtral-7bx8-v18.1-32k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.5493, + "BBH": 0.4656, + "MATH Level 5": 0.108, + "GPQA": 0.3045, + "MUSR": 0.3831, + "MMLU-PRO": 0.3804 + } + }, + { + "model_id": "OpenBuddy/openbuddy-nemotron-70b-v23.1-131k", + "name": "openbuddy-nemotron-70b-v23.1-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.7555, + "BBH": 0.6749, + "MATH Level 5": 0.321, + "GPQA": 0.3633, + "MUSR": 0.4538, + "MMLU-PRO": 0.5175 + } + }, + { + "model_id": "OpenBuddy/openbuddy-nemotron-70b-v23.2-131k", + "name": "openbuddy-nemotron-70b-v23.2-131k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.7227, + "BBH": 0.6705, + "MATH Level 5": 0.3157, + "GPQA": 0.3599, + "MUSR": 0.4696, + "MMLU-PRO": 0.5121 + } + }, + { + "model_id": "OpenBuddy/openbuddy-qwen2.5llamaify-14b-v23.1-200k", + "name": "openbuddy-qwen2.5llamaify-14b-v23.1-200k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.6309, + "BBH": 0.6013, + "MATH Level 5": 0.2538, + "GPQA": 0.3331, + "MUSR": 0.424, + "MMLU-PRO": 0.4673 + } + }, + { + "model_id": "OpenBuddy/openbuddy-qwen2.5llamaify-14b-v23.3-200k", + "name": "openbuddy-qwen2.5llamaify-14b-v23.3-200k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.6131, + "BBH": 0.6081, + "MATH Level 5": 0.2311, + "GPQA": 0.3272, + "MUSR": 0.4346, + "MMLU-PRO": 0.4795 + } + }, + { + "model_id": "OpenBuddy/openbuddy-qwen2.5llamaify-7b-v23.1-200k", + "name": "openbuddy-qwen2.5llamaify-7b-v23.1-200k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.5673, + "BBH": 0.5509, + "MATH Level 5": 0.1888, + "GPQA": 0.3146, + "MUSR": 0.4363, + "MMLU-PRO": 0.3948 + } + }, + { + "model_id": "OpenBuddy/openbuddy-qwq-32b-v24.1-200k", + "name": "openbuddy-qwq-32b-v24.1-200k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.5937, + "BBH": 0.6798, + "MATH Level 5": 0.3739, + "GPQA": 0.3809, + "MUSR": 0.4849, + "MMLU-PRO": 0.549 + } + }, + { + "model_id": "OpenBuddy/openbuddy-qwq-32b-v24.2-200k", + "name": "openbuddy-qwq-32b-v24.2-200k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.597, + "BBH": 0.6772, + "MATH Level 5": 0.3776, + "GPQA": 0.3767, + "MUSR": 0.4718, + "MMLU-PRO": 0.5446 + } + }, + { + "model_id": "OpenBuddy/openbuddy-yi1.5-34b-v21.3-32k", + "name": "openbuddy-yi1.5-34b-v21.3-32k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.542, + "BBH": 0.6163, + "MATH Level 5": 0.1782, + "GPQA": 0.349, + "MUSR": 0.4439, + "MMLU-PRO": 0.4599 + } + }, + { + "model_id": "OpenBuddy/openbuddy-zero-14b-v22.3-32k", + "name": "openbuddy-zero-14b-v22.3-32k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.3753, + "BBH": 0.486, + "MATH Level 5": 0.0937, + "GPQA": 0.307, + "MUSR": 0.4166, + "MMLU-PRO": 0.3187 + } + }, + { + "model_id": "OpenBuddy/openbuddy-zero-3b-v21.2-32k", + "name": "openbuddy-zero-3b-v21.2-32k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.3802, + "BBH": 0.3935, + "MATH Level 5": 0.0189, + "GPQA": 0.2601, + "MUSR": 0.3566, + "MMLU-PRO": 0.2034 + } + }, + { + "model_id": "OpenBuddy/openbuddy-zero-56b-v21.2-32k", + "name": "openbuddy-zero-56b-v21.2-32k", + "developer": "OpenBuddy", + "scores": { + "IFEval": 0.5057, + "BBH": 0.6128, + "MATH Level 5": 0.1624, + "GPQA": 0.318, + "MUSR": 0.4305, + "MMLU-PRO": 0.4399 + } + }, + { + "model_id": "OpenGenerativeAI/Bifrost", + "name": "Bifrost", + "developer": "OpenGenerativeAI", + "scores": { + "IFEval": 0.6348, + "BBH": 0.6849, + "MATH Level 5": 0.2545, + "GPQA": 0.3683, + "MUSR": 0.4598, + "MMLU-PRO": 0.516 + } + }, + { + "model_id": "OpenGenerativeAI/Bifrost-14B", + "name": "Bifrost-14B", + "developer": "OpenGenerativeAI", + "scores": { + "IFEval": 0.6615, + "BBH": 0.6845, + "MATH Level 5": 0.2356, + "GPQA": 0.3792, + "MUSR": 0.4624, + "MMLU-PRO": 0.5074 + } + }, + { + "model_id": "OpenLLM-France/Lucie-7B", + "name": "Lucie-7B", + "developer": "OpenLLM-France", + "scores": { + "IFEval": 0.2496, + "BBH": 0.3492, + "MATH Level 5": 0.0144, + "GPQA": 0.2727, + "MUSR": 0.3923, + "MMLU-PRO": 0.1498 + } + }, + { + "model_id": "OpenLLM-France/Lucie-7B-Instruct", + "name": "Lucie-7B-Instruct", + "developer": "OpenLLM-France", + "scores": { + "IFEval": 0.2796, + "BBH": 0.3254, + "MATH Level 5": 0.0166, + "GPQA": 0.2794, + "MUSR": 0.3662, + "MMLU-PRO": 0.1556 + } + }, + { + "model_id": "OpenLLM-France/Lucie-7B-Instruct-human-data", + "name": "Lucie-7B-Instruct-human-data", + "developer": "OpenLLM-France", + "scores": { + "IFEval": 0.2946, + "BBH": 0.3284, + "MATH Level 5": 0.0219, + "GPQA": 0.2752, + "MUSR": 0.3729, + "MMLU-PRO": 0.143 + } + }, + { + "model_id": "OpenLLM-France/Lucie-7B-Instruct-v1.1", + "name": "Lucie-7B-Instruct-v1.1", + "developer": "OpenLLM-France", + "scores": { + "IFEval": 0.3039, + "BBH": 0.3816, + "MATH Level 5": 0.0317, + "GPQA": 0.2819, + "MUSR": 0.375, + "MMLU-PRO": 0.1864 + } + }, + { + "model_id": "OpenLeecher/llama3-8b-lima", + "name": "llama3-8b-lima", + "developer": "OpenLeecher", + "scores": { + "IFEval": 0.4371, + "BBH": 0.4296, + "MATH Level 5": 0.0506, + "GPQA": 0.2383, + "MUSR": 0.3713, + "MMLU-PRO": 0.2626 + } + }, + { + "model_id": "OpenScholar/Llama-3.1_OpenScholar-8B", + "name": "Llama-3.1_OpenScholar-8B", + "developer": "OpenScholar", + "scores": { + "IFEval": 0.6064, + "BBH": 0.5208, + "MATH Level 5": 0.1654, + "GPQA": 0.2819, + "MUSR": 0.4275, + "MMLU-PRO": 0.3708 + } + }, + { + "model_id": "Orenguteng/Llama-3.1-8B-Lexi-Uncensored", + "name": "Llama-3.1-8B-Lexi-Uncensored", + "developer": "Orenguteng", + "scores": { + "IFEval": 0.7777, + "BBH": 0.5057, + "MATH Level 5": 0.1571, + "GPQA": 0.2718, + "MUSR": 0.3871, + "MMLU-PRO": 0.379 + } + }, + { + "model_id": "Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2", + "name": "Llama-3.1-8B-Lexi-Uncensored-V2", + "developer": "Orenguteng", + "scores": { + "IFEval": 0.7792, + "BBH": 0.5084, + "MATH Level 5": 0.1971, + "GPQA": 0.2827, + "MUSR": 0.3843, + "MMLU-PRO": 0.3781 + } + }, + { + "model_id": "Orion-zhen/Qwen2.5-7B-Instruct-Uncensored", + "name": "Qwen2.5-7B-Instruct-Uncensored", + "developer": "Orion-zhen", + "scores": { + "IFEval": 0.7204, + "BBH": 0.5474, + "MATH Level 5": 0.4773, + "GPQA": 0.3029, + "MUSR": 0.4361, + "MMLU-PRO": 0.4427 + } + }, + { + "model_id": "Orion-zhen/phi-4-abliterated", + "name": "phi-4-abliterated", + "developer": "Orion-zhen", + "scores": { + "IFEval": 0.0576, + "BBH": 0.6698, + "MATH Level 5": 0.3021, + "GPQA": 0.4044, + "MUSR": 0.5006, + "MMLU-PRO": 0.5292 + } + }, + { + "model_id": "P0x0/Astra-v1-12B", + "name": "Astra-v1-12B", + "developer": "P0x0", + "scores": { + "IFEval": 0.2806, + "BBH": 0.5215, + "MATH Level 5": 0.1133, + "GPQA": 0.3138, + "MUSR": 0.4052, + "MMLU-PRO": 0.3461 + } + }, + { + "model_id": "PJMixers-Dev/L3.2-Instruct-Thinking-v0.1-1B", + "name": "L3.2-Instruct-Thinking-v0.1-1B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.4628, + "BBH": 0.3302, + "MATH Level 5": 0.0544, + "GPQA": 0.2576, + "MUSR": 0.3262, + "MMLU-PRO": 0.1483 + } + }, + { + "model_id": "PJMixers-Dev/LLaMa-3.1-Instruct-Interleaved-Zeroed-13B", + "name": "LLaMa-3.1-Instruct-Interleaved-Zeroed-13B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.7871, + "BBH": 0.5073, + "MATH Level 5": 0.2002, + "GPQA": 0.2919, + "MUSR": 0.387, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "PJMixers-Dev/LLaMa-3.1-RomboTiesTest-8B", + "name": "LLaMa-3.1-RomboTiesTest-8B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.7825, + "BBH": 0.5073, + "MATH Level 5": 0.2002, + "GPQA": 0.2919, + "MUSR": 0.387, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "PJMixers-Dev/LLaMa-3.1-RomboTiesTest2-8B", + "name": "LLaMa-3.1-RomboTiesTest2-8B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.7825, + "BBH": 0.5073, + "MATH Level 5": 0.2002, + "GPQA": 0.2919, + "MUSR": 0.387, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "PJMixers-Dev/LLaMa-3.2-Instruct-JankMix-v0.1-SFT-3B", + "name": "LLaMa-3.2-Instruct-JankMix-v0.1-SFT-3B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.6931, + "BBH": 0.4556, + "MATH Level 5": 0.1216, + "GPQA": 0.2743, + "MUSR": 0.37, + "MMLU-PRO": 0.3127 + } + }, + { + "model_id": "PJMixers-Dev/LLaMa-3.2-Instruct-JankMix-v0.2-SFT-3B", + "name": "LLaMa-3.2-Instruct-JankMix-v0.2-SFT-3B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.6292, + "BBH": 0.4581, + "MATH Level 5": 0.1299, + "GPQA": 0.2727, + "MUSR": 0.3659, + "MMLU-PRO": 0.3115 + } + }, + { + "model_id": "PJMixers-Dev/LLaMa-3.2-Instruct-JankMix-v0.2-SFT-HailMary-v0.1-KTO-3B", + "name": "LLaMa-3.2-Instruct-JankMix-v0.2-SFT-HailMary-v0.1-KTO-3B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.6504, + "BBH": 0.4511, + "MATH Level 5": 0.1261, + "GPQA": 0.2718, + "MUSR": 0.3687, + "MMLU-PRO": 0.3108 + } + }, + { + "model_id": "PJMixers-Dev/LLaMa-3.2-Instruct-JankMixBread-v0.1-3B", + "name": "LLaMa-3.2-Instruct-JankMixBread-v0.1-3B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.5041, + "BBH": 0.4483, + "MATH Level 5": 0.1307, + "GPQA": 0.2827, + "MUSR": 0.3516, + "MMLU-PRO": 0.3083 + } + }, + { + "model_id": "PJMixers-Dev/Qwen2.5-RomboTiesTest-7B", + "name": "Qwen2.5-RomboTiesTest-7B", + "developer": "PJMixers-Dev", + "scores": { + "IFEval": 0.7558, + "BBH": 0.5399, + "MATH Level 5": 0.4962, + "GPQA": 0.2978, + "MUSR": 0.4034, + "MMLU-PRO": 0.4285 + } + }, + { + "model_id": "PJMixers/LLaMa-3-CursedStock-v2.0-8B", + "name": "LLaMa-3-CursedStock-v2.0-8B", + "developer": "PJMixers", + "scores": { + "IFEval": 0.6331, + "BBH": 0.5271, + "MATH Level 5": 0.0944, + "GPQA": 0.2743, + "MUSR": 0.3856, + "MMLU-PRO": 0.3556 + } + }, + { + "model_id": "Parissa3/test-model", + "name": "test-model", + "developer": "Parissa3", + "scores": { + "IFEval": 0.3883, + "BBH": 0.5194, + "MATH Level 5": 0.065, + "GPQA": 0.2945, + "MUSR": 0.4685, + "MMLU-PRO": 0.3057 + } + }, + { + "model_id": "Pinkstack/PARM-V1.5-base-QwQ-Qwen-2.5-o1-3B", + "name": "PARM-V1.5-base-QwQ-Qwen-2.5-o1-3B", + "developer": "Pinkstack", + "scores": { + "IFEval": 0.5085, + "BBH": 0.4711, + "MATH Level 5": 0.1692, + "GPQA": 0.297, + "MUSR": 0.4479, + "MMLU-PRO": 0.3511 + } + }, + { + "model_id": "Pinkstack/SuperThoughts-CoT-14B-16k-o1-QwQ", + "name": "SuperThoughts-CoT-14B-16k-o1-QwQ", + "developer": "Pinkstack", + "scores": { + "IFEval": 0.0515, + "BBH": 0.672, + "MATH Level 5": 0.4199, + "GPQA": 0.3926, + "MUSR": 0.4914, + "MMLU-PRO": 0.5268 + } + }, + { + "model_id": "Pinkstack/Superthoughts-lite-1.8B-experimental-o1", + "name": "Superthoughts-lite-1.8B-experimental-o1", + "developer": "Pinkstack", + "scores": { + "IFEval": 0.0375, + "BBH": 0.3435, + "MATH Level 5": 0.0317, + "GPQA": 0.2752, + "MUSR": 0.3354, + "MMLU-PRO": 0.1851 + } + }, + { + "model_id": "Pinkstack/Superthoughts-lite-v1", + "name": "Superthoughts-lite-v1", + "developer": "Pinkstack", + "scores": { + "IFEval": 0.1659, + "BBH": 0.3466, + "MATH Level 5": 0.0295, + "GPQA": 0.281, + "MUSR": 0.3672, + "MMLU-PRO": 0.1755 + } + }, + { + "model_id": "PocketDoc/Dans-Instruct-CoreCurriculum-12b", + "name": "Dans-Instruct-CoreCurriculum-12b", + "developer": "PocketDoc", + "scores": { + "IFEval": 0.2191, + "BBH": 0.3789, + "MATH Level 5": 0.0544, + "GPQA": 0.2827, + "MUSR": 0.4096, + "MMLU-PRO": 0.1219 + } + }, + { + "model_id": "PocketDoc/Dans-PersonalityEngine-V1.1.0-12b", + "name": "Dans-PersonalityEngine-V1.1.0-12b", + "developer": "PocketDoc", + "scores": { + "IFEval": 0.7075, + "BBH": 0.5361, + "MATH Level 5": 0.105, + "GPQA": 0.2869, + "MUSR": 0.4587, + "MMLU-PRO": 0.3262 + } + }, + { + "model_id": "PocketDoc/Dans-PersonalityEngine-V1.2.0-24b", + "name": "Dans-PersonalityEngine-V1.2.0-24b", + "developer": "PocketDoc", + "scores": { + "IFEval": 0.7886, + "BBH": 0.6421, + "MATH Level 5": 0.2455, + "GPQA": 0.3188, + "MUSR": 0.43, + "MMLU-PRO": 0.5026 + } + }, + { + "model_id": "PocketDoc/Dans-PersonalityEngine-v1.0.0-8b", + "name": "Dans-PersonalityEngine-v1.0.0-8b", + "developer": "PocketDoc", + "scores": { + "IFEval": 0.4982, + "BBH": 0.4733, + "MATH Level 5": 0.0816, + "GPQA": 0.2852, + "MUSR": 0.3542, + "MMLU-PRO": 0.3065 + } + }, + { + "model_id": "PocketDoc/Dans-SakuraKaze-V1.0.0-12b", + "name": "Dans-SakuraKaze-V1.0.0-12b", + "developer": "PocketDoc", + "scores": { + "IFEval": 0.652, + "BBH": 0.5405, + "MATH Level 5": 0.0929, + "GPQA": 0.2936, + "MUSR": 0.4745, + "MMLU-PRO": 0.356 + } + }, + { + "model_id": "PowerInfer/SmallThinker-3B-Preview", + "name": "SmallThinker-3B-Preview", + "developer": "PowerInfer", + "scores": { + "IFEval": 0.62, + "BBH": 0.4495, + "MATH Level 5": 0.2779, + "GPQA": 0.2609, + "MUSR": 0.3525, + "MMLU-PRO": 0.3018 + } + }, + { + "model_id": "PranavHarshan/LaMistral-V4", + "name": "LaMistral-V4", + "developer": "PranavHarshan", + "scores": { + "IFEval": 0.6239, + "BBH": 0.5184, + "MATH Level 5": 0.0687, + "GPQA": 0.328, + "MUSR": 0.3643, + "MMLU-PRO": 0.3599 + } + }, + { + "model_id": "PranavHarshan/MedNarra-X1", + "name": "MedNarra-X1", + "developer": "PranavHarshan", + "scores": { + "IFEval": 0.4338, + "BBH": 0.4637, + "MATH Level 5": 0.0438, + "GPQA": 0.3079, + "MUSR": 0.354, + "MMLU-PRO": 0.3431 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_10.7B_48Layers-Appended", + "name": "OpenChat-3.5-0106_10.7B_48Layers-Appended", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.5961, + "BBH": 0.462, + "MATH Level 5": 0.0793, + "GPQA": 0.307, + "MUSR": 0.4254, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_10.7B_48Layers-Interleaved", + "name": "OpenChat-3.5-0106_10.7B_48Layers-Interleaved", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.5961, + "BBH": 0.462, + "MATH Level 5": 0.0778, + "GPQA": 0.3045, + "MUSR": 0.4254, + "MMLU-PRO": 0.3299 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_32K-PoSE", + "name": "OpenChat-3.5-0106_32K-PoSE", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.3969, + "BBH": 0.3471, + "MATH Level 5": 0.0264, + "GPQA": 0.276, + "MUSR": 0.4205, + "MMLU-PRO": 0.2031 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_8.11B_36Layers-Appended", + "name": "OpenChat-3.5-0106_8.11B_36Layers-Appended", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.5976, + "BBH": 0.462, + "MATH Level 5": 0.0793, + "GPQA": 0.307, + "MUSR": 0.4254, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_8.11B_36Layers-Interleaved", + "name": "OpenChat-3.5-0106_8.11B_36Layers-Interleaved", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.5961, + "BBH": 0.4621, + "MATH Level 5": 0.0778, + "GPQA": 0.3045, + "MUSR": 0.4241, + "MMLU-PRO": 0.3299 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_8.99B_40Layers-Appended", + "name": "OpenChat-3.5-0106_8.99B_40Layers-Appended", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.5961, + "BBH": 0.462, + "MATH Level 5": 0.0793, + "GPQA": 0.307, + "MUSR": 0.4254, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_8.99B_40Layers-Interleaved", + "name": "OpenChat-3.5-0106_8.99B_40Layers-Interleaved", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.5976, + "BBH": 0.4621, + "MATH Level 5": 0.0778, + "GPQA": 0.3045, + "MUSR": 0.4241, + "MMLU-PRO": 0.3299 + } + }, + { + "model_id": "Pretergeek/OpenChat-3.5-0106_9.86B_44Layers-Appended", + "name": "OpenChat-3.5-0106_9.86B_44Layers-Appended", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.5961, + "BBH": 0.462, + "MATH Level 5": 0.0793, + "GPQA": 0.307, + "MUSR": 0.4254, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "Pretergeek/openchat-3.5-0106_Rebased_Mistral-7B-v0.2", + "name": "openchat-3.5-0106_Rebased_Mistral-7B-v0.2", + "developer": "Pretergeek", + "scores": { + "IFEval": 0.3706, + "BBH": 0.3627, + "MATH Level 5": 0.0453, + "GPQA": 0.2718, + "MUSR": 0.484, + "MMLU-PRO": 0.283 + } + }, + { + "model_id": "PrimeIntellect/INTELLECT-1", + "name": "INTELLECT-1", + "developer": "PrimeIntellect", + "scores": { + "IFEval": 0.1757, + "BBH": 0.274, + "MATH Level 5": 0.0, + "GPQA": 0.25, + "MUSR": 0.3753, + "MMLU-PRO": 0.112 + } + }, + { + "model_id": "PrimeIntellect/INTELLECT-1-Instruct", + "name": "INTELLECT-1-Instruct", + "developer": "PrimeIntellect", + "scores": { + "IFEval": 0.0, + "BBH": 0.287, + "MATH Level 5": 0.0227, + "GPQA": 0.2483, + "MUSR": 0.3577, + "MMLU-PRO": 0.1064 + } + }, + { + "model_id": "PuxAI/LUA_model", + "name": "LUA_model", + "developer": "PuxAI", + "scores": { + "IFEval": 0.2282, + "BBH": 0.2877, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3484, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "PygmalionAI/pygmalion-6b", + "name": "pygmalion-6b", + "developer": "PygmalionAI", + "scores": { + "IFEval": 0.2091, + "BBH": 0.3199, + "MATH Level 5": 0.0083, + "GPQA": 0.2492, + "MUSR": 0.3684, + "MMLU-PRO": 0.1184 + } + }, + { + "model_id": "Q-bert/MetaMath-1B", + "name": "MetaMath-1B", + "developer": "Q-bert", + "scores": { + "IFEval": 0.53, + "BBH": 0.3451, + "MATH Level 5": 0.0627, + "GPQA": 0.2517, + "MUSR": 0.3289, + "MMLU-PRO": 0.1495 + } + }, + { + "model_id": "Quazim0t0/1up-14b", + "name": "1up-14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6888, + "BBH": 0.6921, + "MATH Level 5": 0.4162, + "GPQA": 0.3624, + "MUSR": 0.4583, + "MMLU-PRO": 0.5406 + } + }, + { + "model_id": "Quazim0t0/Adamant-14B-sce", + "name": "Adamant-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6858, + "BBH": 0.6859, + "MATH Level 5": 0.3988, + "GPQA": 0.3507, + "MUSR": 0.4558, + "MMLU-PRO": 0.5372 + } + }, + { + "model_id": "Quazim0t0/Alice-14B", + "name": "Alice-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6836, + "BBH": 0.6938, + "MATH Level 5": 0.4569, + "GPQA": 0.3515, + "MUSR": 0.4479, + "MMLU-PRO": 0.5419 + } + }, + { + "model_id": "Quazim0t0/Alien-CoT-14B-sce", + "name": "Alien-CoT-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.0749, + "BBH": 0.6395, + "MATH Level 5": 0.5204, + "GPQA": 0.3918, + "MUSR": 0.4785, + "MMLU-PRO": 0.517 + } + }, + { + "model_id": "Quazim0t0/Aura-8B-Linear", + "name": "Aura-8B-Linear", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.7948, + "BBH": 0.5074, + "MATH Level 5": 0.1805, + "GPQA": 0.2693, + "MUSR": 0.3687, + "MMLU-PRO": 0.3801 + } + }, + { + "model_id": "Quazim0t0/Casa-14b-sce", + "name": "Casa-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6654, + "BBH": 0.6901, + "MATH Level 5": 0.4698, + "GPQA": 0.3331, + "MUSR": 0.431, + "MMLU-PRO": 0.5426 + } + }, + { + "model_id": "Quazim0t0/Charlie-8B-Linear", + "name": "Charlie-8B-Linear", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.7381, + "BBH": 0.5141, + "MATH Level 5": 0.2651, + "GPQA": 0.271, + "MUSR": 0.3485, + "MMLU-PRO": 0.3573 + } + }, + { + "model_id": "Quazim0t0/Chromatic-8b-sce", + "name": "Chromatic-8b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5085, + "BBH": 0.5063, + "MATH Level 5": 0.1556, + "GPQA": 0.3196, + "MUSR": 0.4051, + "MMLU-PRO": 0.3755 + } + }, + { + "model_id": "Quazim0t0/CoT_Phi", + "name": "CoT_Phi", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6159, + "BBH": 0.6751, + "MATH Level 5": 0.3308, + "GPQA": 0.3582, + "MUSR": 0.4244, + "MMLU-PRO": 0.4901 + } + }, + { + "model_id": "Quazim0t0/Dyson-14b", + "name": "Dyson-14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5857, + "BBH": 0.6863, + "MATH Level 5": 0.5393, + "GPQA": 0.3138, + "MUSR": 0.4259, + "MMLU-PRO": 0.5399 + } + }, + { + "model_id": "Quazim0t0/Edu-14B-Linear", + "name": "Edu-14B-Linear", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6158, + "BBH": 0.6758, + "MATH Level 5": 0.2447, + "GPQA": 0.3171, + "MUSR": 0.4378, + "MMLU-PRO": 0.5086 + } + }, + { + "model_id": "Quazim0t0/Fugazi14b", + "name": "Fugazi14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6998, + "BBH": 0.6941, + "MATH Level 5": 0.4653, + "GPQA": 0.3515, + "MUSR": 0.4546, + "MMLU-PRO": 0.5417 + } + }, + { + "model_id": "Quazim0t0/GZA-14B-sce", + "name": "GZA-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6274, + "BBH": 0.6687, + "MATH Level 5": 0.4721, + "GPQA": 0.302, + "MUSR": 0.4285, + "MMLU-PRO": 0.5232 + } + }, + { + "model_id": "Quazim0t0/Geedorah-14B", + "name": "Geedorah-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6873, + "BBH": 0.6964, + "MATH Level 5": 0.4449, + "GPQA": 0.3473, + "MUSR": 0.4547, + "MMLU-PRO": 0.5421 + } + }, + { + "model_id": "Quazim0t0/GivingTree-8b-sce", + "name": "GivingTree-8b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5006, + "BBH": 0.504, + "MATH Level 5": 0.1526, + "GPQA": 0.3221, + "MUSR": 0.4051, + "MMLU-PRO": 0.3761 + } + }, + { + "model_id": "Quazim0t0/GuiltySpark-14B-ties", + "name": "GuiltySpark-14B-ties", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6854, + "BBH": 0.6914, + "MATH Level 5": 0.3837, + "GPQA": 0.3649, + "MUSR": 0.4557, + "MMLU-PRO": 0.54 + } + }, + { + "model_id": "Quazim0t0/Halo-14B-sce", + "name": "Halo-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6754, + "BBH": 0.6876, + "MATH Level 5": 0.429, + "GPQA": 0.3473, + "MUSR": 0.4401, + "MMLU-PRO": 0.5376 + } + }, + { + "model_id": "Quazim0t0/Heretic1.5b", + "name": "Heretic1.5b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.2062, + "BBH": 0.3529, + "MATH Level 5": 0.244, + "GPQA": 0.2685, + "MUSR": 0.3511, + "MMLU-PRO": 0.1728 + } + }, + { + "model_id": "Quazim0t0/Hyde-14b-sce", + "name": "Hyde-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6715, + "BBH": 0.6885, + "MATH Level 5": 0.2734, + "GPQA": 0.3414, + "MUSR": 0.4141, + "MMLU-PRO": 0.53 + } + }, + { + "model_id": "Quazim0t0/Imagine-v0.5-16bit", + "name": "Imagine-v0.5-16bit", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.2759, + "BBH": 0.6769, + "MATH Level 5": 0.1397, + "GPQA": 0.3649, + "MUSR": 0.4349, + "MMLU-PRO": 0.5354 + } + }, + { + "model_id": "Quazim0t0/Imbue-14b", + "name": "Imbue-14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.52, + "BBH": 0.6845, + "MATH Level 5": 0.5317, + "GPQA": 0.3129, + "MUSR": 0.4167, + "MMLU-PRO": 0.5402 + } + }, + { + "model_id": "Quazim0t0/Insom", + "name": "Insom", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6818, + "BBH": 0.6881, + "MATH Level 5": 0.3852, + "GPQA": 0.3498, + "MUSR": 0.4311, + "MMLU-PRO": 0.5352 + } + }, + { + "model_id": "Quazim0t0/InspectorDeck-14B-sce", + "name": "InspectorDeck-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.3241, + "BBH": 0.6668, + "MATH Level 5": 0.3165, + "GPQA": 0.297, + "MUSR": 0.3982, + "MMLU-PRO": 0.5261 + } + }, + { + "model_id": "Quazim0t0/Jekyl-8b-sce", + "name": "Jekyl-8b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.4697, + "BBH": 0.4994, + "MATH Level 5": 0.1616, + "GPQA": 0.3381, + "MUSR": 0.4197, + "MMLU-PRO": 0.3686 + } + }, + { + "model_id": "Quazim0t0/Jigsaw-14B-Linear", + "name": "Jigsaw-14B-Linear", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.648, + "BBH": 0.6865, + "MATH Level 5": 0.2651, + "GPQA": 0.3406, + "MUSR": 0.4483, + "MMLU-PRO": 0.5234 + } + }, + { + "model_id": "Quazim0t0/Katana-8b-sce", + "name": "Katana-8b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5107, + "BBH": 0.5075, + "MATH Level 5": 0.1511, + "GPQA": 0.3247, + "MUSR": 0.4038, + "MMLU-PRO": 0.3771 + } + }, + { + "model_id": "Quazim0t0/Knot-CoT-14B-sce", + "name": "Knot-CoT-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.4832, + "BBH": 0.6616, + "MATH Level 5": 0.3995, + "GPQA": 0.2936, + "MUSR": 0.414, + "MMLU-PRO": 0.5154 + } + }, + { + "model_id": "Quazim0t0/Lineage-14B", + "name": "Lineage-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.707, + "BBH": 0.6934, + "MATH Level 5": 0.4245, + "GPQA": 0.3599, + "MUSR": 0.4597, + "MMLU-PRO": 0.5411 + } + }, + { + "model_id": "Quazim0t0/Lo-Phi-14b", + "name": "Lo-Phi-14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.4941, + "BBH": 0.6852, + "MATH Level 5": 0.5196, + "GPQA": 0.328, + "MUSR": 0.4232, + "MMLU-PRO": 0.5369 + } + }, + { + "model_id": "Quazim0t0/Loke-14B-sce", + "name": "Loke-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6848, + "BBH": 0.6924, + "MATH Level 5": 0.3905, + "GPQA": 0.3649, + "MUSR": 0.4637, + "MMLU-PRO": 0.5401 + } + }, + { + "model_id": "Quazim0t0/MFDOOM-14B", + "name": "MFDOOM-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6736, + "BBH": 0.6916, + "MATH Level 5": 0.5264, + "GPQA": 0.323, + "MUSR": 0.4377, + "MMLU-PRO": 0.5426 + } + }, + { + "model_id": "Quazim0t0/MFGRIMM-14B", + "name": "MFGRIMM-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6894, + "BBH": 0.6909, + "MATH Level 5": 0.506, + "GPQA": 0.3339, + "MUSR": 0.4361, + "MMLU-PRO": 0.5416 + } + }, + { + "model_id": "Quazim0t0/Math_Phi4_Reason", + "name": "Math_Phi4_Reason", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.322, + "BBH": 0.624, + "MATH Level 5": 0.3278, + "GPQA": 0.2903, + "MUSR": 0.4034, + "MMLU-PRO": 0.503 + } + }, + { + "model_id": "Quazim0t0/Mithril-14B-sce", + "name": "Mithril-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6958, + "BBH": 0.6926, + "MATH Level 5": 0.3822, + "GPQA": 0.3691, + "MUSR": 0.4611, + "MMLU-PRO": 0.5403 + } + }, + { + "model_id": "Quazim0t0/Mononoke-14B-sce", + "name": "Mononoke-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.3502, + "BBH": 0.6744, + "MATH Level 5": 0.4698, + "GPQA": 0.323, + "MUSR": 0.4155, + "MMLU-PRO": 0.5298 + } + }, + { + "model_id": "Quazim0t0/Motion-8B-Linear", + "name": "Motion-8B-Linear", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.7686, + "BBH": 0.5084, + "MATH Level 5": 0.1888, + "GPQA": 0.271, + "MUSR": 0.3606, + "MMLU-PRO": 0.3785 + } + }, + { + "model_id": "Quazim0t0/Mouse-9B", + "name": "Mouse-9B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.1325, + "BBH": 0.2979, + "MATH Level 5": 0.0053, + "GPQA": 0.2542, + "MUSR": 0.347, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "Quazim0t0/Nova-14b-sce", + "name": "Nova-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.7022, + "BBH": 0.6935, + "MATH Level 5": 0.4162, + "GPQA": 0.3633, + "MUSR": 0.4571, + "MMLU-PRO": 0.5413 + } + }, + { + "model_id": "Quazim0t0/NovaScotia-14b-stock", + "name": "NovaScotia-14b-stock", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6787, + "BBH": 0.6935, + "MATH Level 5": 0.463, + "GPQA": 0.349, + "MUSR": 0.4493, + "MMLU-PRO": 0.5409 + } + }, + { + "model_id": "Quazim0t0/ODB-14B-sce", + "name": "ODB-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.2922, + "BBH": 0.6559, + "MATH Level 5": 0.2545, + "GPQA": 0.2659, + "MUSR": 0.3929, + "MMLU-PRO": 0.5207 + } + }, + { + "model_id": "Quazim0t0/ODB-14b-sce", + "name": "ODB-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.7016, + "BBH": 0.6942, + "MATH Level 5": 0.4116, + "GPQA": 0.3624, + "MUSR": 0.4571, + "MMLU-PRO": 0.5411 + } + }, + { + "model_id": "Quazim0t0/Oasis-14B-ties", + "name": "Oasis-14B-ties", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6937, + "BBH": 0.6915, + "MATH Level 5": 0.3754, + "GPQA": 0.3649, + "MUSR": 0.4571, + "MMLU-PRO": 0.5405 + } + }, + { + "model_id": "Quazim0t0/Origami-14B-sce", + "name": "Origami-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.3259, + "BBH": 0.662, + "MATH Level 5": 0.2915, + "GPQA": 0.2836, + "MUSR": 0.4035, + "MMLU-PRO": 0.5244 + } + }, + { + "model_id": "Quazim0t0/Phi4.Turn.R1Distill.16bit", + "name": "Phi4.Turn.R1Distill.16bit", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.3126, + "BBH": 0.6563, + "MATH Level 5": 0.2311, + "GPQA": 0.2945, + "MUSR": 0.3902, + "MMLU-PRO": 0.5257 + } + }, + { + "model_id": "Quazim0t0/Phi4.Turn.R1Distill_v1.5.1-Tensors", + "name": "Phi4.Turn.R1Distill_v1.5.1-Tensors", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.2995, + "BBH": 0.6456, + "MATH Level 5": 0.219, + "GPQA": 0.2685, + "MUSR": 0.3929, + "MMLU-PRO": 0.5117 + } + }, + { + "model_id": "Quazim0t0/Phi4Basis-14B-sce", + "name": "Phi4Basis-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6502, + "BBH": 0.6909, + "MATH Level 5": 0.4789, + "GPQA": 0.3289, + "MUSR": 0.4338, + "MMLU-PRO": 0.539 + } + }, + { + "model_id": "Quazim0t0/Ponder-14B-linear", + "name": "Ponder-14B-linear", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6906, + "BBH": 0.6943, + "MATH Level 5": 0.4282, + "GPQA": 0.3582, + "MUSR": 0.4558, + "MMLU-PRO": 0.5408 + } + }, + { + "model_id": "Quazim0t0/RZA-14B-sce", + "name": "RZA-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.4774, + "BBH": 0.6686, + "MATH Level 5": 0.5189, + "GPQA": 0.2903, + "MUSR": 0.4113, + "MMLU-PRO": 0.5383 + } + }, + { + "model_id": "Quazim0t0/Rosemary-14b", + "name": "Rosemary-14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6915, + "BBH": 0.6955, + "MATH Level 5": 0.4388, + "GPQA": 0.3565, + "MUSR": 0.4492, + "MMLU-PRO": 0.5396 + } + }, + { + "model_id": "Quazim0t0/Rune-14b", + "name": "Rune-14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.7016, + "BBH": 0.6937, + "MATH Level 5": 0.4585, + "GPQA": 0.3515, + "MUSR": 0.4533, + "MMLU-PRO": 0.5411 + } + }, + { + "model_id": "Quazim0t0/SZA-14B-sce", + "name": "SZA-14B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5659, + "BBH": 0.6889, + "MATH Level 5": 0.5242, + "GPQA": 0.3305, + "MUSR": 0.4339, + "MMLU-PRO": 0.5353 + } + }, + { + "model_id": "Quazim0t0/Sake-20b", + "name": "Sake-20b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6693, + "BBH": 0.677, + "MATH Level 5": 0.4653, + "GPQA": 0.3188, + "MUSR": 0.4494, + "MMLU-PRO": 0.5391 + } + }, + { + "model_id": "Quazim0t0/Spok-14b-sce", + "name": "Spok-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6682, + "BBH": 0.6899, + "MATH Level 5": 0.2719, + "GPQA": 0.3456, + "MUSR": 0.4141, + "MMLU-PRO": 0.5298 + } + }, + { + "model_id": "Quazim0t0/Sumatra-20b", + "name": "Sumatra-20b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6738, + "BBH": 0.6855, + "MATH Level 5": 0.3671, + "GPQA": 0.3263, + "MUSR": 0.456, + "MMLU-PRO": 0.5415 + } + }, + { + "model_id": "Quazim0t0/SuperNova14b", + "name": "SuperNova14b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.7076, + "BBH": 0.6937, + "MATH Level 5": 0.4396, + "GPQA": 0.3523, + "MUSR": 0.4545, + "MMLU-PRO": 0.5435 + } + }, + { + "model_id": "Quazim0t0/TB0-8B-sce", + "name": "TB0-8B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5107, + "BBH": 0.5075, + "MATH Level 5": 0.1511, + "GPQA": 0.3247, + "MUSR": 0.4038, + "MMLU-PRO": 0.3771 + } + }, + { + "model_id": "Quazim0t0/TBL-8B-sce", + "name": "TBL-8B-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.4581, + "BBH": 0.5008, + "MATH Level 5": 0.1533, + "GPQA": 0.3339, + "MUSR": 0.4236, + "MMLU-PRO": 0.3689 + } + }, + { + "model_id": "Quazim0t0/ThinkPhi1.1-Tensors", + "name": "ThinkPhi1.1-Tensors", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.3908, + "BBH": 0.6449, + "MATH Level 5": 0.182, + "GPQA": 0.2987, + "MUSR": 0.418, + "MMLU-PRO": 0.4908 + } + }, + { + "model_id": "Quazim0t0/Venti-20b", + "name": "Venti-20b", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6641, + "BBH": 0.6901, + "MATH Level 5": 0.3391, + "GPQA": 0.3322, + "MUSR": 0.448, + "MMLU-PRO": 0.5386 + } + }, + { + "model_id": "Quazim0t0/Venti-Blend-sce", + "name": "Venti-Blend-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6879, + "BBH": 0.6843, + "MATH Level 5": 0.4056, + "GPQA": 0.3163, + "MUSR": 0.4389, + "MMLU-PRO": 0.5414 + } + }, + { + "model_id": "Quazim0t0/Vine-14b-sce", + "name": "Vine-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6733, + "BBH": 0.6891, + "MATH Level 5": 0.5008, + "GPQA": 0.3339, + "MUSR": 0.4323, + "MMLU-PRO": 0.5408 + } + }, + { + "model_id": "Quazim0t0/Wendy-14B", + "name": "Wendy-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6772, + "BBH": 0.6958, + "MATH Level 5": 0.4834, + "GPQA": 0.3322, + "MUSR": 0.4428, + "MMLU-PRO": 0.5435 + } + }, + { + "model_id": "Quazim0t0/Wu-14b-sce", + "name": "Wu-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6718, + "BBH": 0.6885, + "MATH Level 5": 0.2613, + "GPQA": 0.3465, + "MUSR": 0.4114, + "MMLU-PRO": 0.5293 + } + }, + { + "model_id": "Quazim0t0/bloom-14b-stock", + "name": "bloom-14b-stock", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6575, + "BBH": 0.6878, + "MATH Level 5": 0.4811, + "GPQA": 0.3314, + "MUSR": 0.431, + "MMLU-PRO": 0.5373 + } + }, + { + "model_id": "Quazim0t0/caramel-14B", + "name": "caramel-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6745, + "BBH": 0.6919, + "MATH Level 5": 0.4713, + "GPQA": 0.3448, + "MUSR": 0.4454, + "MMLU-PRO": 0.5436 + } + }, + { + "model_id": "Quazim0t0/graphite-14b-sce", + "name": "graphite-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.3217, + "BBH": 0.6631, + "MATH Level 5": 0.3006, + "GPQA": 0.2894, + "MUSR": 0.3981, + "MMLU-PRO": 0.528 + } + }, + { + "model_id": "Quazim0t0/mocha-14B", + "name": "mocha-14B", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5893, + "BBH": 0.6895, + "MATH Level 5": 0.5264, + "GPQA": 0.3305, + "MUSR": 0.4272, + "MMLU-PRO": 0.5384 + } + }, + { + "model_id": "Quazim0t0/mosaic-14b-sce", + "name": "mosaic-14b-sce", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6876, + "BBH": 0.6907, + "MATH Level 5": 0.4026, + "GPQA": 0.3624, + "MUSR": 0.4558, + "MMLU-PRO": 0.5396 + } + }, + { + "model_id": "Quazim0t0/tesseract-14b-stock", + "name": "tesseract-14b-stock", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.5848, + "BBH": 0.688, + "MATH Level 5": 0.5144, + "GPQA": 0.3272, + "MUSR": 0.4232, + "MMLU-PRO": 0.5389 + } + }, + { + "model_id": "Quazim0t0/time-14b-stock", + "name": "time-14b-stock", + "developer": "Quazim0t0", + "scores": { + "IFEval": 0.6699, + "BBH": 0.6897, + "MATH Level 5": 0.5083, + "GPQA": 0.3347, + "MUSR": 0.4323, + "MMLU-PRO": 0.5419 + } + }, + { + "model_id": "Qwen/QwQ-32B", + "name": "QwQ-32B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3977, + "BBH": 0.2983, + "MATH Level 5": 0.1609, + "GPQA": 0.2601, + "MUSR": 0.4206, + "MMLU-PRO": 0.1196 + } + }, + { + "model_id": "Qwen/QwQ-32B-Preview", + "name": "QwQ-32B-Preview", + "developer": "Qwen", + "scores": { + "IFEval": 0.4035, + "BBH": 0.6691, + "MATH Level 5": 0.4494, + "GPQA": 0.2819, + "MUSR": 0.411, + "MMLU-PRO": 0.5678 + } + }, + { + "model_id": "Qwen/Qwen1.5-0.5B", + "name": "Qwen1.5-0.5B", + "developer": "Qwen", + "scores": { + "IFEval": 0.1706, + "BBH": 0.3154, + "MATH Level 5": 0.0174, + "GPQA": 0.2542, + "MUSR": 0.3616, + "MMLU-PRO": 0.1307 + } + }, + { + "model_id": "Qwen/Qwen1.5-0.5B-Chat", + "name": "Qwen1.5-0.5B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.1807, + "BBH": 0.3167, + "MATH Level 5": 0.0068, + "GPQA": 0.2693, + "MUSR": 0.3837, + "MMLU-PRO": 0.1213 + } + }, + { + "model_id": "Qwen/Qwen1.5-1.8B", + "name": "Qwen1.5-1.8B", + "developer": "Qwen", + "scores": { + "IFEval": 0.2154, + "BBH": 0.3476, + "MATH Level 5": 0.0317, + "GPQA": 0.3054, + "MUSR": 0.3605, + "MMLU-PRO": 0.1882 + } + }, + { + "model_id": "Qwen/Qwen1.5-1.8B-Chat", + "name": "Qwen1.5-1.8B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.2019, + "BBH": 0.3256, + "MATH Level 5": 0.0196, + "GPQA": 0.2978, + "MUSR": 0.426, + "MMLU-PRO": 0.1804 + } + }, + { + "model_id": "Qwen/Qwen1.5-110B", + "name": "Qwen1.5-110B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3422, + "BBH": 0.61, + "MATH Level 5": 0.247, + "GPQA": 0.3523, + "MUSR": 0.4408, + "MMLU-PRO": 0.5361 + } + }, + { + "model_id": "Qwen/Qwen1.5-110B-Chat", + "name": "Qwen1.5-110B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.5939, + "BBH": 0.6184, + "MATH Level 5": 0.2341, + "GPQA": 0.3414, + "MUSR": 0.4522, + "MMLU-PRO": 0.4825 + } + }, + { + "model_id": "Qwen/Qwen1.5-14B", + "name": "Qwen1.5-14B", + "developer": "Qwen", + "scores": { + "IFEval": 0.2905, + "BBH": 0.508, + "MATH Level 5": 0.2024, + "GPQA": 0.2945, + "MUSR": 0.4186, + "MMLU-PRO": 0.3644 + } + }, + { + "model_id": "Qwen/Qwen1.5-14B-Chat", + "name": "Qwen1.5-14B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.4768, + "BBH": 0.5229, + "MATH Level 5": 0.1526, + "GPQA": 0.2701, + "MUSR": 0.44, + "MMLU-PRO": 0.3618 + } + }, + { + "model_id": "Qwen/Qwen1.5-32B", + "name": "Qwen1.5-32B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3297, + "BBH": 0.5715, + "MATH Level 5": 0.3029, + "GPQA": 0.3297, + "MUSR": 0.4278, + "MMLU-PRO": 0.45 + } + }, + { + "model_id": "Qwen/Qwen1.5-32B-Chat", + "name": "Qwen1.5-32B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.5532, + "BBH": 0.6067, + "MATH Level 5": 0.1956, + "GPQA": 0.3062, + "MUSR": 0.416, + "MMLU-PRO": 0.4457 + } + }, + { + "model_id": "Qwen/Qwen1.5-4B", + "name": "Qwen1.5-4B", + "developer": "Qwen", + "scores": { + "IFEval": 0.2445, + "BBH": 0.4054, + "MATH Level 5": 0.0529, + "GPQA": 0.2768, + "MUSR": 0.3604, + "MMLU-PRO": 0.246 + } + }, + { + "model_id": "Qwen/Qwen1.5-4B-Chat", + "name": "Qwen1.5-4B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.3157, + "BBH": 0.4006, + "MATH Level 5": 0.0279, + "GPQA": 0.2668, + "MUSR": 0.3978, + "MMLU-PRO": 0.2396 + } + }, + { + "model_id": "Qwen/Qwen1.5-7B", + "name": "Qwen1.5-7B", + "developer": "Qwen", + "scores": { + "IFEval": 0.2684, + "BBH": 0.456, + "MATH Level 5": 0.0929, + "GPQA": 0.2987, + "MUSR": 0.4103, + "MMLU-PRO": 0.2916 + } + }, + { + "model_id": "Qwen/Qwen1.5-7B-Chat", + "name": "Qwen1.5-7B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.4371, + "BBH": 0.451, + "MATH Level 5": 0.0627, + "GPQA": 0.3029, + "MUSR": 0.3779, + "MMLU-PRO": 0.2951 + } + }, + { + "model_id": "Qwen/Qwen1.5-MoE-A2.7B", + "name": "Qwen1.5-MoE-A2.7B", + "developer": "Qwen", + "scores": { + "IFEval": 0.266, + "BBH": 0.4114, + "MATH Level 5": 0.0929, + "GPQA": 0.2592, + "MUSR": 0.4013, + "MMLU-PRO": 0.2778 + } + }, + { + "model_id": "Qwen/Qwen1.5-MoE-A2.7B-Chat", + "name": "Qwen1.5-MoE-A2.7B-Chat", + "developer": "Qwen", + "scores": { + "IFEval": 0.3795, + "BBH": 0.4272, + "MATH Level 5": 0.0634, + "GPQA": 0.2743, + "MUSR": 0.3899, + "MMLU-PRO": 0.2923 + } + }, + { + "model_id": "Qwen/Qwen2-0.5B", + "name": "Qwen2-0.5B", + "developer": "Qwen", + "scores": { + "IFEval": 0.1873, + "BBH": 0.3239, + "MATH Level 5": 0.0264, + "GPQA": 0.2609, + "MUSR": 0.3752, + "MMLU-PRO": 0.172 + } + }, + { + "model_id": "Qwen/Qwen2-0.5B-Instruct", + "name": "Qwen2-0.5B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.2247, + "BBH": 0.3173, + "MATH Level 5": 0.0287, + "GPQA": 0.2466, + "MUSR": 0.3353, + "MMLU-PRO": 0.1531 + } + }, + { + "model_id": "Qwen/Qwen2-1.5B", + "name": "Qwen2-1.5B", + "developer": "Qwen", + "scores": { + "IFEval": 0.2113, + "BBH": 0.3575, + "MATH Level 5": 0.0702, + "GPQA": 0.2643, + "MUSR": 0.3658, + "MMLU-PRO": 0.2552 + } + }, + { + "model_id": "Qwen/Qwen2-1.5B-Instruct", + "name": "Qwen2-1.5B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.3371, + "BBH": 0.3852, + "MATH Level 5": 0.0718, + "GPQA": 0.2617, + "MUSR": 0.4293, + "MMLU-PRO": 0.2501 + } + }, + { + "model_id": "Qwen/Qwen2-57B-A14B", + "name": "Qwen2-57B-A14B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3113, + "BBH": 0.5618, + "MATH Level 5": 0.1866, + "GPQA": 0.3062, + "MUSR": 0.4174, + "MMLU-PRO": 0.4916 + } + }, + { + "model_id": "Qwen/Qwen2-57B-A14B-Instruct", + "name": "Qwen2-57B-A14B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.6338, + "BBH": 0.5888, + "MATH Level 5": 0.2817, + "GPQA": 0.3314, + "MUSR": 0.4361, + "MMLU-PRO": 0.4575 + } + }, + { + "model_id": "Qwen/Qwen2-72B", + "name": "Qwen2-72B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3824, + "BBH": 0.6617, + "MATH Level 5": 0.3112, + "GPQA": 0.3943, + "MUSR": 0.4704, + "MMLU-PRO": 0.5731 + } + }, + { + "model_id": "Qwen/Qwen2-72B-Instruct", + "name": "Qwen2-72B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.7989, + "BBH": 0.6977, + "MATH Level 5": 0.4177, + "GPQA": 0.3725, + "MUSR": 0.456, + "MMLU-PRO": 0.5403 + } + }, + { + "model_id": "Qwen/Qwen2-7B", + "name": "Qwen2-7B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3149, + "BBH": 0.5315, + "MATH Level 5": 0.2039, + "GPQA": 0.3045, + "MUSR": 0.4439, + "MMLU-PRO": 0.4183 + } + }, + { + "model_id": "Qwen/Qwen2-7B-Instruct", + "name": "Qwen2-7B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.5679, + "BBH": 0.5545, + "MATH Level 5": 0.2764, + "GPQA": 0.2978, + "MUSR": 0.3928, + "MMLU-PRO": 0.3847 + } + }, + { + "model_id": "Qwen/Qwen2-Math-72B-Instruct", + "name": "Qwen2-Math-72B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.5694, + "BBH": 0.6343, + "MATH Level 5": 0.5536, + "GPQA": 0.3683, + "MUSR": 0.4517, + "MMLU-PRO": 0.4273 + } + }, + { + "model_id": "Qwen/Qwen2-Math-7B", + "name": "Qwen2-Math-7B", + "developer": "Qwen", + "scores": { + "IFEval": 0.2687, + "BBH": 0.387, + "MATH Level 5": 0.2477, + "GPQA": 0.2634, + "MUSR": 0.3593, + "MMLU-PRO": 0.1197 + } + }, + { + "model_id": "Qwen/Qwen2-VL-72B-Instruct", + "name": "Qwen2-VL-72B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.5982, + "BBH": 0.6946, + "MATH Level 5": 0.3444, + "GPQA": 0.3876, + "MUSR": 0.4492, + "MMLU-PRO": 0.5717 + } + }, + { + "model_id": "Qwen/Qwen2-VL-7B-Instruct", + "name": "Qwen2-VL-7B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.4599, + "BBH": 0.5465, + "MATH Level 5": 0.1986, + "GPQA": 0.3196, + "MUSR": 0.4375, + "MMLU-PRO": 0.4095 + } + }, + { + "model_id": "Qwen/Qwen2.5-0.5B", + "name": "Qwen2.5-0.5B", + "developer": "Qwen", + "scores": { + "IFEval": 0.1627, + "BBH": 0.3275, + "MATH Level 5": 0.0393, + "GPQA": 0.2466, + "MUSR": 0.3433, + "MMLU-PRO": 0.1906 + } + }, + { + "model_id": "Qwen/Qwen2.5-0.5B-Instruct", + "name": "Qwen2.5-0.5B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.3153, + "BBH": 0.3322, + "MATH Level 5": 0.1035, + "GPQA": 0.2592, + "MUSR": 0.3342, + "MMLU-PRO": 0.172 + } + }, + { + "model_id": "Qwen/Qwen2.5-1.5B", + "name": "Qwen2.5-1.5B", + "developer": "Qwen", + "scores": { + "IFEval": 0.2674, + "BBH": 0.4078, + "MATH Level 5": 0.0914, + "GPQA": 0.2852, + "MUSR": 0.3576, + "MMLU-PRO": 0.2855 + } + }, + { + "model_id": "Qwen/Qwen2.5-1.5B-Instruct", + "name": "Qwen2.5-1.5B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.4476, + "BBH": 0.4289, + "MATH Level 5": 0.2205, + "GPQA": 0.2559, + "MUSR": 0.3663, + "MMLU-PRO": 0.2799 + } + }, + { + "model_id": "Qwen/Qwen2.5-14B", + "name": "Qwen2.5-14B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3694, + "BBH": 0.6161, + "MATH Level 5": 0.29, + "GPQA": 0.3817, + "MUSR": 0.4502, + "MMLU-PRO": 0.5249 + } + }, + { + "model_id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen2.5-14B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.8158, + "BBH": 0.639, + "MATH Level 5": 0.5476, + "GPQA": 0.3221, + "MUSR": 0.4101, + "MMLU-PRO": 0.4904 + } + }, + { + "model_id": "Qwen/Qwen2.5-14B-Instruct-1M", + "name": "Qwen2.5-14B-Instruct-1M", + "developer": "Qwen", + "scores": { + "IFEval": 0.8414, + "BBH": 0.6198, + "MATH Level 5": 0.5302, + "GPQA": 0.3431, + "MUSR": 0.418, + "MMLU-PRO": 0.485 + } + }, + { + "model_id": "Qwen/Qwen2.5-32B", + "name": "Qwen2.5-32B", + "developer": "Qwen", + "scores": { + "IFEval": 0.4077, + "BBH": 0.6771, + "MATH Level 5": 0.3565, + "GPQA": 0.4119, + "MUSR": 0.4978, + "MMLU-PRO": 0.5805 + } + }, + { + "model_id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen2.5-32B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.8346, + "BBH": 0.6913, + "MATH Level 5": 0.6254, + "GPQA": 0.3381, + "MUSR": 0.4261, + "MMLU-PRO": 0.5667 + } + }, + { + "model_id": "Qwen/Qwen2.5-3B", + "name": "Qwen2.5-3B", + "developer": "Qwen", + "scores": { + "IFEval": 0.269, + "BBH": 0.4612, + "MATH Level 5": 0.148, + "GPQA": 0.2978, + "MUSR": 0.4303, + "MMLU-PRO": 0.3203 + } + }, + { + "model_id": "Qwen/Qwen2.5-3B-Instruct", + "name": "Qwen2.5-3B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.6475, + "BBH": 0.4693, + "MATH Level 5": 0.3678, + "GPQA": 0.2727, + "MUSR": 0.3968, + "MMLU-PRO": 0.3255 + } + }, + { + "model_id": "Qwen/Qwen2.5-72B", + "name": "Qwen2.5-72B", + "developer": "Qwen", + "scores": { + "IFEval": 0.4137, + "BBH": 0.6797, + "MATH Level 5": 0.3912, + "GPQA": 0.4052, + "MUSR": 0.4771, + "MMLU-PRO": 0.5968 + } + }, + { + "model_id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen2.5-72B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.8638, + "BBH": 0.7273, + "MATH Level 5": 0.5982, + "GPQA": 0.375, + "MUSR": 0.4206, + "MMLU-PRO": 0.5626 + } + }, + { + "model_id": "Qwen/Qwen2.5-7B", + "name": "Qwen2.5-7B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3374, + "BBH": 0.5416, + "MATH Level 5": 0.2508, + "GPQA": 0.3247, + "MUSR": 0.4424, + "MMLU-PRO": 0.4365 + } + }, + { + "model_id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen2.5-7B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.7585, + "BBH": 0.5394, + "MATH Level 5": 0.5, + "GPQA": 0.2911, + "MUSR": 0.402, + "MMLU-PRO": 0.4287 + } + }, + { + "model_id": "Qwen/Qwen2.5-7B-Instruct-1M", + "name": "Qwen2.5-7B-Instruct-1M", + "developer": "Qwen", + "scores": { + "IFEval": 0.7448, + "BBH": 0.5404, + "MATH Level 5": 0.4335, + "GPQA": 0.2978, + "MUSR": 0.4087, + "MMLU-PRO": 0.3505 + } + }, + { + "model_id": "Qwen/Qwen2.5-Coder-14B", + "name": "Qwen2.5-Coder-14B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3473, + "BBH": 0.5865, + "MATH Level 5": 0.2251, + "GPQA": 0.2928, + "MUSR": 0.3874, + "MMLU-PRO": 0.4521 + } + }, + { + "model_id": "Qwen/Qwen2.5-Coder-14B-Instruct", + "name": "Qwen2.5-Coder-14B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.6908, + "BBH": 0.614, + "MATH Level 5": 0.3248, + "GPQA": 0.3045, + "MUSR": 0.3915, + "MMLU-PRO": 0.3939 + } + }, + { + "model_id": "Qwen/Qwen2.5-Coder-32B", + "name": "Qwen2.5-Coder-32B", + "developer": "Qwen", + "scores": { + "IFEval": 0.4363, + "BBH": 0.6404, + "MATH Level 5": 0.3089, + "GPQA": 0.3465, + "MUSR": 0.4528, + "MMLU-PRO": 0.5303 + } + }, + { + "model_id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.7265, + "BBH": 0.6625, + "MATH Level 5": 0.4955, + "GPQA": 0.349, + "MUSR": 0.4386, + "MMLU-PRO": 0.4413 + } + }, + { + "model_id": "Qwen/Qwen2.5-Coder-7B", + "name": "Qwen2.5-Coder-7B", + "developer": "Qwen", + "scores": { + "IFEval": 0.3446, + "BBH": 0.4856, + "MATH Level 5": 0.1918, + "GPQA": 0.2592, + "MUSR": 0.3449, + "MMLU-PRO": 0.3679 + } + }, + { + "model_id": "Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Qwen2.5-Coder-7B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.6147, + "BBH": 0.4999, + "MATH Level 5": 0.031, + "GPQA": 0.2936, + "MUSR": 0.4099, + "MMLU-PRO": 0.3354 + } + }, + { + "model_id": "Qwen/Qwen2.5-Math-1.5B-Instruct", + "name": "Qwen2.5-Math-1.5B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.1856, + "BBH": 0.3752, + "MATH Level 5": 0.2628, + "GPQA": 0.2651, + "MUSR": 0.3685, + "MMLU-PRO": 0.1801 + } + }, + { + "model_id": "Qwen/Qwen2.5-Math-72B-Instruct", + "name": "Qwen2.5-Math-72B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.4003, + "BBH": 0.6452, + "MATH Level 5": 0.6239, + "GPQA": 0.3314, + "MUSR": 0.4473, + "MMLU-PRO": 0.4812 + } + }, + { + "model_id": "Qwen/Qwen2.5-Math-7B", + "name": "Qwen2.5-Math-7B", + "developer": "Qwen", + "scores": { + "IFEval": 0.246, + "BBH": 0.4455, + "MATH Level 5": 0.3051, + "GPQA": 0.2936, + "MUSR": 0.3781, + "MMLU-PRO": 0.2718 + } + }, + { + "model_id": "Qwen/Qwen2.5-Math-7B-Instruct", + "name": "Qwen2.5-Math-7B-Instruct", + "developer": "Qwen", + "scores": { + "IFEval": 0.2636, + "BBH": 0.4388, + "MATH Level 5": 0.5808, + "GPQA": 0.2617, + "MUSR": 0.3647, + "MMLU-PRO": 0.282 + } + }, + { + "model_id": "RDson/WomboCombo-R1-Coder-14B-Preview", + "name": "WomboCombo-R1-Coder-14B-Preview", + "developer": "RDson", + "scores": { + "IFEval": 0.6286, + "BBH": 0.6392, + "MATH Level 5": 0.5989, + "GPQA": 0.3213, + "MUSR": 0.4844, + "MMLU-PRO": 0.5168 + } + }, + { + "model_id": "RESMPDEV/EVA-Qwen2.5-1.5B-FRFR", + "name": "EVA-Qwen2.5-1.5B-FRFR", + "developer": "RESMPDEV", + "scores": { + "IFEval": 0.3082, + "BBH": 0.3932, + "MATH Level 5": 0.1027, + "GPQA": 0.2794, + "MUSR": 0.3539, + "MMLU-PRO": 0.277 + } + }, + { + "model_id": "RESMPDEV/Qwen2-Wukong-0.5B", + "name": "Qwen2-Wukong-0.5B", + "developer": "RESMPDEV", + "scores": { + "IFEval": 0.1854, + "BBH": 0.3085, + "MATH Level 5": 0.0015, + "GPQA": 0.2366, + "MUSR": 0.3525, + "MMLU-PRO": 0.1327 + } + }, + { + "model_id": "RLHFlow/ArmoRM-Llama3-8B-v0.1", + "name": "ArmoRM-Llama3-8B-v0.1", + "developer": "RLHFlow", + "scores": { + "IFEval": 0.1897, + "BBH": 0.2876, + "MATH Level 5": 0.0, + "GPQA": 0.2492, + "MUSR": 0.3948, + "MMLU-PRO": 0.1078 + } + }, + { + "model_id": "RLHFlow/LLaMA3-iterative-DPO-final", + "name": "LLaMA3-iterative-DPO-final", + "developer": "RLHFlow", + "scores": { + "IFEval": 0.534, + "BBH": 0.5058, + "MATH Level 5": 0.0884, + "GPQA": 0.2836, + "MUSR": 0.3673, + "MMLU-PRO": 0.3257 + } + }, + { + "model_id": "RWKV/rwkv-raven-14b", + "name": "rwkv-raven-14b", + "developer": "RWKV", + "scores": { + "IFEval": 0.0768, + "BBH": 0.3307, + "MATH Level 5": 0.0045, + "GPQA": 0.229, + "MUSR": 0.3951, + "MMLU-PRO": 0.115 + } + }, + { + "model_id": "Rakuten/RakutenAI-2.0-mini-instruct", + "name": "RakutenAI-2.0-mini-instruct", + "developer": "Rakuten", + "scores": { + "IFEval": 0.6794, + "BBH": 0.2867, + "MATH Level 5": 0.0521, + "GPQA": 0.2668, + "MUSR": 0.3249, + "MMLU-PRO": 0.1118 + } + }, + { + "model_id": "Rakuten/RakutenAI-7B", + "name": "RakutenAI-7B", + "developer": "Rakuten", + "scores": { + "IFEval": 0.1556, + "BBH": 0.4315, + "MATH Level 5": 0.0196, + "GPQA": 0.2894, + "MUSR": 0.3738, + "MMLU-PRO": 0.2877 + } + }, + { + "model_id": "Rakuten/RakutenAI-7B-chat", + "name": "RakutenAI-7B-chat", + "developer": "Rakuten", + "scores": { + "IFEval": 0.2686, + "BBH": 0.4316, + "MATH Level 5": 0.0295, + "GPQA": 0.2567, + "MUSR": 0.379, + "MMLU-PRO": 0.2798 + } + }, + { + "model_id": "Replete-AI/L3-Pneuma-8B", + "name": "L3-Pneuma-8B", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.2413, + "BBH": 0.4909, + "MATH Level 5": 0.0544, + "GPQA": 0.318, + "MUSR": 0.4105, + "MMLU-PRO": 0.3176 + } + }, + { + "model_id": "Replete-AI/L3.1-Pneuma-8B", + "name": "L3.1-Pneuma-8B", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.7076, + "BBH": 0.505, + "MATH Level 5": 0.2198, + "GPQA": 0.3029, + "MUSR": 0.3871, + "MMLU-PRO": 0.3691 + } + }, + { + "model_id": "Replete-AI/Llama3-8B-Instruct-Replete-Adapted", + "name": "Llama3-8B-Instruct-Replete-Adapted", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.6915, + "BBH": 0.487, + "MATH Level 5": 0.071, + "GPQA": 0.281, + "MUSR": 0.3634, + "MMLU-PRO": 0.3391 + } + }, + { + "model_id": "Replete-AI/Replete-Coder-Instruct-8b-Merged", + "name": "Replete-Coder-Instruct-8b-Merged", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.5388, + "BBH": 0.4462, + "MATH Level 5": 0.0778, + "GPQA": 0.2693, + "MUSR": 0.366, + "MMLU-PRO": 0.1805 + } + }, + { + "model_id": "Replete-AI/Replete-Coder-Llama3-8B", + "name": "Replete-Coder-Llama3-8B", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.4729, + "BBH": 0.3271, + "MATH Level 5": 0.0476, + "GPQA": 0.2609, + "MUSR": 0.3953, + "MMLU-PRO": 0.1331 + } + }, + { + "model_id": "Replete-AI/Replete-Coder-Qwen2-1.5b", + "name": "Replete-Coder-Qwen2-1.5b", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.3014, + "BBH": 0.3475, + "MATH Level 5": 0.0385, + "GPQA": 0.2685, + "MUSR": 0.4073, + "MMLU-PRO": 0.2147 + } + }, + { + "model_id": "Replete-AI/Replete-LLM-Qwen2-7b", + "name": "Replete-LLM-Qwen2-7b", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.0932, + "BBH": 0.2977, + "MATH Level 5": 0.0, + "GPQA": 0.2475, + "MUSR": 0.3941, + "MMLU-PRO": 0.1157 + } + }, + { + "model_id": "Replete-AI/Replete-LLM-Qwen2-7b_Beta-Preview", + "name": "Replete-LLM-Qwen2-7b_Beta-Preview", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.0858, + "BBH": 0.2929, + "MATH Level 5": 0.0, + "GPQA": 0.2483, + "MUSR": 0.3981, + "MMLU-PRO": 0.1285 + } + }, + { + "model_id": "Replete-AI/Replete-LLM-V2-Llama-3.1-8b", + "name": "Replete-LLM-V2-Llama-3.1-8b", + "developer": "Replete-AI", + "scores": { + "IFEval": 0.5515, + "BBH": 0.5339, + "MATH Level 5": 0.1405, + "GPQA": 0.3138, + "MUSR": 0.4001, + "MMLU-PRO": 0.3753 + } + }, + { + "model_id": "RezVortex/JAJUKA-WEWILLNEVERFORGETYOU-3B", + "name": "JAJUKA-WEWILLNEVERFORGETYOU-3B", + "developer": "RezVortex", + "scores": { + "IFEval": 0.6858, + "BBH": 0.4619, + "MATH Level 5": 0.1548, + "GPQA": 0.2576, + "MUSR": 0.363, + "MMLU-PRO": 0.3143 + } + }, + { + "model_id": "RezVortex/Jajuka-3b", + "name": "Jajuka-3b", + "developer": "RezVortex", + "scores": { + "IFEval": 0.6925, + "BBH": 0.4594, + "MATH Level 5": 0.1594, + "GPQA": 0.2659, + "MUSR": 0.3671, + "MMLU-PRO": 0.3137 + } + }, + { + "model_id": "Ro-xe/FMixIA-7B-DARE-0", + "name": "FMixIA-7B-DARE-0", + "developer": "Ro-xe", + "scores": { + "IFEval": 0.3341, + "BBH": 0.5035, + "MATH Level 5": 0.0529, + "GPQA": 0.2894, + "MUSR": 0.4545, + "MMLU-PRO": 0.3016 + } + }, + { + "model_id": "Ro-xe/FMixIA-7B-SLERP-27", + "name": "FMixIA-7B-SLERP-27", + "developer": "Ro-xe", + "scores": { + "IFEval": 0.3765, + "BBH": 0.5151, + "MATH Level 5": 0.0634, + "GPQA": 0.2953, + "MUSR": 0.4412, + "MMLU-PRO": 0.3008 + } + }, + { + "model_id": "Ro-xe/FMixIA-7B-TIES-1", + "name": "FMixIA-7B-TIES-1", + "developer": "Ro-xe", + "scores": { + "IFEval": 0.3453, + "BBH": 0.5092, + "MATH Level 5": 0.0566, + "GPQA": 0.2886, + "MUSR": 0.4689, + "MMLU-PRO": 0.2992 + } + }, + { + "model_id": "Ro-xe/FMixIA-FrankenMerge-9.5B-PT-9", + "name": "FMixIA-FrankenMerge-9.5B-PT-9", + "developer": "Ro-xe", + "scores": { + "IFEval": 0.194, + "BBH": 0.5088, + "MATH Level 5": 0.003, + "GPQA": 0.3079, + "MUSR": 0.417, + "MMLU-PRO": 0.3657 + } + }, + { + "model_id": "Rombo-Org/Rombo-LLM-V2.5-Qwen-7b", + "name": "Rombo-LLM-V2.5-Qwen-7b", + "developer": "Rombo-Org", + "scores": { + "IFEval": 0.7482, + "BBH": 0.54, + "MATH Level 5": 0.5068, + "GPQA": 0.3012, + "MUSR": 0.398, + "MMLU-PRO": 0.4283 + } + }, + { + "model_id": "RubielLabarta/LogoS-7Bx2-MoE-13B-v0.2", + "name": "LogoS-7Bx2-MoE-13B-v0.2", + "developer": "RubielLabarta", + "scores": { + "IFEval": 0.4379, + "BBH": 0.5207, + "MATH Level 5": 0.0574, + "GPQA": 0.2777, + "MUSR": 0.4226, + "MMLU-PRO": 0.3088 + } + }, + { + "model_id": "SaisExperiments/Evil-Alpaca-3B-L3.2", + "name": "Evil-Alpaca-3B-L3.2", + "developer": "SaisExperiments", + "scores": { + "IFEval": 0.3251, + "BBH": 0.4341, + "MATH Level 5": 0.0702, + "GPQA": 0.2634, + "MUSR": 0.4198, + "MMLU-PRO": 0.2621 + } + }, + { + "model_id": "SaisExperiments/Gemma-2-2B-Opus-Instruct", + "name": "Gemma-2-2B-Opus-Instruct", + "developer": "SaisExperiments", + "scores": { + "IFEval": 0.475, + "BBH": 0.4293, + "MATH Level 5": 0.0506, + "GPQA": 0.2836, + "MUSR": 0.4057, + "MMLU-PRO": 0.265 + } + }, + { + "model_id": "SaisExperiments/Gemma-2-2B-Stheno-Filtered", + "name": "Gemma-2-2B-Stheno-Filtered", + "developer": "SaisExperiments", + "scores": { + "IFEval": 0.4197, + "BBH": 0.4149, + "MATH Level 5": 0.0461, + "GPQA": 0.2701, + "MUSR": 0.4003, + "MMLU-PRO": 0.263 + } + }, + { + "model_id": "SaisExperiments/Not-So-Small-Alpaca-24B", + "name": "Not-So-Small-Alpaca-24B", + "developer": "SaisExperiments", + "scores": { + "IFEval": 0.6244, + "BBH": 0.5339, + "MATH Level 5": 0.1828, + "GPQA": 0.3591, + "MUSR": 0.4282, + "MMLU-PRO": 0.3694 + } + }, + { + "model_id": "SaisExperiments/QwOwO-7B-V1", + "name": "QwOwO-7B-V1", + "developer": "SaisExperiments", + "scores": { + "IFEval": 0.4556, + "BBH": 0.5431, + "MATH Level 5": 0.386, + "GPQA": 0.2601, + "MUSR": 0.3835, + "MMLU-PRO": 0.4224 + } + }, + { + "model_id": "SaisExperiments/RightSheep-Llama3.2-3B", + "name": "RightSheep-Llama3.2-3B", + "developer": "SaisExperiments", + "scores": { + "IFEval": 0.4156, + "BBH": 0.4241, + "MATH Level 5": 0.0808, + "GPQA": 0.2869, + "MUSR": 0.3767, + "MMLU-PRO": 0.254 + } + }, + { + "model_id": "Sakalti/Anemoi-3B", + "name": "Anemoi-3B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3804, + "BBH": 0.4922, + "MATH Level 5": 0.1775, + "GPQA": 0.3054, + "MUSR": 0.4371, + "MMLU-PRO": 0.3766 + } + }, + { + "model_id": "Sakalti/Euphrates-14B", + "name": "Euphrates-14B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2647, + "BBH": 0.6138, + "MATH Level 5": 0.3051, + "GPQA": 0.3935, + "MUSR": 0.4516, + "MMLU-PRO": 0.5255 + } + }, + { + "model_id": "Sakalti/Llama3.2-3B-Uranus-1", + "name": "Llama3.2-3B-Uranus-1", + "developer": "Sakalti", + "scores": { + "IFEval": 0.5335, + "BBH": 0.4437, + "MATH Level 5": 0.1495, + "GPQA": 0.297, + "MUSR": 0.3669, + "MMLU-PRO": 0.3094 + } + }, + { + "model_id": "Sakalti/Magro-7B-v1.1", + "name": "Magro-7B-v1.1", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1204, + "BBH": 0.4179, + "MATH Level 5": 0.0249, + "GPQA": 0.2961, + "MUSR": 0.4433, + "MMLU-PRO": 0.2764 + } + }, + { + "model_id": "Sakalti/Neptuno-3B", + "name": "Neptuno-3B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4296, + "BBH": 0.4834, + "MATH Level 5": 0.2553, + "GPQA": 0.2961, + "MUSR": 0.4002, + "MMLU-PRO": 0.3773 + } + }, + { + "model_id": "Sakalti/Neptuno-Alpha", + "name": "Neptuno-Alpha", + "developer": "Sakalti", + "scores": { + "IFEval": 0.378, + "BBH": 0.4925, + "MATH Level 5": 0.1835, + "GPQA": 0.307, + "MUSR": 0.4371, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "Sakalti/Oxyge1-33B", + "name": "Oxyge1-33B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4548, + "BBH": 0.7033, + "MATH Level 5": 0.4962, + "GPQA": 0.3826, + "MUSR": 0.5008, + "MMLU-PRO": 0.5909 + } + }, + { + "model_id": "Sakalti/Phi3.5-Comets-3.8B", + "name": "Phi3.5-Comets-3.8B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2094, + "BBH": 0.3335, + "MATH Level 5": 0.0008, + "GPQA": 0.2492, + "MUSR": 0.3764, + "MMLU-PRO": 0.1153 + } + }, + { + "model_id": "Sakalti/Qwen2.5-1B-Instruct", + "name": "Qwen2.5-1B-Instruct", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1751, + "BBH": 0.3027, + "MATH Level 5": 0.006, + "GPQA": 0.2559, + "MUSR": 0.3369, + "MMLU-PRO": 0.1213 + } + }, + { + "model_id": "Sakalti/QwenTest-7", + "name": "QwenTest-7", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1672, + "BBH": 0.3063, + "MATH Level 5": 0.0038, + "GPQA": 0.2601, + "MUSR": 0.3422, + "MMLU-PRO": 0.1212 + } + }, + { + "model_id": "Sakalti/SJT-0.5B", + "name": "SJT-0.5B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2425, + "BBH": 0.3306, + "MATH Level 5": 0.0521, + "GPQA": 0.2718, + "MUSR": 0.3196, + "MMLU-PRO": 0.1891 + } + }, + { + "model_id": "Sakalti/SJT-1.5B-Alpha", + "name": "SJT-1.5B-Alpha", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3449, + "BBH": 0.4241, + "MATH Level 5": 0.0997, + "GPQA": 0.2919, + "MUSR": 0.4226, + "MMLU-PRO": 0.2961 + } + }, + { + "model_id": "Sakalti/SJT-1.5B-Alpha-1.1", + "name": "SJT-1.5B-Alpha-1.1", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3439, + "BBH": 0.4243, + "MATH Level 5": 0.0959, + "GPQA": 0.2894, + "MUSR": 0.4239, + "MMLU-PRO": 0.2966 + } + }, + { + "model_id": "Sakalti/SJT-1.7B", + "name": "SJT-1.7B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1776, + "BBH": 0.2934, + "MATH Level 5": 0.0015, + "GPQA": 0.2416, + "MUSR": 0.3964, + "MMLU-PRO": 0.1133 + } + }, + { + "model_id": "Sakalti/SJT-14B", + "name": "SJT-14B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.5494, + "BBH": 0.6536, + "MATH Level 5": 0.3844, + "GPQA": 0.3867, + "MUSR": 0.4766, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "Sakalti/SJT-2.4B", + "name": "SJT-2.4B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2804, + "BBH": 0.349, + "MATH Level 5": 0.0219, + "GPQA": 0.2559, + "MUSR": 0.3699, + "MMLU-PRO": 0.1858 + } + }, + { + "model_id": "Sakalti/SJT-24B-Alpha", + "name": "SJT-24B-Alpha", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3206, + "BBH": 0.6081, + "MATH Level 5": 0.253, + "GPQA": 0.3809, + "MUSR": 0.4595, + "MMLU-PRO": 0.4857 + } + }, + { + "model_id": "Sakalti/SJT-2B", + "name": "SJT-2B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2151, + "BBH": 0.2936, + "MATH Level 5": 0.0008, + "GPQA": 0.2416, + "MUSR": 0.3564, + "MMLU-PRO": 0.1187 + } + }, + { + "model_id": "Sakalti/SJT-2B-V1.1", + "name": "SJT-2B-V1.1", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3977, + "BBH": 0.3984, + "MATH Level 5": 0.0483, + "GPQA": 0.2676, + "MUSR": 0.4299, + "MMLU-PRO": 0.2124 + } + }, + { + "model_id": "Sakalti/SJT-3.7B", + "name": "SJT-3.7B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1078, + "BBH": 0.3393, + "MATH Level 5": 0.0121, + "GPQA": 0.2559, + "MUSR": 0.3617, + "MMLU-PRO": 0.1505 + } + }, + { + "model_id": "Sakalti/SJT-4B", + "name": "SJT-4B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4077, + "BBH": 0.4886, + "MATH Level 5": 0.1156, + "GPQA": 0.2945, + "MUSR": 0.478, + "MMLU-PRO": 0.3281 + } + }, + { + "model_id": "Sakalti/SJT-7.5B", + "name": "SJT-7.5B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4223, + "BBH": 0.5367, + "MATH Level 5": 0.2168, + "GPQA": 0.3263, + "MUSR": 0.4399, + "MMLU-PRO": 0.3951 + } + }, + { + "model_id": "Sakalti/SJT-7B-V1.1", + "name": "SJT-7B-V1.1", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4703, + "BBH": 0.5419, + "MATH Level 5": 0.2432, + "GPQA": 0.3339, + "MUSR": 0.4411, + "MMLU-PRO": 0.4412 + } + }, + { + "model_id": "Sakalti/SJT-7B-V1.1-Multilingal", + "name": "SJT-7B-V1.1-Multilingal", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1949, + "BBH": 0.292, + "MATH Level 5": 0.0045, + "GPQA": 0.2601, + "MUSR": 0.3621, + "MMLU-PRO": 0.1137 + } + }, + { + "model_id": "Sakalti/SJT-8B", + "name": "SJT-8B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.6535, + "BBH": 0.5282, + "MATH Level 5": 0.2538, + "GPQA": 0.3297, + "MUSR": 0.408, + "MMLU-PRO": 0.4266 + } + }, + { + "model_id": "Sakalti/SJT-8B-V1.1", + "name": "SJT-8B-V1.1", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4621, + "BBH": 0.5121, + "MATH Level 5": 0.2069, + "GPQA": 0.3364, + "MUSR": 0.4266, + "MMLU-PRO": 0.4231 + } + }, + { + "model_id": "Sakalti/SJT-900M", + "name": "SJT-900M", + "developer": "Sakalti", + "scores": { + "IFEval": 0.241, + "BBH": 0.3169, + "MATH Level 5": 0.0136, + "GPQA": 0.2534, + "MUSR": 0.3595, + "MMLU-PRO": 0.1142 + } + }, + { + "model_id": "Sakalti/SJT-Moe2x7.5B", + "name": "SJT-Moe2x7.5B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4117, + "BBH": 0.5371, + "MATH Level 5": 0.2145, + "GPQA": 0.3263, + "MUSR": 0.4399, + "MMLU-PRO": 0.3954 + } + }, + { + "model_id": "Sakalti/SJTPass-2", + "name": "SJTPass-2", + "developer": "Sakalti", + "scores": { + "IFEval": 0.24, + "BBH": 0.3302, + "MATH Level 5": 0.0529, + "GPQA": 0.2727, + "MUSR": 0.3222, + "MMLU-PRO": 0.1902 + } + }, + { + "model_id": "Sakalti/SJTPass-4", + "name": "SJTPass-4", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1913, + "BBH": 0.2964, + "MATH Level 5": 0.0023, + "GPQA": 0.2601, + "MUSR": 0.3898, + "MMLU-PRO": 0.1083 + } + }, + { + "model_id": "Sakalti/SJTPass-5", + "name": "SJTPass-5", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2425, + "BBH": 0.3103, + "MATH Level 5": 0.0159, + "GPQA": 0.2668, + "MUSR": 0.3794, + "MMLU-PRO": 0.1327 + } + }, + { + "model_id": "Sakalti/Saba-Passthrough-2", + "name": "Saba-Passthrough-2", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1691, + "BBH": 0.3672, + "MATH Level 5": 0.0008, + "GPQA": 0.2634, + "MUSR": 0.3844, + "MMLU-PRO": 0.2077 + } + }, + { + "model_id": "Sakalti/Saba1-1.8B", + "name": "Saba1-1.8B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3333, + "BBH": 0.4147, + "MATH Level 5": 0.1541, + "GPQA": 0.2827, + "MUSR": 0.4239, + "MMLU-PRO": 0.2926 + } + }, + { + "model_id": "Sakalti/Saba1-7B", + "name": "Saba1-7B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4585, + "BBH": 0.5489, + "MATH Level 5": 0.3663, + "GPQA": 0.3163, + "MUSR": 0.4793, + "MMLU-PRO": 0.4376 + } + }, + { + "model_id": "Sakalti/Saba1.5-1.5B", + "name": "Saba1.5-1.5B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3333, + "BBH": 0.4147, + "MATH Level 5": 0.1541, + "GPQA": 0.2827, + "MUSR": 0.4239, + "MMLU-PRO": 0.2926 + } + }, + { + "model_id": "Sakalti/Saba1.5-Pro-3B", + "name": "Saba1.5-Pro-3B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2386, + "BBH": 0.3623, + "MATH Level 5": 0.0272, + "GPQA": 0.2685, + "MUSR": 0.4405, + "MMLU-PRO": 0.1958 + } + }, + { + "model_id": "Sakalti/Saba2-14B-Preview", + "name": "Saba2-14B-Preview", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4722, + "BBH": 0.6496, + "MATH Level 5": 0.3127, + "GPQA": 0.3826, + "MUSR": 0.4781, + "MMLU-PRO": 0.5384 + } + }, + { + "model_id": "Sakalti/Saba2-3B", + "name": "Saba2-3B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2865, + "BBH": 0.2801, + "MATH Level 5": 0.006, + "GPQA": 0.2617, + "MUSR": 0.3927, + "MMLU-PRO": 0.121 + } + }, + { + "model_id": "Sakalti/Sailor-japanese", + "name": "Sailor-japanese", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1605, + "BBH": 0.2913, + "MATH Level 5": 0.003, + "GPQA": 0.2534, + "MUSR": 0.3912, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "Sakalti/Saka-1.5B", + "name": "Saka-1.5B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2726, + "BBH": 0.3988, + "MATH Level 5": 0.0801, + "GPQA": 0.2903, + "MUSR": 0.3739, + "MMLU-PRO": 0.2415 + } + }, + { + "model_id": "Sakalti/Saka-14B", + "name": "Saka-14B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.7174, + "BBH": 0.6497, + "MATH Level 5": 0.4094, + "GPQA": 0.396, + "MUSR": 0.4886, + "MMLU-PRO": 0.5396 + } + }, + { + "model_id": "Sakalti/Saka-24B", + "name": "Saka-24B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3819, + "BBH": 0.6072, + "MATH Level 5": 0.1805, + "GPQA": 0.3423, + "MUSR": 0.4541, + "MMLU-PRO": 0.4766 + } + }, + { + "model_id": "Sakalti/Saka-7.2B", + "name": "Saka-7.2B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1545, + "BBH": 0.2945, + "MATH Level 5": 0.0, + "GPQA": 0.2391, + "MUSR": 0.3711, + "MMLU-PRO": 0.116 + } + }, + { + "model_id": "Sakalti/Saka-7.6B", + "name": "Saka-7.6B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4524, + "BBH": 0.5655, + "MATH Level 5": 0.3255, + "GPQA": 0.3163, + "MUSR": 0.4489, + "MMLU-PRO": 0.454 + } + }, + { + "model_id": "Sakalti/SakaMoe-3x1.6B-Instruct", + "name": "SakaMoe-3x1.6B-Instruct", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2371, + "BBH": 0.3282, + "MATH Level 5": 0.0544, + "GPQA": 0.2668, + "MUSR": 0.3342, + "MMLU-PRO": 0.1882 + } + }, + { + "model_id": "Sakalti/SakalFusion-7B-Alpha", + "name": "SakalFusion-7B-Alpha", + "developer": "Sakalti", + "scores": { + "IFEval": 0.529, + "BBH": 0.5591, + "MATH Level 5": 0.3844, + "GPQA": 0.3255, + "MUSR": 0.4581, + "MMLU-PRO": 0.4474 + } + }, + { + "model_id": "Sakalti/SakalFusion-7B-Beta", + "name": "SakalFusion-7B-Beta", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1809, + "BBH": 0.2881, + "MATH Level 5": 0.0, + "GPQA": 0.2433, + "MUSR": 0.3872, + "MMLU-PRO": 0.109 + } + }, + { + "model_id": "Sakalti/Tara-3.8B-v1.1", + "name": "Tara-3.8B-v1.1", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4062, + "BBH": 0.4886, + "MATH Level 5": 0.1156, + "GPQA": 0.2945, + "MUSR": 0.478, + "MMLU-PRO": 0.3281 + } + }, + { + "model_id": "Sakalti/light-1.1-3B", + "name": "light-1.1-3B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2735, + "BBH": 0.2803, + "MATH Level 5": 0.0113, + "GPQA": 0.2617, + "MUSR": 0.3901, + "MMLU-PRO": 0.1209 + } + }, + { + "model_id": "Sakalti/light-3B", + "name": "light-3B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.5337, + "BBH": 0.4831, + "MATH Level 5": 0.2591, + "GPQA": 0.2953, + "MUSR": 0.4015, + "MMLU-PRO": 0.3775 + } + }, + { + "model_id": "Sakalti/light-3b-beta", + "name": "light-3b-beta", + "developer": "Sakalti", + "scores": { + "IFEval": 0.5485, + "BBH": 0.4815, + "MATH Level 5": 0.2772, + "GPQA": 0.2978, + "MUSR": 0.4015, + "MMLU-PRO": 0.3758 + } + }, + { + "model_id": "Sakalti/light-7b-beta", + "name": "light-7b-beta", + "developer": "Sakalti", + "scores": { + "IFEval": 0.6234, + "BBH": 0.5548, + "MATH Level 5": 0.3769, + "GPQA": 0.3213, + "MUSR": 0.4291, + "MMLU-PRO": 0.4456 + } + }, + { + "model_id": "Sakalti/llama-3-yanyuedao-8b-instruct", + "name": "llama-3-yanyuedao-8b-instruct", + "developer": "Sakalti", + "scores": { + "IFEval": 0.2186, + "BBH": 0.435, + "MATH Level 5": 0.0385, + "GPQA": 0.2903, + "MUSR": 0.4199, + "MMLU-PRO": 0.2911 + } + }, + { + "model_id": "Sakalti/magro-7B", + "name": "magro-7B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1344, + "BBH": 0.4186, + "MATH Level 5": 0.0204, + "GPQA": 0.2953, + "MUSR": 0.446, + "MMLU-PRO": 0.2765 + } + }, + { + "model_id": "Sakalti/mergekit-01", + "name": "mergekit-01", + "developer": "Sakalti", + "scores": { + "IFEval": 0.6234, + "BBH": 0.5548, + "MATH Level 5": 0.3769, + "GPQA": 0.3213, + "MUSR": 0.4291, + "MMLU-PRO": 0.4456 + } + }, + { + "model_id": "Sakalti/mergekit-della_linear-vmeykci", + "name": "mergekit-della_linear-vmeykci", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1126, + "BBH": 0.2816, + "MATH Level 5": 0.0106, + "GPQA": 0.2634, + "MUSR": 0.3897, + "MMLU-PRO": 0.1089 + } + }, + { + "model_id": "Sakalti/model-3", + "name": "model-3", + "developer": "Sakalti", + "scores": { + "IFEval": 0.6264, + "BBH": 0.5542, + "MATH Level 5": 0.3708, + "GPQA": 0.3213, + "MUSR": 0.4264, + "MMLU-PRO": 0.4455 + } + }, + { + "model_id": "Sakalti/qwen2.5-2.3B", + "name": "qwen2.5-2.3B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.1288, + "BBH": 0.2849, + "MATH Level 5": 0.0053, + "GPQA": 0.2517, + "MUSR": 0.3857, + "MMLU-PRO": 0.1173 + } + }, + { + "model_id": "Sakalti/tara-3.8B", + "name": "tara-3.8B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.4077, + "BBH": 0.4886, + "MATH Level 5": 0.1156, + "GPQA": 0.2945, + "MUSR": 0.478, + "MMLU-PRO": 0.3281 + } + }, + { + "model_id": "Sakalti/ultiima-14B", + "name": "ultiima-14B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.5701, + "BBH": 0.6491, + "MATH Level 5": 0.4698, + "GPQA": 0.3742, + "MUSR": 0.4718, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "Sakalti/ultiima-14B-v0.2", + "name": "ultiima-14B-v0.2", + "developer": "Sakalti", + "scores": { + "IFEval": 0.707, + "BBH": 0.6472, + "MATH Level 5": 0.3995, + "GPQA": 0.3826, + "MUSR": 0.4794, + "MMLU-PRO": 0.5387 + } + }, + { + "model_id": "Sakalti/ultiima-14B-v0.3", + "name": "ultiima-14B-v0.3", + "developer": "Sakalti", + "scores": { + "IFEval": 0.704, + "BBH": 0.6398, + "MATH Level 5": 0.3965, + "GPQA": 0.3767, + "MUSR": 0.4754, + "MMLU-PRO": 0.5337 + } + }, + { + "model_id": "Sakalti/ultiima-14B-v0.4", + "name": "ultiima-14B-v0.4", + "developer": "Sakalti", + "scores": { + "IFEval": 0.3008, + "BBH": 0.642, + "MATH Level 5": 0.3535, + "GPQA": 0.396, + "MUSR": 0.4886, + "MMLU-PRO": 0.5278 + } + }, + { + "model_id": "Sakalti/ultiima-32B", + "name": "ultiima-32B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.6854, + "BBH": 0.7037, + "MATH Level 5": 0.4962, + "GPQA": 0.3809, + "MUSR": 0.4995, + "MMLU-PRO": 0.591 + } + }, + { + "model_id": "Sakalti/ultiima-72B", + "name": "ultiima-72B", + "developer": "Sakalti", + "scores": { + "IFEval": 0.714, + "BBH": 0.7218, + "MATH Level 5": 0.5355, + "GPQA": 0.4144, + "MUSR": 0.4652, + "MMLU-PRO": 0.5906 + } + }, + { + "model_id": "Sakalti/ultiima-72B-v1.5", + "name": "ultiima-72B-v1.5", + "developer": "Sakalti", + "scores": { + "IFEval": 0.655, + "BBH": 0.7392, + "MATH Level 5": 0.4396, + "GPQA": 0.4136, + "MUSR": 0.4691, + "MMLU-PRO": 0.6054 + } + }, + { + "model_id": "Salesforce/LLaMA-3-8B-SFR-Iterative-DPO-R", + "name": "LLaMA-3-8B-SFR-Iterative-DPO-R", + "developer": "Salesforce", + "scores": { + "IFEval": 0.3816, + "BBH": 0.5012, + "MATH Level 5": 0.0914, + "GPQA": 0.2878, + "MUSR": 0.3633, + "MMLU-PRO": 0.3172 + } + }, + { + "model_id": "SanjiWatsuki/Kunoichi-DPO-v2-7B", + "name": "Kunoichi-DPO-v2-7B", + "developer": "SanjiWatsuki", + "scores": { + "IFEval": 0.5431, + "BBH": 0.4416, + "MATH Level 5": 0.0763, + "GPQA": 0.2961, + "MUSR": 0.4188, + "MMLU-PRO": 0.3107 + } + }, + { + "model_id": "SanjiWatsuki/Silicon-Maid-7B", + "name": "Silicon-Maid-7B", + "developer": "SanjiWatsuki", + "scores": { + "IFEval": 0.5368, + "BBH": 0.4128, + "MATH Level 5": 0.065, + "GPQA": 0.2903, + "MUSR": 0.4188, + "MMLU-PRO": 0.3083 + } + }, + { + "model_id": "Sao10K/70B-L3.3-Cirrus-x1", + "name": "70B-L3.3-Cirrus-x1", + "developer": "Sao10K", + "scores": { + "IFEval": 0.6681, + "BBH": 0.7029, + "MATH Level 5": 0.3739, + "GPQA": 0.4497, + "MUSR": 0.4842, + "MMLU-PRO": 0.5378 + } + }, + { + "model_id": "Sao10K/Fimbulvetr-11B-v2", + "name": "Fimbulvetr-11B-v2", + "developer": "Sao10K", + "scores": { + "IFEval": 0.51, + "BBH": 0.4544, + "MATH Level 5": 0.068, + "GPQA": 0.2919, + "MUSR": 0.4354, + "MMLU-PRO": 0.3301 + } + }, + { + "model_id": "Sao10K/L3-70B-Euryale-v2.1", + "name": "L3-70B-Euryale-v2.1", + "developer": "Sao10K", + "scores": { + "IFEval": 0.7384, + "BBH": 0.6471, + "MATH Level 5": 0.2137, + "GPQA": 0.3314, + "MUSR": 0.4209, + "MMLU-PRO": 0.5104 + } + }, + { + "model_id": "Sao10K/L3-8B-Lunaris-v1", + "name": "L3-8B-Lunaris-v1", + "developer": "Sao10K", + "scores": { + "IFEval": 0.6895, + "BBH": 0.5235, + "MATH Level 5": 0.0906, + "GPQA": 0.3012, + "MUSR": 0.3727, + "MMLU-PRO": 0.3787 + } + }, + { + "model_id": "Sao10K/L3-8B-Niitama-v1", + "name": "L3-8B-Niitama-v1", + "developer": "Sao10K", + "scores": { + "IFEval": 0.6791, + "BBH": 0.5303, + "MATH Level 5": 0.0982, + "GPQA": 0.3079, + "MUSR": 0.3807, + "MMLU-PRO": 0.3701 + } + }, + { + "model_id": "Sao10K/L3-8B-Stheno-v3.2", + "name": "L3-8B-Stheno-v3.2", + "developer": "Sao10K", + "scores": { + "IFEval": 0.6873, + "BBH": 0.5228, + "MATH Level 5": 0.0929, + "GPQA": 0.3104, + "MUSR": 0.3794, + "MMLU-PRO": 0.3768 + } + }, + { + "model_id": "Sao10K/L3-8B-Stheno-v3.3-32K", + "name": "L3-8B-Stheno-v3.3-32K", + "developer": "Sao10K", + "scores": { + "IFEval": 0.4604, + "BBH": 0.3844, + "MATH Level 5": 0.0144, + "GPQA": 0.2567, + "MUSR": 0.3725, + "MMLU-PRO": 0.1896 + } + }, + { + "model_id": "Sao10K/MN-12B-Lyra-v3", + "name": "MN-12B-Lyra-v3", + "developer": "Sao10K", + "scores": { + "IFEval": 0.4486, + "BBH": 0.4804, + "MATH Level 5": 0.0937, + "GPQA": 0.2777, + "MUSR": 0.4019, + "MMLU-PRO": 0.3249 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Avengers-V1-32B", + "name": "Linkbricks-Horizon-AI-Avengers-V1-32B", + "developer": "Saxo", + "scores": { + "IFEval": 0.7972, + "BBH": 0.7001, + "MATH Level 5": 0.6027, + "GPQA": 0.3624, + "MUSR": 0.4538, + "MMLU-PRO": 0.5793 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Avengers-V2-32B", + "name": "Linkbricks-Horizon-AI-Avengers-V2-32B", + "developer": "Saxo", + "scores": { + "IFEval": 0.7956, + "BBH": 0.7023, + "MATH Level 5": 0.5665, + "GPQA": 0.2659, + "MUSR": 0.4166, + "MMLU-PRO": 0.572 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Avengers-V3-32B", + "name": "Linkbricks-Horizon-AI-Avengers-V3-32B", + "developer": "Saxo", + "scores": { + "IFEval": 0.8249, + "BBH": 0.6913, + "MATH Level 5": 0.6178, + "GPQA": 0.3381, + "MUSR": 0.4275, + "MMLU-PRO": 0.5664 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Avengers-V4-32B", + "name": "Linkbricks-Horizon-AI-Avengers-V4-32B", + "developer": "Saxo", + "scores": { + "IFEval": 0.7631, + "BBH": 0.692, + "MATH Level 5": 0.5363, + "GPQA": 0.3616, + "MUSR": 0.4643, + "MMLU-PRO": 0.5752 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Avengers-V5-32B", + "name": "Linkbricks-Horizon-AI-Avengers-V5-32B", + "developer": "Saxo", + "scores": { + "IFEval": 0.7516, + "BBH": 0.6929, + "MATH Level 5": 0.5461, + "GPQA": 0.3557, + "MUSR": 0.4709, + "MMLU-PRO": 0.5762 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Avengers-V6-32B", + "name": "Linkbricks-Horizon-AI-Avengers-V6-32B", + "developer": "Saxo", + "scores": { + "IFEval": 0.8209, + "BBH": 0.689, + "MATH Level 5": 0.6224, + "GPQA": 0.3347, + "MUSR": 0.4274, + "MMLU-PRO": 0.5672 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Korean-Avengers-V2-27B", + "name": "Linkbricks-Horizon-AI-Korean-Avengers-V2-27B", + "developer": "Saxo", + "scores": { + "IFEval": 0.8146, + "BBH": 0.6463, + "MATH Level 5": 0.2802, + "GPQA": 0.3473, + "MUSR": 0.4139, + "MMLU-PRO": 0.4599 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Korean-Avengers-V3-27B", + "name": "Linkbricks-Horizon-AI-Korean-Avengers-V3-27B", + "developer": "Saxo", + "scores": { + "IFEval": 0.8142, + "BBH": 0.6404, + "MATH Level 5": 0.2492, + "GPQA": 0.3591, + "MUSR": 0.4467, + "MMLU-PRO": 0.4524 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Korean-Superb-22B", + "name": "Linkbricks-Horizon-AI-Korean-Superb-22B", + "developer": "Saxo", + "scores": { + "IFEval": 0.6767, + "BBH": 0.5626, + "MATH Level 5": 0.2372, + "GPQA": 0.3263, + "MUSR": 0.3908, + "MMLU-PRO": 0.3871 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Korean-Superb-27B", + "name": "Linkbricks-Horizon-AI-Korean-Superb-27B", + "developer": "Saxo", + "scores": { + "IFEval": 0.7768, + "BBH": 0.6518, + "MATH Level 5": 0.2719, + "GPQA": 0.3599, + "MUSR": 0.4791, + "MMLU-PRO": 0.4647 + } + }, + { + "model_id": "Saxo/Linkbricks-Horizon-AI-Superb-27B", + "name": "Linkbricks-Horizon-AI-Superb-27B", + "developer": "Saxo", + "scores": { + "IFEval": 0.7302, + "BBH": 0.6186, + "MATH Level 5": 0.2221, + "GPQA": 0.3574, + "MUSR": 0.465, + "MMLU-PRO": 0.406 + } + }, + { + "model_id": "SeaLLMs/SeaLLM-7B-v2", + "name": "SeaLLM-7B-v2", + "developer": "SeaLLMs", + "scores": { + "IFEval": 0.3671, + "BBH": 0.4902, + "MATH Level 5": 0.0853, + "GPQA": 0.2785, + "MUSR": 0.407, + "MMLU-PRO": 0.3083 + } + }, + { + "model_id": "SeaLLMs/SeaLLM-7B-v2.5", + "name": "SeaLLM-7B-v2.5", + "developer": "SeaLLMs", + "scores": { + "IFEval": 0.4522, + "BBH": 0.498, + "MATH Level 5": 0.1088, + "GPQA": 0.276, + "MUSR": 0.4203, + "MMLU-PRO": 0.3203 + } + }, + { + "model_id": "SeaLLMs/SeaLLMs-v3-7B-Chat", + "name": "SeaLLMs-v3-7B-Chat", + "developer": "SeaLLMs", + "scores": { + "IFEval": 0.4377, + "BBH": 0.5266, + "MATH Level 5": 0.1858, + "GPQA": 0.2987, + "MUSR": 0.4174, + "MMLU-PRO": 0.3895 + } + }, + { + "model_id": "SenseLLM/ReflectionCoder-CL-34B", + "name": "ReflectionCoder-CL-34B", + "developer": "SenseLLM", + "scores": { + "IFEval": 0.4008, + "BBH": 0.3953, + "MATH Level 5": 0.0332, + "GPQA": 0.2508, + "MUSR": 0.4155, + "MMLU-PRO": 0.1424 + } + }, + { + "model_id": "SenseLLM/ReflectionCoder-DS-33B", + "name": "ReflectionCoder-DS-33B", + "developer": "SenseLLM", + "scores": { + "IFEval": 0.3787, + "BBH": 0.3449, + "MATH Level 5": 0.0302, + "GPQA": 0.2743, + "MUSR": 0.3343, + "MMLU-PRO": 0.1202 + } + }, + { + "model_id": "SentientAGI/Dobby-Mini-Leashed-Llama-3.1-8B", + "name": "Dobby-Mini-Leashed-Llama-3.1-8B", + "developer": "SentientAGI", + "scores": { + "IFEval": 0.7847, + "BBH": 0.5138, + "MATH Level 5": 0.1858, + "GPQA": 0.302, + "MUSR": 0.4254, + "MMLU-PRO": 0.3694 + } + }, + { + "model_id": "SentientAGI/Dobby-Mini-Unhinged-Llama-3.1-8B", + "name": "Dobby-Mini-Unhinged-Llama-3.1-8B", + "developer": "SentientAGI", + "scores": { + "IFEval": 0.7457, + "BBH": 0.5142, + "MATH Level 5": 0.1563, + "GPQA": 0.3062, + "MUSR": 0.4013, + "MMLU-PRO": 0.3585 + } + }, + { + "model_id": "SeppeV/SmolLM_pretrained_with_sft_trained_with_1pc_data_on_a_preference_dpo", + "name": "SmolLM_pretrained_with_sft_trained_with_1pc_data_on_a_preference_dpo", + "developer": "SeppeV", + "scores": { + "IFEval": 0.0955, + "BBH": 0.3073, + "MATH Level 5": 0.0121, + "GPQA": 0.2592, + "MUSR": 0.4032, + "MMLU-PRO": 0.1161 + } + }, + { + "model_id": "Sharathhebbar24/SSH_355M", + "name": "SSH_355M", + "developer": "Sharathhebbar24", + "scores": { + "IFEval": 0.1424, + "BBH": 0.3099, + "MATH Level 5": 0.0091, + "GPQA": 0.2584, + "MUSR": 0.4178, + "MMLU-PRO": 0.1176 + } + }, + { + "model_id": "Sharathhebbar24/chat_gpt2_dpo", + "name": "chat_gpt2_dpo", + "developer": "Sharathhebbar24", + "scores": { + "IFEval": 0.0986, + "BBH": 0.2902, + "MATH Level 5": 0.0053, + "GPQA": 0.2601, + "MUSR": 0.3818, + "MMLU-PRO": 0.1142 + } + }, + { + "model_id": "Shreyash2010/Uma-4x4B-Instruct-v0.1", + "name": "Uma-4x4B-Instruct-v0.1", + "developer": "Shreyash2010", + "scores": { + "IFEval": 0.5517, + "BBH": 0.5512, + "MATH Level 5": 0.1775, + "GPQA": 0.3347, + "MUSR": 0.4441, + "MMLU-PRO": 0.387 + } + }, + { + "model_id": "Sicarius-Prototyping/Brainy_LLAMA", + "name": "Brainy_LLAMA", + "developer": "Sicarius-Prototyping", + "scores": { + "IFEval": 0.5204, + "BBH": 0.5117, + "MATH Level 5": 0.1337, + "GPQA": 0.3138, + "MUSR": 0.4143, + "MMLU-PRO": 0.3849 + } + }, + { + "model_id": "Sicarius-Prototyping/Micropenis_1B", + "name": "Micropenis_1B", + "developer": "Sicarius-Prototyping", + "scores": { + "IFEval": 0.3461, + "BBH": 0.3372, + "MATH Level 5": 0.0461, + "GPQA": 0.2626, + "MUSR": 0.3325, + "MMLU-PRO": 0.186 + } + }, + { + "model_id": "Sicarius-Prototyping/bacon_and_food", + "name": "bacon_and_food", + "developer": "Sicarius-Prototyping", + "scores": { + "IFEval": 0.586, + "BBH": 0.4725, + "MATH Level 5": 0.0982, + "GPQA": 0.3096, + "MUSR": 0.3884, + "MMLU-PRO": 0.3263 + } + }, + { + "model_id": "SicariusSicariiStuff/2B-ad", + "name": "2B-ad", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.4379, + "BBH": 0.4092, + "MATH Level 5": 0.0506, + "GPQA": 0.281, + "MUSR": 0.4015, + "MMLU-PRO": 0.2662 + } + }, + { + "model_id": "SicariusSicariiStuff/2B_or_not_2B", + "name": "2B_or_not_2B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.2062, + "BBH": 0.3416, + "MATH Level 5": 0.0196, + "GPQA": 0.2475, + "MUSR": 0.3791, + "MMLU-PRO": 0.1399 + } + }, + { + "model_id": "SicariusSicariiStuff/Dusk_Rainbow", + "name": "Dusk_Rainbow", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.3588, + "BBH": 0.4772, + "MATH Level 5": 0.0748, + "GPQA": 0.3087, + "MUSR": 0.4025, + "MMLU-PRO": 0.3443 + } + }, + { + "model_id": "SicariusSicariiStuff/Eximius_Persona_5B", + "name": "Eximius_Persona_5B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.656, + "BBH": 0.4512, + "MATH Level 5": 0.102, + "GPQA": 0.2643, + "MUSR": 0.3818, + "MMLU-PRO": 0.314 + } + }, + { + "model_id": "SicariusSicariiStuff/Impish_LLAMA_3B", + "name": "Impish_LLAMA_3B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.463, + "BBH": 0.4091, + "MATH Level 5": 0.1125, + "GPQA": 0.2878, + "MUSR": 0.3673, + "MMLU-PRO": 0.2941 + } + }, + { + "model_id": "SicariusSicariiStuff/Impish_Mind_8B", + "name": "Impish_Mind_8B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.3179, + "BBH": 0.4674, + "MATH Level 5": 0.105, + "GPQA": 0.3045, + "MUSR": 0.407, + "MMLU-PRO": 0.3309 + } + }, + { + "model_id": "SicariusSicariiStuff/Impish_QWEN_14B-1M", + "name": "Impish_QWEN_14B-1M", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.7868, + "BBH": 0.6283, + "MATH Level 5": 0.3965, + "GPQA": 0.3507, + "MUSR": 0.4615, + "MMLU-PRO": 0.5044 + } + }, + { + "model_id": "SicariusSicariiStuff/Impish_QWEN_7B-1M", + "name": "Impish_QWEN_7B-1M", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.6382, + "BBH": 0.5372, + "MATH Level 5": 0.3089, + "GPQA": 0.2961, + "MUSR": 0.4074, + "MMLU-PRO": 0.4265 + } + }, + { + "model_id": "SicariusSicariiStuff/LLAMA-3_8B_Unaligned_BETA", + "name": "LLAMA-3_8B_Unaligned_BETA", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.3713, + "BBH": 0.4717, + "MATH Level 5": 0.0838, + "GPQA": 0.3054, + "MUSR": 0.4119, + "MMLU-PRO": 0.3465 + } + }, + { + "model_id": "SicariusSicariiStuff/Phi-Line_14B", + "name": "Phi-Line_14B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.6496, + "BBH": 0.6154, + "MATH Level 5": 0.386, + "GPQA": 0.3532, + "MUSR": 0.4479, + "MMLU-PRO": 0.5454 + } + }, + { + "model_id": "SicariusSicariiStuff/Phi-lthy4", + "name": "Phi-lthy4", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.7679, + "BBH": 0.5879, + "MATH Level 5": 0.1367, + "GPQA": 0.2869, + "MUSR": 0.4083, + "MMLU-PRO": 0.4333 + } + }, + { + "model_id": "SicariusSicariiStuff/Qwen2.5-14B_Uncencored", + "name": "Qwen2.5-14B_Uncencored", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.3158, + "BBH": 0.6309, + "MATH Level 5": 0.318, + "GPQA": 0.3817, + "MUSR": 0.4517, + "MMLU-PRO": 0.5266 + } + }, + { + "model_id": "SicariusSicariiStuff/Qwen2.5-14B_Uncensored", + "name": "Qwen2.5-14B_Uncensored", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.3173, + "BBH": 0.6309, + "MATH Level 5": 0.318, + "GPQA": 0.3817, + "MUSR": 0.4517, + "MMLU-PRO": 0.5266 + } + }, + { + "model_id": "SicariusSicariiStuff/Qwen2.5-14B_Uncensored_Instruct", + "name": "Qwen2.5-14B_Uncensored_Instruct", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.3789, + "BBH": 0.5937, + "MATH Level 5": 0.3285, + "GPQA": 0.3297, + "MUSR": 0.3697, + "MMLU-PRO": 0.5127 + } + }, + { + "model_id": "SicariusSicariiStuff/Redemption_Wind_24B", + "name": "Redemption_Wind_24B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.2501, + "BBH": 0.6428, + "MATH Level 5": 0.1858, + "GPQA": 0.3834, + "MUSR": 0.4262, + "MMLU-PRO": 0.5432 + } + }, + { + "model_id": "SicariusSicariiStuff/Winged_Imp_8B", + "name": "Winged_Imp_8B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.743, + "BBH": 0.512, + "MATH Level 5": 0.1201, + "GPQA": 0.2827, + "MUSR": 0.4148, + "MMLU-PRO": 0.3639 + } + }, + { + "model_id": "SicariusSicariiStuff/Wingless_Imp_8B", + "name": "Wingless_Imp_8B", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.743, + "BBH": 0.512, + "MATH Level 5": 0.1201, + "GPQA": 0.2827, + "MUSR": 0.4148, + "MMLU-PRO": 0.3639 + } + }, + { + "model_id": "SicariusSicariiStuff/Zion_Alpha", + "name": "Zion_Alpha", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.3324, + "BBH": 0.4932, + "MATH Level 5": 0.0521, + "GPQA": 0.2903, + "MUSR": 0.4727, + "MMLU-PRO": 0.3132 + } + }, + { + "model_id": "SicariusSicariiStuff/dn_ep02", + "name": "dn_ep02", + "developer": "SicariusSicariiStuff", + "scores": { + "IFEval": 0.5064, + "BBH": 0.5266, + "MATH Level 5": 0.142, + "GPQA": 0.3154, + "MUSR": 0.4316, + "MMLU-PRO": 0.3998 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.1-8B-lora", + "name": "SKY-Ko-Llama3.1-8B-lora", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.5058, + "BBH": 0.5088, + "MATH Level 5": 0.1548, + "GPQA": 0.3213, + "MUSR": 0.3998, + "MMLU-PRO": 0.3777 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.1-8B-lora-epoch1", + "name": "SKY-Ko-Llama3.1-8B-lora-epoch1", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.5058, + "BBH": 0.5088, + "MATH Level 5": 0.1548, + "GPQA": 0.3213, + "MUSR": 0.3998, + "MMLU-PRO": 0.3777 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.2-1B-lora-epoch3", + "name": "SKY-Ko-Llama3.2-1B-lora-epoch3", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.3247, + "BBH": 0.3167, + "MATH Level 5": 0.0272, + "GPQA": 0.2517, + "MUSR": 0.3382, + "MMLU-PRO": 0.1279 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.2-1B-lora-epoch5", + "name": "SKY-Ko-Llama3.2-1B-lora-epoch5", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.436, + "BBH": 0.3406, + "MATH Level 5": 0.0521, + "GPQA": 0.2592, + "MUSR": 0.3471, + "MMLU-PRO": 0.1946 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.2-1B-lora-v2-epoch3", + "name": "SKY-Ko-Llama3.2-1B-lora-v2-epoch3", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.436, + "BBH": 0.3406, + "MATH Level 5": 0.0521, + "GPQA": 0.2592, + "MUSR": 0.3471, + "MMLU-PRO": 0.1946 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.2-1B-lora-v2-epoch5", + "name": "SKY-Ko-Llama3.2-1B-lora-v2-epoch5", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.4247, + "BBH": 0.3397, + "MATH Level 5": 0.0506, + "GPQA": 0.2542, + "MUSR": 0.3458, + "MMLU-PRO": 0.1946 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.2-3B-lora-epoch1", + "name": "SKY-Ko-Llama3.2-3B-lora-epoch1", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.5331, + "BBH": 0.44, + "MATH Level 5": 0.1458, + "GPQA": 0.2919, + "MUSR": 0.3522, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.2-3B-lora-epoch2", + "name": "SKY-Ko-Llama3.2-3B-lora-epoch2", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.5331, + "BBH": 0.44, + "MATH Level 5": 0.1458, + "GPQA": 0.2919, + "MUSR": 0.3522, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Llama3.2-3B-lora-epoch3", + "name": "SKY-Ko-Llama3.2-3B-lora-epoch3", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.5331, + "BBH": 0.44, + "MATH Level 5": 0.1458, + "GPQA": 0.2919, + "MUSR": 0.3522, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Qwen2.5-3B-Instruct", + "name": "SKY-Ko-Qwen2.5-3B-Instruct", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.3534, + "BBH": 0.4265, + "MATH Level 5": 0.0695, + "GPQA": 0.2794, + "MUSR": 0.4024, + "MMLU-PRO": 0.2812 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Qwen2.5-7B-Instruct-SFT-step-15000", + "name": "SKY-Ko-Qwen2.5-7B-Instruct-SFT-step-15000", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.3819, + "BBH": 0.5078, + "MATH Level 5": 0.1866, + "GPQA": 0.3272, + "MUSR": 0.4436, + "MMLU-PRO": 0.3914 + } + }, + { + "model_id": "SkyOrbis/SKY-Ko-Qwen2.5-7B-Instruct-SFT-step-5000", + "name": "SKY-Ko-Qwen2.5-7B-Instruct-SFT-step-5000", + "developer": "SkyOrbis", + "scores": { + "IFEval": 0.3812, + "BBH": 0.539, + "MATH Level 5": 0.21, + "GPQA": 0.3029, + "MUSR": 0.4238, + "MMLU-PRO": 0.4238 + } + }, + { + "model_id": "Skywork/Skywork-Reward-Gemma-2-27B-v0.2", + "name": "Skywork-Reward-Gemma-2-27B-v0.2", + "developer": "Skywork", + "scores": { + "IFEval": 0.7807, + "BBH": 0.636, + "MATH Level 5": 0.2273, + "GPQA": 0.344, + "MUSR": 0.4231, + "MMLU-PRO": 0.4103 + } + }, + { + "model_id": "Skywork/Skywork-o1-Open-Llama-3.1-8B", + "name": "Skywork-o1-Open-Llama-3.1-8B", + "developer": "Skywork", + "scores": { + "IFEval": 0.3518, + "BBH": 0.4516, + "MATH Level 5": 0.5211, + "GPQA": 0.2592, + "MUSR": 0.3156, + "MMLU-PRO": 0.203 + } + }, + { + "model_id": "Solshine/Brimful-merged-replete", + "name": "Brimful-merged-replete", + "developer": "Solshine", + "scores": { + "IFEval": 0.1761, + "BBH": 0.2883, + "MATH Level 5": 0.003, + "GPQA": 0.2576, + "MUSR": 0.3421, + "MMLU-PRO": 0.1085 + } + }, + { + "model_id": "Solshine/Llama-3-1-big-thoughtful-passthrough-merge-2", + "name": "Llama-3-1-big-thoughtful-passthrough-merge-2", + "developer": "Solshine", + "scores": { + "IFEval": 0.2547, + "BBH": 0.3209, + "MATH Level 5": 0.0106, + "GPQA": 0.2592, + "MUSR": 0.3889, + "MMLU-PRO": 0.1185 + } + }, + { + "model_id": "Sorawiz/Gemma-9B-Base", + "name": "Gemma-9B-Base", + "developer": "Sorawiz", + "scores": { + "IFEval": 0.1667, + "BBH": 0.593, + "MATH Level 5": 0.0982, + "GPQA": 0.3398, + "MUSR": 0.4045, + "MMLU-PRO": 0.4235 + } + }, + { + "model_id": "Sorawiz/Gemma-Creative-9B-Base", + "name": "Gemma-Creative-9B-Base", + "developer": "Sorawiz", + "scores": { + "IFEval": 0.1515, + "BBH": 0.5459, + "MATH Level 5": 0.0778, + "GPQA": 0.3297, + "MUSR": 0.4019, + "MMLU-PRO": 0.4008 + } + }, + { + "model_id": "Sourjayon/DeepSeek-R1-8b-Sify", + "name": "DeepSeek-R1-8b-Sify", + "developer": "Sourjayon", + "scores": { + "IFEval": 0.3679, + "BBH": 0.3379, + "MATH Level 5": 0.2447, + "GPQA": 0.2525, + "MUSR": 0.3303, + "MMLU-PRO": 0.1981 + } + }, + { + "model_id": "Sourjayon/DeepSeek-R1-ForumNXT", + "name": "DeepSeek-R1-ForumNXT", + "developer": "Sourjayon", + "scores": { + "IFEval": 0.2603, + "BBH": 0.331, + "MATH Level 5": 0.2576, + "GPQA": 0.2743, + "MUSR": 0.3392, + "MMLU-PRO": 0.1648 + } + }, + { + "model_id": "SpaceYL/ECE_Poirot", + "name": "ECE_Poirot", + "developer": "SpaceYL", + "scores": { + "IFEval": 0.3107, + "BBH": 0.4262, + "MATH Level 5": 0.0914, + "GPQA": 0.2978, + "MUSR": 0.4026, + "MMLU-PRO": 0.2883 + } + }, + { + "model_id": "Spestly/Athena-1-3B", + "name": "Athena-1-3B", + "developer": "Spestly", + "scores": { + "IFEval": 0.5569, + "BBH": 0.4702, + "MATH Level 5": 0.2379, + "GPQA": 0.2936, + "MUSR": 0.4362, + "MMLU-PRO": 0.3519 + } + }, + { + "model_id": "Spestly/Atlas-Pro-1.5B-Preview", + "name": "Atlas-Pro-1.5B-Preview", + "developer": "Spestly", + "scores": { + "IFEval": 0.243, + "BBH": 0.3499, + "MATH Level 5": 0.3195, + "GPQA": 0.297, + "MUSR": 0.3354, + "MMLU-PRO": 0.1925 + } + }, + { + "model_id": "Spestly/Atlas-Pro-7B-Preview", + "name": "Atlas-Pro-7B-Preview", + "developer": "Spestly", + "scores": { + "IFEval": 0.3154, + "BBH": 0.4668, + "MATH Level 5": 0.5083, + "GPQA": 0.3372, + "MUSR": 0.3911, + "MMLU-PRO": 0.297 + } + }, + { + "model_id": "Stark2008/GutenLaserPi", + "name": "GutenLaserPi", + "developer": "Stark2008", + "scores": { + "IFEval": 0.4227, + "BBH": 0.5212, + "MATH Level 5": 0.0785, + "GPQA": 0.2869, + "MUSR": 0.462, + "MMLU-PRO": 0.3106 + } + }, + { + "model_id": "Stark2008/LayleleFlamPi", + "name": "LayleleFlamPi", + "developer": "Stark2008", + "scores": { + "IFEval": 0.4284, + "BBH": 0.5116, + "MATH Level 5": 0.0665, + "GPQA": 0.2852, + "MUSR": 0.4608, + "MMLU-PRO": 0.3093 + } + }, + { + "model_id": "Stark2008/VisFlamCat", + "name": "VisFlamCat", + "developer": "Stark2008", + "scores": { + "IFEval": 0.4366, + "BBH": 0.5217, + "MATH Level 5": 0.0763, + "GPQA": 0.2903, + "MUSR": 0.4463, + "MMLU-PRO": 0.3144 + } + }, + { + "model_id": "Steelskull/L3.3-MS-Nevoria-70b", + "name": "L3.3-MS-Nevoria-70b", + "developer": "Steelskull", + "scores": { + "IFEval": 0.6963, + "BBH": 0.6998, + "MATH Level 5": 0.3958, + "GPQA": 0.4706, + "MUSR": 0.4682, + "MMLU-PRO": 0.5535 + } + }, + { + "model_id": "Steelskull/L3.3-Nevoria-R1-70b", + "name": "L3.3-Nevoria-R1-70b", + "developer": "Steelskull", + "scores": { + "IFEval": 0.6024, + "BBH": 0.6972, + "MATH Level 5": 0.463, + "GPQA": 0.469, + "MUSR": 0.4775, + "MMLU-PRO": 0.5463 + } + }, + { + "model_id": "StelleX/Qwen2.5_Math_7B_Cot", + "name": "Qwen2.5_Math_7B_Cot", + "developer": "StelleX", + "scores": { + "IFEval": 0.2143, + "BBH": 0.4313, + "MATH Level 5": 0.3263, + "GPQA": 0.2945, + "MUSR": 0.3924, + "MMLU-PRO": 0.281 + } + }, + { + "model_id": "StelleX/Vorisatex-7B-preview", + "name": "Vorisatex-7B-preview", + "developer": "StelleX", + "scores": { + "IFEval": 0.1515, + "BBH": 0.3112, + "MATH Level 5": 0.0287, + "GPQA": 0.2517, + "MUSR": 0.4192, + "MMLU-PRO": 0.1166 + } + }, + { + "model_id": "SultanR/SmolTulu-1.7b-Instruct", + "name": "SmolTulu-1.7b-Instruct", + "developer": "SultanR", + "scores": { + "IFEval": 0.6541, + "BBH": 0.3713, + "MATH Level 5": 0.0793, + "GPQA": 0.2693, + "MUSR": 0.354, + "MMLU-PRO": 0.171 + } + }, + { + "model_id": "SultanR/SmolTulu-1.7b-Reinforced", + "name": "SmolTulu-1.7b-Reinforced", + "developer": "SultanR", + "scores": { + "IFEval": 0.6791, + "BBH": 0.3552, + "MATH Level 5": 0.0718, + "GPQA": 0.276, + "MUSR": 0.3406, + "MMLU-PRO": 0.1763 + } + }, + { + "model_id": "SultanR/SmolTulu-1.7b-it-v0", + "name": "SmolTulu-1.7b-it-v0", + "developer": "SultanR", + "scores": { + "IFEval": 0.6541, + "BBH": 0.3713, + "MATH Level 5": 0.0793, + "GPQA": 0.2693, + "MUSR": 0.354, + "MMLU-PRO": 0.171 + } + }, + { + "model_id": "Supichi/BBA-123", + "name": "BBA-123", + "developer": "Supichi", + "scores": { + "IFEval": 0.208, + "BBH": 0.292, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3499, + "MMLU-PRO": 0.1167 + } + }, + { + "model_id": "Supichi/BBA99", + "name": "BBA99", + "developer": "Supichi", + "scores": { + "IFEval": 0.1407, + "BBH": 0.2769, + "MATH Level 5": 0.0, + "GPQA": 0.2634, + "MUSR": 0.3218, + "MMLU-PRO": 0.1112 + } + }, + { + "model_id": "Supichi/BBAIK29", + "name": "BBAIK29", + "developer": "Supichi", + "scores": { + "IFEval": 0.4588, + "BBH": 0.559, + "MATH Level 5": 0.3678, + "GPQA": 0.3121, + "MUSR": 0.4501, + "MMLU-PRO": 0.4469 + } + }, + { + "model_id": "Supichi/BBAI_135_Gemma", + "name": "BBAI_135_Gemma", + "developer": "Supichi", + "scores": { + "IFEval": 0.0656, + "BBH": 0.3568, + "MATH Level 5": 0.0, + "GPQA": 0.2676, + "MUSR": 0.3805, + "MMLU-PRO": 0.1672 + } + }, + { + "model_id": "Supichi/BBAI_250_Xia0_gZ", + "name": "BBAI_250_Xia0_gZ", + "developer": "Supichi", + "scores": { + "IFEval": 0.4685, + "BBH": 0.5568, + "MATH Level 5": 0.364, + "GPQA": 0.3213, + "MUSR": 0.4579, + "MMLU-PRO": 0.4465 + } + }, + { + "model_id": "Supichi/BBAI_275_Tsunami_gZ", + "name": "BBAI_275_Tsunami_gZ", + "developer": "Supichi", + "scores": { + "IFEval": 0.537, + "BBH": 0.5531, + "MATH Level 5": 0.3285, + "GPQA": 0.3213, + "MUSR": 0.4448, + "MMLU-PRO": 0.4492 + } + }, + { + "model_id": "Supichi/BBAI_525_Tsu_gZ_Xia0", + "name": "BBAI_525_Tsu_gZ_Xia0", + "developer": "Supichi", + "scores": { + "IFEval": 0.5339, + "BBH": 0.5562, + "MATH Level 5": 0.3429, + "GPQA": 0.3121, + "MUSR": 0.4474, + "MMLU-PRO": 0.4477 + } + }, + { + "model_id": "Supichi/BBAI_78B_Calme_3_1_Ties", + "name": "BBAI_78B_Calme_3_1_Ties", + "developer": "Supichi", + "scores": { + "IFEval": 0.1828, + "BBH": 0.2828, + "MATH Level 5": 0.0, + "GPQA": 0.229, + "MUSR": 0.31, + "MMLU-PRO": 0.1144 + } + }, + { + "model_id": "Supichi/BBAI_QWEEN_V000000_LUMEN_14B", + "name": "BBAI_QWEEN_V000000_LUMEN_14B", + "developer": "Supichi", + "scores": { + "IFEval": 0.1815, + "BBH": 0.2297, + "MATH Level 5": 0.0, + "GPQA": 0.2315, + "MUSR": 0.3445, + "MMLU-PRO": 0.116 + } + }, + { + "model_id": "Supichi/HF_TOKEN", + "name": "HF_TOKEN", + "developer": "Supichi", + "scores": { + "IFEval": 0.138, + "BBH": 0.2764, + "MATH Level 5": 0.0008, + "GPQA": 0.2634, + "MUSR": 0.3272, + "MMLU-PRO": 0.111 + } + }, + { + "model_id": "Supichi/NJS26", + "name": "NJS26", + "developer": "Supichi", + "scores": { + "IFEval": 0.0448, + "BBH": 0.478, + "MATH Level 5": 0.0325, + "GPQA": 0.318, + "MUSR": 0.3854, + "MMLU-PRO": 0.3037 + } + }, + { + "model_id": "Svak/MN-12B-Inferor-v0.0", + "name": "MN-12B-Inferor-v0.0", + "developer": "Svak", + "scores": { + "IFEval": 0.5708, + "BBH": 0.5195, + "MATH Level 5": 0.102, + "GPQA": 0.3087, + "MUSR": 0.4639, + "MMLU-PRO": 0.3559 + } + }, + { + "model_id": "Svak/MN-12B-Inferor-v0.1", + "name": "MN-12B-Inferor-v0.1", + "developer": "Svak", + "scores": { + "IFEval": 0.6347, + "BBH": 0.5147, + "MATH Level 5": 0.1261, + "GPQA": 0.3255, + "MUSR": 0.4351, + "MMLU-PRO": 0.3662 + } + }, + { + "model_id": "Syed-Hasan-8503/Phi-3-mini-4K-instruct-cpo-simpo", + "name": "Phi-3-mini-4K-instruct-cpo-simpo", + "developer": "Syed-Hasan-8503", + "scores": { + "IFEval": 0.5714, + "BBH": 0.5682, + "MATH Level 5": 0.1571, + "GPQA": 0.3305, + "MUSR": 0.3964, + "MMLU-PRO": 0.3861 + } + }, + { + "model_id": "T145/KRONOS-8B-V1-P1", + "name": "KRONOS-8B-V1-P1", + "developer": "T145", + "scores": { + "IFEval": 0.785, + "BBH": 0.5085, + "MATH Level 5": 0.1979, + "GPQA": 0.2953, + "MUSR": 0.3881, + "MMLU-PRO": 0.376 + } + }, + { + "model_id": "T145/KRONOS-8B-V1-P2", + "name": "KRONOS-8B-V1-P2", + "developer": "T145", + "scores": { + "IFEval": 0.6724, + "BBH": 0.4772, + "MATH Level 5": 0.1601, + "GPQA": 0.2919, + "MUSR": 0.3568, + "MMLU-PRO": 0.3453 + } + }, + { + "model_id": "T145/KRONOS-8B-V1-P3", + "name": "KRONOS-8B-V1-P3", + "developer": "T145", + "scores": { + "IFEval": 0.7137, + "BBH": 0.5128, + "MATH Level 5": 0.1926, + "GPQA": 0.2601, + "MUSR": 0.3616, + "MMLU-PRO": 0.3405 + } + }, + { + "model_id": "T145/KRONOS-8B-V2", + "name": "KRONOS-8B-V2", + "developer": "T145", + "scores": { + "IFEval": 0.518, + "BBH": 0.5133, + "MATH Level 5": 0.2266, + "GPQA": 0.2987, + "MUSR": 0.3829, + "MMLU-PRO": 0.3738 + } + }, + { + "model_id": "T145/KRONOS-8B-V3", + "name": "KRONOS-8B-V3", + "developer": "T145", + "scores": { + "IFEval": 0.5475, + "BBH": 0.5119, + "MATH Level 5": 0.2598, + "GPQA": 0.2886, + "MUSR": 0.3922, + "MMLU-PRO": 0.3738 + } + }, + { + "model_id": "T145/KRONOS-8B-V4", + "name": "KRONOS-8B-V4", + "developer": "T145", + "scores": { + "IFEval": 0.7889, + "BBH": 0.5092, + "MATH Level 5": 0.1949, + "GPQA": 0.2894, + "MUSR": 0.383, + "MMLU-PRO": 0.3786 + } + }, + { + "model_id": "T145/KRONOS-8B-V5", + "name": "KRONOS-8B-V5", + "developer": "T145", + "scores": { + "IFEval": 0.5405, + "BBH": 0.5089, + "MATH Level 5": 0.2689, + "GPQA": 0.2903, + "MUSR": 0.4055, + "MMLU-PRO": 0.3759 + } + }, + { + "model_id": "T145/KRONOS-8B-V6", + "name": "KRONOS-8B-V6", + "developer": "T145", + "scores": { + "IFEval": 0.7022, + "BBH": 0.5034, + "MATH Level 5": 0.2598, + "GPQA": 0.2794, + "MUSR": 0.4121, + "MMLU-PRO": 0.3501 + } + }, + { + "model_id": "T145/KRONOS-8B-V7", + "name": "KRONOS-8B-V7", + "developer": "T145", + "scores": { + "IFEval": 0.3529, + "BBH": 0.4526, + "MATH Level 5": 0.111, + "GPQA": 0.2668, + "MUSR": 0.3671, + "MMLU-PRO": 0.2697 + } + }, + { + "model_id": "T145/KRONOS-8B-V8", + "name": "KRONOS-8B-V8", + "developer": "T145", + "scores": { + "IFEval": 0.777, + "BBH": 0.5094, + "MATH Level 5": 0.2047, + "GPQA": 0.2894, + "MUSR": 0.3869, + "MMLU-PRO": 0.3782 + } + }, + { + "model_id": "T145/KRONOS-8B-V9", + "name": "KRONOS-8B-V9", + "developer": "T145", + "scores": { + "IFEval": 0.7856, + "BBH": 0.5099, + "MATH Level 5": 0.1986, + "GPQA": 0.2961, + "MUSR": 0.3868, + "MMLU-PRO": 0.3752 + } + }, + { + "model_id": "T145/Llama-3.1-8B-Instruct-Zeus", + "name": "Llama-3.1-8B-Instruct-Zeus", + "developer": "T145", + "scores": { + "IFEval": 0.7941, + "BBH": 0.5174, + "MATH Level 5": 0.1956, + "GPQA": 0.3012, + "MUSR": 0.3976, + "MMLU-PRO": 0.3893 + } + }, + { + "model_id": "T145/Llama-3.1-8B-Zeus", + "name": "Llama-3.1-8B-Zeus", + "developer": "T145", + "scores": { + "IFEval": 0.3518, + "BBH": 0.3671, + "MATH Level 5": 0.0144, + "GPQA": 0.2651, + "MUSR": 0.3316, + "MMLU-PRO": 0.1332 + } + }, + { + "model_id": "T145/Meta-Llama-3.1-8B-Instruct-TIES", + "name": "Meta-Llama-3.1-8B-Instruct-TIES", + "developer": "T145", + "scores": { + "IFEval": 0.5424, + "BBH": 0.507, + "MATH Level 5": 0.21, + "GPQA": 0.2945, + "MUSR": 0.3843, + "MMLU-PRO": 0.378 + } + }, + { + "model_id": "T145/ZEUS-8B-V10", + "name": "ZEUS-8B-V10", + "developer": "T145", + "scores": { + "IFEval": 0.7707, + "BBH": 0.527, + "MATH Level 5": 0.2115, + "GPQA": 0.3247, + "MUSR": 0.3898, + "MMLU-PRO": 0.3904 + } + }, + { + "model_id": "T145/ZEUS-8B-V11", + "name": "ZEUS-8B-V11", + "developer": "T145", + "scores": { + "IFEval": 0.81, + "BBH": 0.5162, + "MATH Level 5": 0.1964, + "GPQA": 0.3146, + "MUSR": 0.3807, + "MMLU-PRO": 0.3884 + } + }, + { + "model_id": "T145/ZEUS-8B-V12", + "name": "ZEUS-8B-V12", + "developer": "T145", + "scores": { + "IFEval": 0.7816, + "BBH": 0.5254, + "MATH Level 5": 0.2115, + "GPQA": 0.3205, + "MUSR": 0.3858, + "MMLU-PRO": 0.3912 + } + }, + { + "model_id": "T145/ZEUS-8B-V13", + "name": "ZEUS-8B-V13", + "developer": "T145", + "scores": { + "IFEval": 0.7904, + "BBH": 0.5277, + "MATH Level 5": 0.2137, + "GPQA": 0.3238, + "MUSR": 0.3845, + "MMLU-PRO": 0.3911 + } + }, + { + "model_id": "T145/ZEUS-8B-V13-abliterated", + "name": "ZEUS-8B-V13-abliterated", + "developer": "T145", + "scores": { + "IFEval": 0.7878, + "BBH": 0.5198, + "MATH Level 5": 0.179, + "GPQA": 0.3112, + "MUSR": 0.3871, + "MMLU-PRO": 0.3872 + } + }, + { + "model_id": "T145/ZEUS-8B-V14", + "name": "ZEUS-8B-V14", + "developer": "T145", + "scores": { + "IFEval": 0.7709, + "BBH": 0.5275, + "MATH Level 5": 0.213, + "GPQA": 0.3205, + "MUSR": 0.3844, + "MMLU-PRO": 0.3914 + } + }, + { + "model_id": "T145/ZEUS-8B-V15", + "name": "ZEUS-8B-V15", + "developer": "T145", + "scores": { + "IFEval": 0.7013, + "BBH": 0.5538, + "MATH Level 5": 0.2304, + "GPQA": 0.276, + "MUSR": 0.402, + "MMLU-PRO": 0.4059 + } + }, + { + "model_id": "T145/ZEUS-8B-V16", + "name": "ZEUS-8B-V16", + "developer": "T145", + "scores": { + "IFEval": 0.7925, + "BBH": 0.5266, + "MATH Level 5": 0.2205, + "GPQA": 0.307, + "MUSR": 0.3951, + "MMLU-PRO": 0.3926 + } + }, + { + "model_id": "T145/ZEUS-8B-V17", + "name": "ZEUS-8B-V17", + "developer": "T145", + "scores": { + "IFEval": 0.7941, + "BBH": 0.5251, + "MATH Level 5": 0.2243, + "GPQA": 0.3221, + "MUSR": 0.4016, + "MMLU-PRO": 0.3935 + } + }, + { + "model_id": "T145/ZEUS-8B-V17-abliterated", + "name": "ZEUS-8B-V17-abliterated", + "developer": "T145", + "scores": { + "IFEval": 0.7576, + "BBH": 0.52, + "MATH Level 5": 0.0438, + "GPQA": 0.3037, + "MUSR": 0.4269, + "MMLU-PRO": 0.3622 + } + }, + { + "model_id": "T145/ZEUS-8B-V17-abliterated-V2", + "name": "ZEUS-8B-V17-abliterated-V2", + "developer": "T145", + "scores": { + "IFEval": 0.6532, + "BBH": 0.4928, + "MATH Level 5": 0.1118, + "GPQA": 0.2735, + "MUSR": 0.3407, + "MMLU-PRO": 0.3402 + } + }, + { + "model_id": "T145/ZEUS-8B-V17-abliterated-V4", + "name": "ZEUS-8B-V17-abliterated-V4", + "developer": "T145", + "scores": { + "IFEval": 0.7228, + "BBH": 0.5169, + "MATH Level 5": 0.0937, + "GPQA": 0.2836, + "MUSR": 0.4187, + "MMLU-PRO": 0.3774 + } + }, + { + "model_id": "T145/ZEUS-8B-V18", + "name": "ZEUS-8B-V18", + "developer": "T145", + "scores": { + "IFEval": 0.7834, + "BBH": 0.527, + "MATH Level 5": 0.2183, + "GPQA": 0.3213, + "MUSR": 0.4043, + "MMLU-PRO": 0.3942 + } + }, + { + "model_id": "T145/ZEUS-8B-V19", + "name": "ZEUS-8B-V19", + "developer": "T145", + "scores": { + "IFEval": 0.7883, + "BBH": 0.5276, + "MATH Level 5": 0.2205, + "GPQA": 0.3221, + "MUSR": 0.4043, + "MMLU-PRO": 0.3934 + } + }, + { + "model_id": "T145/ZEUS-8B-V2", + "name": "ZEUS-8B-V2", + "developer": "T145", + "scores": { + "IFEval": 0.8029, + "BBH": 0.5194, + "MATH Level 5": 0.216, + "GPQA": 0.302, + "MUSR": 0.391, + "MMLU-PRO": 0.3896 + } + }, + { + "model_id": "T145/ZEUS-8B-V2-ORPO", + "name": "ZEUS-8B-V2-ORPO", + "developer": "T145", + "scores": { + "IFEval": 0.7187, + "BBH": 0.5075, + "MATH Level 5": 0.1828, + "GPQA": 0.3104, + "MUSR": 0.3935, + "MMLU-PRO": 0.3678 + } + }, + { + "model_id": "T145/ZEUS-8B-V2-abliterated", + "name": "ZEUS-8B-V2-abliterated", + "developer": "T145", + "scores": { + "IFEval": 0.7895, + "BBH": 0.5129, + "MATH Level 5": 0.2115, + "GPQA": 0.3129, + "MUSR": 0.3911, + "MMLU-PRO": 0.3825 + } + }, + { + "model_id": "T145/ZEUS-8B-V20", + "name": "ZEUS-8B-V20", + "developer": "T145", + "scores": { + "IFEval": 0.7956, + "BBH": 0.5244, + "MATH Level 5": 0.219, + "GPQA": 0.323, + "MUSR": 0.4043, + "MMLU-PRO": 0.393 + } + }, + { + "model_id": "T145/ZEUS-8B-V21", + "name": "ZEUS-8B-V21", + "developer": "T145", + "scores": { + "IFEval": 0.3785, + "BBH": 0.3398, + "MATH Level 5": 0.1594, + "GPQA": 0.2643, + "MUSR": 0.3262, + "MMLU-PRO": 0.1714 + } + }, + { + "model_id": "T145/ZEUS-8B-V22", + "name": "ZEUS-8B-V22", + "developer": "T145", + "scores": { + "IFEval": 0.7995, + "BBH": 0.5245, + "MATH Level 5": 0.2228, + "GPQA": 0.328, + "MUSR": 0.399, + "MMLU-PRO": 0.3938 + } + }, + { + "model_id": "T145/ZEUS-8B-V23", + "name": "ZEUS-8B-V23", + "developer": "T145", + "scores": { + "IFEval": 0.7621, + "BBH": 0.5195, + "MATH Level 5": 0.182, + "GPQA": 0.3096, + "MUSR": 0.3922, + "MMLU-PRO": 0.3666 + } + }, + { + "model_id": "T145/ZEUS-8B-V24", + "name": "ZEUS-8B-V24", + "developer": "T145", + "scores": { + "IFEval": 0.6, + "BBH": 0.4778, + "MATH Level 5": 0.1458, + "GPQA": 0.2617, + "MUSR": 0.3729, + "MMLU-PRO": 0.3285 + } + }, + { + "model_id": "T145/ZEUS-8B-V25", + "name": "ZEUS-8B-V25", + "developer": "T145", + "scores": { + "IFEval": 0.332, + "BBH": 0.4547, + "MATH Level 5": 0.2039, + "GPQA": 0.2643, + "MUSR": 0.3488, + "MMLU-PRO": 0.2885 + } + }, + { + "model_id": "T145/ZEUS-8B-V26", + "name": "ZEUS-8B-V26", + "developer": "T145", + "scores": { + "IFEval": 0.6708, + "BBH": 0.5232, + "MATH Level 5": 0.1246, + "GPQA": 0.2953, + "MUSR": 0.4016, + "MMLU-PRO": 0.3907 + } + }, + { + "model_id": "T145/ZEUS-8B-V27", + "name": "ZEUS-8B-V27", + "developer": "T145", + "scores": { + "IFEval": 0.6544, + "BBH": 0.523, + "MATH Level 5": 0.1344, + "GPQA": 0.3079, + "MUSR": 0.3977, + "MMLU-PRO": 0.3902 + } + }, + { + "model_id": "T145/ZEUS-8B-V28", + "name": "ZEUS-8B-V28", + "developer": "T145", + "scores": { + "IFEval": 0.6353, + "BBH": 0.5254, + "MATH Level 5": 0.1269, + "GPQA": 0.3037, + "MUSR": 0.3896, + "MMLU-PRO": 0.3902 + } + }, + { + "model_id": "T145/ZEUS-8B-V29", + "name": "ZEUS-8B-V29", + "developer": "T145", + "scores": { + "IFEval": 0.7418, + "BBH": 0.5253, + "MATH Level 5": 0.1601, + "GPQA": 0.3263, + "MUSR": 0.4003, + "MMLU-PRO": 0.392 + } + }, + { + "model_id": "T145/ZEUS-8B-V2L1", + "name": "ZEUS-8B-V2L1", + "developer": "T145", + "scores": { + "IFEval": 0.3192, + "BBH": 0.5013, + "MATH Level 5": 0.1239, + "GPQA": 0.3129, + "MUSR": 0.3882, + "MMLU-PRO": 0.3638 + } + }, + { + "model_id": "T145/ZEUS-8B-V2L2", + "name": "ZEUS-8B-V2L2", + "developer": "T145", + "scores": { + "IFEval": 0.8021, + "BBH": 0.5203, + "MATH Level 5": 0.2017, + "GPQA": 0.2995, + "MUSR": 0.3975, + "MMLU-PRO": 0.3884 + } + }, + { + "model_id": "T145/ZEUS-8B-V3", + "name": "ZEUS-8B-V3", + "developer": "T145", + "scores": { + "IFEval": 0.7887, + "BBH": 0.5265, + "MATH Level 5": 0.1677, + "GPQA": 0.3221, + "MUSR": 0.4017, + "MMLU-PRO": 0.3804 + } + }, + { + "model_id": "T145/ZEUS-8B-V30", + "name": "ZEUS-8B-V30", + "developer": "T145", + "scores": { + "IFEval": 0.7436, + "BBH": 0.5243, + "MATH Level 5": 0.1586, + "GPQA": 0.3205, + "MUSR": 0.4029, + "MMLU-PRO": 0.3944 + } + }, + { + "model_id": "T145/ZEUS-8B-V4", + "name": "ZEUS-8B-V4", + "developer": "T145", + "scores": { + "IFEval": 0.7807, + "BBH": 0.5246, + "MATH Level 5": 0.1926, + "GPQA": 0.307, + "MUSR": 0.4029, + "MMLU-PRO": 0.3788 + } + }, + { + "model_id": "T145/ZEUS-8B-V6", + "name": "ZEUS-8B-V6", + "developer": "T145", + "scores": { + "IFEval": 0.7838, + "BBH": 0.524, + "MATH Level 5": 0.2024, + "GPQA": 0.3045, + "MUSR": 0.4068, + "MMLU-PRO": 0.3759 + } + }, + { + "model_id": "T145/ZEUS-8B-V7", + "name": "ZEUS-8B-V7", + "developer": "T145", + "scores": { + "IFEval": 0.7786, + "BBH": 0.507, + "MATH Level 5": 0.148, + "GPQA": 0.297, + "MUSR": 0.4162, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "T145/ZEUS-8B-V8", + "name": "ZEUS-8B-V8", + "developer": "T145", + "scores": { + "IFEval": 0.7914, + "BBH": 0.5065, + "MATH Level 5": 0.1329, + "GPQA": 0.2878, + "MUSR": 0.4214, + "MMLU-PRO": 0.3761 + } + }, + { + "model_id": "T145/ZEUS-8B-V9", + "name": "ZEUS-8B-V9", + "developer": "T145", + "scores": { + "IFEval": 0.5551, + "BBH": 0.5207, + "MATH Level 5": 0.2137, + "GPQA": 0.2911, + "MUSR": 0.3949, + "MMLU-PRO": 0.3901 + } + }, + { + "model_id": "T145/qwen-2.5-3B-merge-test", + "name": "qwen-2.5-3B-merge-test", + "developer": "T145", + "scores": { + "IFEval": 0.5751, + "BBH": 0.4842, + "MATH Level 5": 0.3202, + "GPQA": 0.2852, + "MUSR": 0.4007, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "THUDM/glm-4-9b", + "name": "glm-4-9b", + "developer": "THUDM", + "scores": { + "IFEval": 0.1426, + "BBH": 0.5528, + "MATH Level 5": 0.0, + "GPQA": 0.3163, + "MUSR": 0.4386, + "MMLU-PRO": 0.4145 + } + }, + { + "model_id": "THUDM/glm-4-9b-chat", + "name": "glm-4-9b-chat", + "developer": "THUDM", + "scores": { + "IFEval": 0.0, + "BBH": 0.4736, + "MATH Level 5": 0.0, + "GPQA": 0.3138, + "MUSR": 0.3994, + "MMLU-PRO": 0.3167 + } + }, + { + "model_id": "THUDM/glm-4-9b-chat-1m", + "name": "glm-4-9b-chat-1m", + "developer": "THUDM", + "scores": { + "IFEval": 0.0, + "BBH": 0.418, + "MATH Level 5": 0.0, + "GPQA": 0.3037, + "MUSR": 0.3795, + "MMLU-PRO": 0.3163 + } + }, + { + "model_id": "THUDM/glm-4-9b-chat-1m-hf", + "name": "glm-4-9b-chat-1m-hf", + "developer": "THUDM", + "scores": { + "IFEval": 0.5341, + "BBH": 0.3901, + "MATH Level 5": 0.0483, + "GPQA": 0.2919, + "MUSR": 0.3689, + "MMLU-PRO": 0.1814 + } + }, + { + "model_id": "THUDM/glm-4-9b-chat-hf", + "name": "glm-4-9b-chat-hf", + "developer": "THUDM", + "scores": { + "IFEval": 0.6513, + "BBH": 0.4432, + "MATH Level 5": 0.0846, + "GPQA": 0.3029, + "MUSR": 0.3593, + "MMLU-PRO": 0.2774 + } + }, + { + "model_id": "TIGER-Lab/AceCodeRM-7B", + "name": "AceCodeRM-7B", + "developer": "TIGER-Lab", + "scores": { + "IFEval": 0.5855, + "BBH": 0.4773, + "MATH Level 5": 0.3467, + "GPQA": 0.3045, + "MUSR": 0.4192, + "MMLU-PRO": 0.3361 + } + }, + { + "model_id": "TIGER-Lab/AceCoder-Qwen2.5-7B-Ins-Rule", + "name": "AceCoder-Qwen2.5-7B-Ins-Rule", + "developer": "TIGER-Lab", + "scores": { + "IFEval": 0.7424, + "BBH": 0.5404, + "MATH Level 5": 0.4992, + "GPQA": 0.3012, + "MUSR": 0.398, + "MMLU-PRO": 0.4322 + } + }, + { + "model_id": "TIGER-Lab/AceCoder-Qwen2.5-Coder-7B-Base-Rule", + "name": "AceCoder-Qwen2.5-Coder-7B-Base-Rule", + "developer": "TIGER-Lab", + "scores": { + "IFEval": 0.4408, + "BBH": 0.4902, + "MATH Level 5": 0.2017, + "GPQA": 0.2718, + "MUSR": 0.3449, + "MMLU-PRO": 0.3745 + } + }, + { + "model_id": "TIGER-Lab/AceCoder-Qwen2.5-Coder-7B-Ins-Rule", + "name": "AceCoder-Qwen2.5-Coder-7B-Ins-Rule", + "developer": "TIGER-Lab", + "scores": { + "IFEval": 0.6222, + "BBH": 0.5089, + "MATH Level 5": 0.3603, + "GPQA": 0.2777, + "MUSR": 0.4046, + "MMLU-PRO": 0.3428 + } + }, + { + "model_id": "TIGER-Lab/MAmmoTH2-7B-Plus", + "name": "MAmmoTH2-7B-Plus", + "developer": "TIGER-Lab", + "scores": { + "IFEval": 0.5575, + "BBH": 0.4235, + "MATH Level 5": 0.1858, + "GPQA": 0.2802, + "MUSR": 0.4124, + "MMLU-PRO": 0.3017 + } + }, + { + "model_id": "TIGER-Lab/Qwen2.5-Math-7B-CFT", + "name": "Qwen2.5-Math-7B-CFT", + "developer": "TIGER-Lab", + "scores": { + "IFEval": 0.2777, + "BBH": 0.4637, + "MATH Level 5": 0.5574, + "GPQA": 0.2861, + "MUSR": 0.3887, + "MMLU-PRO": 0.2945 + } + }, + { + "model_id": "TTTXXX01/Mistral-7B-Base-SimPO2-5e-7", + "name": "Mistral-7B-Base-SimPO2-5e-7", + "developer": "TTTXXX01", + "scores": { + "IFEval": 0.4392, + "BBH": 0.432, + "MATH Level 5": 0.0264, + "GPQA": 0.2978, + "MUSR": 0.3604, + "MMLU-PRO": 0.2766 + } + }, + { + "model_id": "Tarek07/Progenitor-V1.1-LLaMa-70B", + "name": "Progenitor-V1.1-LLaMa-70B", + "developer": "Tarek07", + "scores": { + "IFEval": 0.6906, + "BBH": 0.6971, + "MATH Level 5": 0.3573, + "GPQA": 0.4581, + "MUSR": 0.4736, + "MMLU-PRO": 0.5465 + } + }, + { + "model_id": "Tarek07/Thalassic-Alpha-LLaMa-70B", + "name": "Thalassic-Alpha-LLaMa-70B", + "developer": "Tarek07", + "scores": { + "IFEval": 0.7003, + "BBH": 0.694, + "MATH Level 5": 0.315, + "GPQA": 0.4438, + "MUSR": 0.4802, + "MMLU-PRO": 0.5435 + } + }, + { + "model_id": "TeeZee/DoubleBagel-57B-v1.0", + "name": "DoubleBagel-57B-v1.0", + "developer": "TeeZee", + "scores": { + "IFEval": 0.2336, + "BBH": 0.3251, + "MATH Level 5": 0.0098, + "GPQA": 0.276, + "MUSR": 0.4315, + "MMLU-PRO": 0.1478 + } + }, + { + "model_id": "Telugu-LLM-Labs/Indic-gemma-2b-finetuned-sft-Navarasa-2.0", + "name": "Indic-gemma-2b-finetuned-sft-Navarasa-2.0", + "developer": "Telugu-LLM-Labs", + "scores": { + "IFEval": 0.2103, + "BBH": 0.3241, + "MATH Level 5": 0.0272, + "GPQA": 0.2433, + "MUSR": 0.3899, + "MMLU-PRO": 0.1279 + } + }, + { + "model_id": "Telugu-LLM-Labs/Indic-gemma-7b-finetuned-sft-Navarasa-2.0", + "name": "Indic-gemma-7b-finetuned-sft-Navarasa-2.0", + "developer": "Telugu-LLM-Labs", + "scores": { + "IFEval": 0.3237, + "BBH": 0.4023, + "MATH Level 5": 0.0257, + "GPQA": 0.2701, + "MUSR": 0.4083, + "MMLU-PRO": 0.235 + } + }, + { + "model_id": "TencentARC/LLaMA-Pro-8B", + "name": "LLaMA-Pro-8B", + "developer": "TencentARC", + "scores": { + "IFEval": 0.2277, + "BBH": 0.3484, + "MATH Level 5": 0.0189, + "GPQA": 0.2601, + "MUSR": 0.4018, + "MMLU-PRO": 0.1811 + } + }, + { + "model_id": "TencentARC/LLaMA-Pro-8B-Instruct", + "name": "LLaMA-Pro-8B-Instruct", + "developer": "TencentARC", + "scores": { + "IFEval": 0.4486, + "BBH": 0.4224, + "MATH Level 5": 0.0249, + "GPQA": 0.2743, + "MUSR": 0.419, + "MMLU-PRO": 0.1946 + } + }, + { + "model_id": "TencentARC/MetaMath-Mistral-Pro", + "name": "MetaMath-Mistral-Pro", + "developer": "TencentARC", + "scores": { + "IFEval": 0.2119, + "BBH": 0.4413, + "MATH Level 5": 0.0763, + "GPQA": 0.2693, + "MUSR": 0.3524, + "MMLU-PRO": 0.2472 + } + }, + { + "model_id": "TencentARC/Mistral_Pro_8B_v0.1", + "name": "Mistral_Pro_8B_v0.1", + "developer": "TencentARC", + "scores": { + "IFEval": 0.2115, + "BBH": 0.4526, + "MATH Level 5": 0.0566, + "GPQA": 0.2802, + "MUSR": 0.4242, + "MMLU-PRO": 0.2765 + } + }, + { + "model_id": "TheDrummer/Cydonia-22B-v1.2", + "name": "Cydonia-22B-v1.2", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.5635, + "BBH": 0.5809, + "MATH Level 5": 0.2032, + "GPQA": 0.3305, + "MUSR": 0.4022, + "MMLU-PRO": 0.4141 + } + }, + { + "model_id": "TheDrummer/Gemmasutra-9B-v1", + "name": "Gemmasutra-9B-v1", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.2416, + "BBH": 0.5887, + "MATH Level 5": 0.0831, + "GPQA": 0.3104, + "MUSR": 0.4846, + "MMLU-PRO": 0.4045 + } + }, + { + "model_id": "TheDrummer/Gemmasutra-Mini-2B-v1", + "name": "Gemmasutra-Mini-2B-v1", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.2549, + "BBH": 0.3575, + "MATH Level 5": 0.0378, + "GPQA": 0.271, + "MUSR": 0.349, + "MMLU-PRO": 0.2055 + } + }, + { + "model_id": "TheDrummer/Llama-3SOME-8B-v2", + "name": "Llama-3SOME-8B-v2", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.4508, + "BBH": 0.5203, + "MATH Level 5": 0.0937, + "GPQA": 0.302, + "MUSR": 0.3833, + "MMLU-PRO": 0.3753 + } + }, + { + "model_id": "TheDrummer/Ministrations-8B-v1", + "name": "Ministrations-8B-v1", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.2822, + "BBH": 0.4877, + "MATH Level 5": 0.1843, + "GPQA": 0.3247, + "MUSR": 0.4449, + "MMLU-PRO": 0.3644 + } + }, + { + "model_id": "TheDrummer/Rocinante-12B-v1", + "name": "Rocinante-12B-v1", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.6076, + "BBH": 0.5065, + "MATH Level 5": 0.1269, + "GPQA": 0.2911, + "MUSR": 0.4017, + "MMLU-PRO": 0.3477 + } + }, + { + "model_id": "TheDrummer/Tiger-Gemma-9B-v1", + "name": "Tiger-Gemma-9B-v1", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.7282, + "BBH": 0.5704, + "MATH Level 5": 0.1835, + "GPQA": 0.3389, + "MUSR": 0.4162, + "MMLU-PRO": 0.4118 + } + }, + { + "model_id": "TheDrummer/Tiger-Gemma-9B-v2", + "name": "Tiger-Gemma-9B-v2", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.6986, + "BBH": 0.5617, + "MATH Level 5": 0.182, + "GPQA": 0.3398, + "MUSR": 0.4084, + "MMLU-PRO": 0.4112 + } + }, + { + "model_id": "TheDrummer/Tiger-Gemma-9B-v3", + "name": "Tiger-Gemma-9B-v3", + "developer": "TheDrummer", + "scores": { + "IFEval": 0.6821, + "BBH": 0.5812, + "MATH Level 5": 0.1624, + "GPQA": 0.3389, + "MUSR": 0.4004, + "MMLU-PRO": 0.4059 + } + }, + { + "model_id": "TheDrunkenSnail/Daughter-of-Rhodia-12B", + "name": "Daughter-of-Rhodia-12B", + "developer": "TheDrunkenSnail", + "scores": { + "IFEval": 0.6904, + "BBH": 0.5179, + "MATH Level 5": 0.1224, + "GPQA": 0.3171, + "MUSR": 0.4348, + "MMLU-PRO": 0.3641 + } + }, + { + "model_id": "TheDrunkenSnail/Mother-of-Rhodia-12B", + "name": "Mother-of-Rhodia-12B", + "developer": "TheDrunkenSnail", + "scores": { + "IFEval": 0.6505, + "BBH": 0.4948, + "MATH Level 5": 0.1224, + "GPQA": 0.2987, + "MUSR": 0.4124, + "MMLU-PRO": 0.3551 + } + }, + { + "model_id": "TheDrunkenSnail/Son-of-Rhodia", + "name": "Son-of-Rhodia", + "developer": "TheDrunkenSnail", + "scores": { + "IFEval": 0.7046, + "BBH": 0.5097, + "MATH Level 5": 0.1314, + "GPQA": 0.3129, + "MUSR": 0.4203, + "MMLU-PRO": 0.3608 + } + }, + { + "model_id": "TheHierophant/Underground-Cognitive-V0.3-test", + "name": "Underground-Cognitive-V0.3-test", + "developer": "TheHierophant", + "scores": { + "IFEval": 0.4808, + "BBH": 0.529, + "MATH Level 5": 0.0589, + "GPQA": 0.2987, + "MUSR": 0.4351, + "MMLU-PRO": 0.3318 + } + }, + { + "model_id": "TheTsar1209/nemo-carpmuscle-v0.1", + "name": "nemo-carpmuscle-v0.1", + "developer": "TheTsar1209", + "scores": { + "IFEval": 0.2276, + "BBH": 0.5084, + "MATH Level 5": 0.0476, + "GPQA": 0.297, + "MUSR": 0.4135, + "MMLU-PRO": 0.3406 + } + }, + { + "model_id": "TheTsar1209/qwen-carpmuscle-r-v0.3", + "name": "qwen-carpmuscle-r-v0.3", + "developer": "TheTsar1209", + "scores": { + "IFEval": 0.4455, + "BBH": 0.6227, + "MATH Level 5": 0.3006, + "GPQA": 0.3507, + "MUSR": 0.4278, + "MMLU-PRO": 0.5103 + } + }, + { + "model_id": "TheTsar1209/qwen-carpmuscle-v0.1", + "name": "qwen-carpmuscle-v0.1", + "developer": "TheTsar1209", + "scores": { + "IFEval": 0.5622, + "BBH": 0.6434, + "MATH Level 5": 0.2628, + "GPQA": 0.344, + "MUSR": 0.4161, + "MMLU-PRO": 0.52 + } + }, + { + "model_id": "TheTsar1209/qwen-carpmuscle-v0.2", + "name": "qwen-carpmuscle-v0.2", + "developer": "TheTsar1209", + "scores": { + "IFEval": 0.5257, + "BBH": 0.6387, + "MATH Level 5": 0.2832, + "GPQA": 0.3557, + "MUSR": 0.4346, + "MMLU-PRO": 0.5147 + } + }, + { + "model_id": "TheTsar1209/qwen-carpmuscle-v0.3", + "name": "qwen-carpmuscle-v0.3", + "developer": "TheTsar1209", + "scores": { + "IFEval": 0.4476, + "BBH": 0.6152, + "MATH Level 5": 0.3134, + "GPQA": 0.3565, + "MUSR": 0.4132, + "MMLU-PRO": 0.5062 + } + }, + { + "model_id": "TheTsar1209/qwen-carpmuscle-v0.4", + "name": "qwen-carpmuscle-v0.4", + "developer": "TheTsar1209", + "scores": { + "IFEval": 0.7202, + "BBH": 0.6454, + "MATH Level 5": 0.2772, + "GPQA": 0.3523, + "MUSR": 0.4516, + "MMLU-PRO": 0.5144 + } + }, + { + "model_id": "TheTsar1209/qwen-carpmuscle-v0.4.1", + "name": "qwen-carpmuscle-v0.4.1", + "developer": "TheTsar1209", + "scores": { + "IFEval": 0.736, + "BBH": 0.6507, + "MATH Level 5": 0.2779, + "GPQA": 0.3456, + "MUSR": 0.4489, + "MMLU-PRO": 0.5191 + } + }, + { + "model_id": "Tijmen2/cosmosage-v3", + "name": "cosmosage-v3", + "developer": "Tijmen2", + "scores": { + "IFEval": 0.4482, + "BBH": 0.4551, + "MATH Level 5": 0.0506, + "GPQA": 0.2827, + "MUSR": 0.4199, + "MMLU-PRO": 0.2486 + } + }, + { + "model_id": "TinyLlama/TinyLlama-1.1B-Chat-v0.1", + "name": "TinyLlama-1.1B-Chat-v0.1", + "developer": "TinyLlama", + "scores": { + "IFEval": 0.1479, + "BBH": 0.3084, + "MATH Level 5": 0.006, + "GPQA": 0.229, + "MUSR": 0.3592, + "MMLU-PRO": 0.1098 + } + }, + { + "model_id": "TinyLlama/TinyLlama-1.1B-Chat-v0.5", + "name": "TinyLlama-1.1B-Chat-v0.5", + "developer": "TinyLlama", + "scores": { + "IFEval": 0.1634, + "BBH": 0.3105, + "MATH Level 5": 0.0038, + "GPQA": 0.2483, + "MUSR": 0.3661, + "MMLU-PRO": 0.1096 + } + }, + { + "model_id": "TinyLlama/TinyLlama-1.1B-Chat-v0.6", + "name": "TinyLlama-1.1B-Chat-v0.6", + "developer": "TinyLlama", + "scores": { + "IFEval": 0.1574, + "BBH": 0.3067, + "MATH Level 5": 0.0159, + "GPQA": 0.2584, + "MUSR": 0.3422, + "MMLU-PRO": 0.1149 + } + }, + { + "model_id": "TinyLlama/TinyLlama-1.1B-Chat-v1.0", + "name": "TinyLlama-1.1B-Chat-v1.0", + "developer": "TinyLlama", + "scores": { + "IFEval": 0.0596, + "BBH": 0.3104, + "MATH Level 5": 0.0151, + "GPQA": 0.25, + "MUSR": 0.3515, + "MMLU-PRO": 0.1101 + } + }, + { + "model_id": "TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T", + "name": "TinyLlama-1.1B-intermediate-step-1431k-3T", + "developer": "TinyLlama", + "scores": { + "IFEval": 0.2277, + "BBH": 0.3071, + "MATH Level 5": 0.0121, + "GPQA": 0.2525, + "MUSR": 0.338, + "MMLU-PRO": 0.112 + } + }, + { + "model_id": "TinyLlama/TinyLlama_v1.1", + "name": "TinyLlama_v1.1", + "developer": "TinyLlama", + "scores": { + "IFEval": 0.2001, + "BBH": 0.3024, + "MATH Level 5": 0.0121, + "GPQA": 0.2458, + "MUSR": 0.37, + "MMLU-PRO": 0.1049 + } + }, + { + "model_id": "ToastyPigeon/Sto-vo-kor-12B", + "name": "Sto-vo-kor-12B", + "developer": "ToastyPigeon", + "scores": { + "IFEval": 0.5501, + "BBH": 0.5065, + "MATH Level 5": 0.1088, + "GPQA": 0.3054, + "MUSR": 0.3938, + "MMLU-PRO": 0.3398 + } + }, + { + "model_id": "Trappu/Magnum-Picaro-0.7-v2-12b", + "name": "Magnum-Picaro-0.7-v2-12b", + "developer": "Trappu", + "scores": { + "IFEval": 0.3003, + "BBH": 0.5507, + "MATH Level 5": 0.0665, + "GPQA": 0.323, + "MUSR": 0.4727, + "MMLU-PRO": 0.358 + } + }, + { + "model_id": "Trappu/Nemo-Picaro-12B", + "name": "Nemo-Picaro-12B", + "developer": "Trappu", + "scores": { + "IFEval": 0.2577, + "BBH": 0.549, + "MATH Level 5": 0.0846, + "GPQA": 0.3272, + "MUSR": 0.4726, + "MMLU-PRO": 0.3605 + } + }, + { + "model_id": "Tremontaine/L3-12B-Lunaris-v1", + "name": "L3-12B-Lunaris-v1", + "developer": "Tremontaine", + "scores": { + "IFEval": 0.6909, + "BBH": 0.523, + "MATH Level 5": 0.0876, + "GPQA": 0.3096, + "MUSR": 0.3674, + "MMLU-PRO": 0.3775 + } + }, + { + "model_id": "Triangle104/Annunaki-12b", + "name": "Annunaki-12b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3872, + "BBH": 0.5499, + "MATH Level 5": 0.1216, + "GPQA": 0.3213, + "MUSR": 0.4409, + "MMLU-PRO": 0.3721 + } + }, + { + "model_id": "Triangle104/BigTalker-Lite-8B", + "name": "BigTalker-Lite-8B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3689, + "BBH": 0.5308, + "MATH Level 5": 0.102, + "GPQA": 0.3104, + "MUSR": 0.4208, + "MMLU-PRO": 0.3431 + } + }, + { + "model_id": "Triangle104/Chatty-Harry_V2.0", + "name": "Chatty-Harry_V2.0", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3326, + "BBH": 0.5319, + "MATH Level 5": 0.139, + "GPQA": 0.323, + "MUSR": 0.4078, + "MMLU-PRO": 0.3683 + } + }, + { + "model_id": "Triangle104/Chatty-Harry_V3.0", + "name": "Chatty-Harry_V3.0", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3675, + "BBH": 0.5526, + "MATH Level 5": 0.1125, + "GPQA": 0.323, + "MUSR": 0.4408, + "MMLU-PRO": 0.3702 + } + }, + { + "model_id": "Triangle104/Chronos-Prism_V1.0", + "name": "Chronos-Prism_V1.0", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3259, + "BBH": 0.5554, + "MATH Level 5": 0.1201, + "GPQA": 0.3096, + "MUSR": 0.4263, + "MMLU-PRO": 0.3673 + } + }, + { + "model_id": "Triangle104/DS-Distilled-Hermes-Llama-3.1", + "name": "DS-Distilled-Hermes-Llama-3.1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3229, + "BBH": 0.5117, + "MATH Level 5": 0.2931, + "GPQA": 0.3188, + "MUSR": 0.4039, + "MMLU-PRO": 0.311 + } + }, + { + "model_id": "Triangle104/DS-Distilled-Hermes-Llama-3.1_TIES", + "name": "DS-Distilled-Hermes-Llama-3.1_TIES", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1364, + "BBH": 0.2928, + "MATH Level 5": 0.0091, + "GPQA": 0.245, + "MUSR": 0.3621, + "MMLU-PRO": 0.1104 + } + }, + { + "model_id": "Triangle104/DS-R1-Distill-Q2.5-10B-Harmony", + "name": "DS-R1-Distill-Q2.5-10B-Harmony", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1751, + "BBH": 0.2643, + "MATH Level 5": 0.0, + "GPQA": 0.2106, + "MUSR": 0.3128, + "MMLU-PRO": 0.1173 + } + }, + { + "model_id": "Triangle104/DS-R1-Distill-Q2.5-14B-Harmony_V0.1", + "name": "DS-R1-Distill-Q2.5-14B-Harmony_V0.1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4515, + "BBH": 0.5783, + "MATH Level 5": 0.5551, + "GPQA": 0.3935, + "MUSR": 0.5567, + "MMLU-PRO": 0.4601 + } + }, + { + "model_id": "Triangle104/DS-R1-Distill-Q2.5-7B-RP", + "name": "DS-R1-Distill-Q2.5-7B-RP", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3445, + "BBH": 0.4383, + "MATH Level 5": 0.4683, + "GPQA": 0.3138, + "MUSR": 0.403, + "MMLU-PRO": 0.2891 + } + }, + { + "model_id": "Triangle104/DS-R1-Llama-8B-Harmony", + "name": "DS-R1-Llama-8B-Harmony", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3566, + "BBH": 0.4154, + "MATH Level 5": 0.4282, + "GPQA": 0.2919, + "MUSR": 0.3762, + "MMLU-PRO": 0.2744 + } + }, + { + "model_id": "Triangle104/DSR1-Distill-Llama-Lit-8B", + "name": "DSR1-Distill-Llama-Lit-8B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1885, + "BBH": 0.4284, + "MATH Level 5": 0.352, + "GPQA": 0.3029, + "MUSR": 0.3535, + "MMLU-PRO": 0.2798 + } + }, + { + "model_id": "Triangle104/DSR1-Distill-Qwen-7B-RP", + "name": "DSR1-Distill-Qwen-7B-RP", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3609, + "BBH": 0.4326, + "MATH Level 5": 0.4804, + "GPQA": 0.3196, + "MUSR": 0.4045, + "MMLU-PRO": 0.3028 + } + }, + { + "model_id": "Triangle104/Dark-Chivalry_V1.0", + "name": "Dark-Chivalry_V1.0", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4326, + "BBH": 0.4974, + "MATH Level 5": 0.1314, + "GPQA": 0.2936, + "MUSR": 0.4182, + "MMLU-PRO": 0.3444 + } + }, + { + "model_id": "Triangle104/Distilled-DarkPlanet-Allades-8B", + "name": "Distilled-DarkPlanet-Allades-8B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.346, + "BBH": 0.4634, + "MATH Level 5": 0.4003, + "GPQA": 0.3054, + "MUSR": 0.3538, + "MMLU-PRO": 0.2901 + } + }, + { + "model_id": "Triangle104/Distilled-DarkPlanet-Allades-8B_TIES", + "name": "Distilled-DarkPlanet-Allades-8B_TIES", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3892, + "BBH": 0.5042, + "MATH Level 5": 0.0906, + "GPQA": 0.3146, + "MUSR": 0.3868, + "MMLU-PRO": 0.3401 + } + }, + { + "model_id": "Triangle104/Distilled-Whiskey-8b", + "name": "Distilled-Whiskey-8b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3448, + "BBH": 0.5028, + "MATH Level 5": 0.2545, + "GPQA": 0.3314, + "MUSR": 0.4172, + "MMLU-PRO": 0.3367 + } + }, + { + "model_id": "Triangle104/Dolphin3-Llama3.2-Smart", + "name": "Dolphin3-Llama3.2-Smart", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4137, + "BBH": 0.3975, + "MATH Level 5": 0.0438, + "GPQA": 0.2693, + "MUSR": 0.3922, + "MMLU-PRO": 0.2195 + } + }, + { + "model_id": "Triangle104/Gemmadevi-Stock-10B", + "name": "Gemmadevi-Stock-10B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1582, + "BBH": 0.6066, + "MATH Level 5": 0.0967, + "GPQA": 0.3532, + "MUSR": 0.4621, + "MMLU-PRO": 0.4262 + } + }, + { + "model_id": "Triangle104/Hermes-Llama-3.2-CoT", + "name": "Hermes-Llama-3.2-CoT", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4178, + "BBH": 0.4616, + "MATH Level 5": 0.0952, + "GPQA": 0.2794, + "MUSR": 0.3698, + "MMLU-PRO": 0.2947 + } + }, + { + "model_id": "Triangle104/Hermes-Llama-3.2-CoT-Summary", + "name": "Hermes-Llama-3.2-CoT-Summary", + "developer": "Triangle104", + "scores": { + "IFEval": 0.483, + "BBH": 0.42, + "MATH Level 5": 0.0831, + "GPQA": 0.2559, + "MUSR": 0.3575, + "MMLU-PRO": 0.2901 + } + }, + { + "model_id": "Triangle104/Hermes3-L3.1-DirtyHarry-8B", + "name": "Hermes3-L3.1-DirtyHarry-8B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3242, + "BBH": 0.5066, + "MATH Level 5": 0.0718, + "GPQA": 0.302, + "MUSR": 0.4069, + "MMLU-PRO": 0.3339 + } + }, + { + "model_id": "Triangle104/Herodotos-14B", + "name": "Herodotos-14B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4667, + "BBH": 0.6435, + "MATH Level 5": 0.5045, + "GPQA": 0.3733, + "MUSR": 0.4795, + "MMLU-PRO": 0.529 + } + }, + { + "model_id": "Triangle104/Herodotos-14B_V0.1", + "name": "Herodotos-14B_V0.1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1879, + "BBH": 0.3017, + "MATH Level 5": 0.0, + "GPQA": 0.224, + "MUSR": 0.3684, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "Triangle104/L3.1-8B-Dusky-Ink", + "name": "L3.1-8B-Dusky-Ink", + "developer": "Triangle104", + "scores": { + "IFEval": 0.453, + "BBH": 0.5098, + "MATH Level 5": 0.1231, + "GPQA": 0.2894, + "MUSR": 0.4224, + "MMLU-PRO": 0.3683 + } + }, + { + "model_id": "Triangle104/L3.1-8B-Dusky-Ink_v0.r1", + "name": "L3.1-8B-Dusky-Ink_v0.r1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1985, + "BBH": 0.4337, + "MATH Level 5": 0.0431, + "GPQA": 0.3037, + "MUSR": 0.3988, + "MMLU-PRO": 0.3206 + } + }, + { + "model_id": "Triangle104/LThreePointOne-8B-HermesBlackroot", + "name": "LThreePointOne-8B-HermesBlackroot", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1792, + "BBH": 0.4998, + "MATH Level 5": 0.0196, + "GPQA": 0.307, + "MUSR": 0.3586, + "MMLU-PRO": 0.3285 + } + }, + { + "model_id": "Triangle104/LThreePointOne-8B-HermesInk", + "name": "LThreePointOne-8B-HermesInk", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4031, + "BBH": 0.5223, + "MATH Level 5": 0.1722, + "GPQA": 0.323, + "MUSR": 0.4129, + "MMLU-PRO": 0.3467 + } + }, + { + "model_id": "Triangle104/Llama3.1-Allades-Lit-8b", + "name": "Llama3.1-Allades-Lit-8b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.2461, + "BBH": 0.4183, + "MATH Level 5": 0.0023, + "GPQA": 0.2844, + "MUSR": 0.3708, + "MMLU-PRO": 0.2724 + } + }, + { + "model_id": "Triangle104/Llama3.1-cc-Lit-8b", + "name": "Llama3.1-cc-Lit-8b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.2993, + "BBH": 0.3848, + "MATH Level 5": 0.003, + "GPQA": 0.2777, + "MUSR": 0.3854, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "Triangle104/Minerva-1.5b", + "name": "Minerva-1.5b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.2694, + "BBH": 0.4026, + "MATH Level 5": 0.1027, + "GPQA": 0.3104, + "MUSR": 0.3655, + "MMLU-PRO": 0.2698 + } + }, + { + "model_id": "Triangle104/Minerva-1.5b_V0.2", + "name": "Minerva-1.5b_V0.2", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3083, + "BBH": 0.3989, + "MATH Level 5": 0.114, + "GPQA": 0.2852, + "MUSR": 0.396, + "MMLU-PRO": 0.2911 + } + }, + { + "model_id": "Triangle104/Minerva-10b", + "name": "Minerva-10b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1879, + "BBH": 0.4462, + "MATH Level 5": 0.0, + "GPQA": 0.281, + "MUSR": 0.3627, + "MMLU-PRO": 0.2318 + } + }, + { + "model_id": "Triangle104/Minerva-14b", + "name": "Minerva-14b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3468, + "BBH": 0.6301, + "MATH Level 5": 0.3051, + "GPQA": 0.3742, + "MUSR": 0.4766, + "MMLU-PRO": 0.5194 + } + }, + { + "model_id": "Triangle104/Minerva-14b-V0.1", + "name": "Minerva-14b-V0.1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.0861, + "BBH": 0.609, + "MATH Level 5": 0.3051, + "GPQA": 0.3658, + "MUSR": 0.47, + "MMLU-PRO": 0.5118 + } + }, + { + "model_id": "Triangle104/Minerva-7b", + "name": "Minerva-7b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3724, + "BBH": 0.5498, + "MATH Level 5": 0.284, + "GPQA": 0.323, + "MUSR": 0.4143, + "MMLU-PRO": 0.4444 + } + }, + { + "model_id": "Triangle104/Minerva-8b", + "name": "Minerva-8b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1721, + "BBH": 0.4669, + "MATH Level 5": 0.0045, + "GPQA": 0.3121, + "MUSR": 0.4273, + "MMLU-PRO": 0.3089 + } + }, + { + "model_id": "Triangle104/Mistral-Redemption-Arc", + "name": "Mistral-Redemption-Arc", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4029, + "BBH": 0.6255, + "MATH Level 5": 0.4101, + "GPQA": 0.3473, + "MUSR": 0.4595, + "MMLU-PRO": 0.451 + } + }, + { + "model_id": "Triangle104/Mistral-Small-24b-Harmony", + "name": "Mistral-Small-24b-Harmony", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1687, + "BBH": 0.6434, + "MATH Level 5": 0.1911, + "GPQA": 0.3842, + "MUSR": 0.4276, + "MMLU-PRO": 0.5431 + } + }, + { + "model_id": "Triangle104/Pans_Gutenbergum_V0.1", + "name": "Pans_Gutenbergum_V0.1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3097, + "BBH": 0.5541, + "MATH Level 5": 0.1057, + "GPQA": 0.323, + "MUSR": 0.4528, + "MMLU-PRO": 0.3697 + } + }, + { + "model_id": "Triangle104/Pans_Gutenbergum_V0.2", + "name": "Pans_Gutenbergum_V0.2", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3215, + "BBH": 0.5526, + "MATH Level 5": 0.0687, + "GPQA": 0.3121, + "MUSR": 0.4673, + "MMLU-PRO": 0.3585 + } + }, + { + "model_id": "Triangle104/Pantheon_ChatWaifu_V0.2", + "name": "Pantheon_ChatWaifu_V0.2", + "developer": "Triangle104", + "scores": { + "IFEval": 0.2683, + "BBH": 0.5532, + "MATH Level 5": 0.0566, + "GPQA": 0.318, + "MUSR": 0.4755, + "MMLU-PRO": 0.3442 + } + }, + { + "model_id": "Triangle104/Phi-4-AbliteratedRP", + "name": "Phi-4-AbliteratedRP", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4923, + "BBH": 0.6709, + "MATH Level 5": 0.3074, + "GPQA": 0.3951, + "MUSR": 0.5098, + "MMLU-PRO": 0.5308 + } + }, + { + "model_id": "Triangle104/Phi4-RP-o1", + "name": "Phi4-RP-o1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.022, + "BBH": 0.6653, + "MATH Level 5": 0.3776, + "GPQA": 0.3733, + "MUSR": 0.4756, + "MMLU-PRO": 0.5111 + } + }, + { + "model_id": "Triangle104/Phi4-RP-o1-Ablit", + "name": "Phi4-RP-o1-Ablit", + "developer": "Triangle104", + "scores": { + "IFEval": 0.0239, + "BBH": 0.663, + "MATH Level 5": 0.3882, + "GPQA": 0.3633, + "MUSR": 0.4754, + "MMLU-PRO": 0.5105 + } + }, + { + "model_id": "Triangle104/Porpoise-R1-Llama3.2-3b", + "name": "Porpoise-R1-Llama3.2-3b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4352, + "BBH": 0.3824, + "MATH Level 5": 0.0423, + "GPQA": 0.2668, + "MUSR": 0.3576, + "MMLU-PRO": 0.2117 + } + }, + { + "model_id": "Triangle104/Q2.5-14B-Instruct-1M-Harmony", + "name": "Q2.5-14B-Instruct-1M-Harmony", + "developer": "Triangle104", + "scores": { + "IFEval": 0.5986, + "BBH": 0.6339, + "MATH Level 5": 0.3769, + "GPQA": 0.375, + "MUSR": 0.4795, + "MMLU-PRO": 0.5075 + } + }, + { + "model_id": "Triangle104/Q2.5-AthensCOT", + "name": "Q2.5-AthensCOT", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4573, + "BBH": 0.5542, + "MATH Level 5": 0.2915, + "GPQA": 0.3003, + "MUSR": 0.4578, + "MMLU-PRO": 0.4379 + } + }, + { + "model_id": "Triangle104/Q2.5-CodeR1-3B", + "name": "Q2.5-CodeR1-3B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3588, + "BBH": 0.4661, + "MATH Level 5": 0.1639, + "GPQA": 0.3037, + "MUSR": 0.4315, + "MMLU-PRO": 0.2979 + } + }, + { + "model_id": "Triangle104/Q2.5-EVACOT-7b", + "name": "Q2.5-EVACOT-7b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.5784, + "BBH": 0.5506, + "MATH Level 5": 0.2825, + "GPQA": 0.318, + "MUSR": 0.4499, + "MMLU-PRO": 0.4331 + } + }, + { + "model_id": "Triangle104/Q2.5-EvaHumane-RP", + "name": "Q2.5-EvaHumane-RP", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3676, + "BBH": 0.5328, + "MATH Level 5": 0.2923, + "GPQA": 0.3188, + "MUSR": 0.4276, + "MMLU-PRO": 0.4412 + } + }, + { + "model_id": "Triangle104/Q2.5-Humane-RP", + "name": "Q2.5-Humane-RP", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4412, + "BBH": 0.5649, + "MATH Level 5": 0.3391, + "GPQA": 0.3188, + "MUSR": 0.4528, + "MMLU-PRO": 0.4492 + } + }, + { + "model_id": "Triangle104/Q2.5-Instruct-1M_Harmony", + "name": "Q2.5-Instruct-1M_Harmony", + "developer": "Triangle104", + "scores": { + "IFEval": 0.6038, + "BBH": 0.5373, + "MATH Level 5": 0.3323, + "GPQA": 0.323, + "MUSR": 0.4688, + "MMLU-PRO": 0.4366 + } + }, + { + "model_id": "Triangle104/Q2.5-R1-3B", + "name": "Q2.5-R1-3B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.4214, + "BBH": 0.4812, + "MATH Level 5": 0.2674, + "GPQA": 0.3096, + "MUSR": 0.432, + "MMLU-PRO": 0.3813 + } + }, + { + "model_id": "Triangle104/Q2.5-R1-7B", + "name": "Q2.5-R1-7B", + "developer": "Triangle104", + "scores": { + "IFEval": 0.1346, + "BBH": 0.3007, + "MATH Level 5": 0.0166, + "GPQA": 0.2525, + "MUSR": 0.3607, + "MMLU-PRO": 0.118 + } + }, + { + "model_id": "Triangle104/Robo-Gutenberg_V1.0", + "name": "Robo-Gutenberg_V1.0", + "developer": "Triangle104", + "scores": { + "IFEval": 0.6008, + "BBH": 0.6537, + "MATH Level 5": 0.4562, + "GPQA": 0.3859, + "MUSR": 0.4744, + "MMLU-PRO": 0.5391 + } + }, + { + "model_id": "Triangle104/Rocinante-Prism_V2.0", + "name": "Rocinante-Prism_V2.0", + "developer": "Triangle104", + "scores": { + "IFEval": 0.2616, + "BBH": 0.5361, + "MATH Level 5": 0.111, + "GPQA": 0.3205, + "MUSR": 0.445, + "MMLU-PRO": 0.364 + } + }, + { + "model_id": "Triangle104/Rocinante-Prism_V2.1", + "name": "Rocinante-Prism_V2.1", + "developer": "Triangle104", + "scores": { + "IFEval": 0.2558, + "BBH": 0.5333, + "MATH Level 5": 0.1125, + "GPQA": 0.3196, + "MUSR": 0.449, + "MMLU-PRO": 0.3651 + } + }, + { + "model_id": "Triangle104/RomboHermes3-R1-Llama3.2-3b", + "name": "RomboHermes3-R1-Llama3.2-3b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.3007, + "BBH": 0.4264, + "MATH Level 5": 0.0816, + "GPQA": 0.2836, + "MUSR": 0.3657, + "MMLU-PRO": 0.2957 + } + }, + { + "model_id": "Triangle104/Rombos-Novasky-7B_V1c", + "name": "Rombos-Novasky-7B_V1c", + "developer": "Triangle104", + "scores": { + "IFEval": 0.408, + "BBH": 0.4349, + "MATH Level 5": 0.0853, + "GPQA": 0.2961, + "MUSR": 0.4465, + "MMLU-PRO": 0.2738 + } + }, + { + "model_id": "Triangle104/Set-70b", + "name": "Set-70b", + "developer": "Triangle104", + "scores": { + "IFEval": 0.7643, + "BBH": 0.7014, + "MATH Level 5": 0.364, + "GPQA": 0.4463, + "MUSR": 0.4696, + "MMLU-PRO": 0.5442 + } + }, + { + "model_id": "Tsunami-th/Tsunami-0.5-7B-Instruct", + "name": "Tsunami-0.5-7B-Instruct", + "developer": "Tsunami-th", + "scores": { + "IFEval": 0.74, + "BBH": 0.5524, + "MATH Level 5": 0.5045, + "GPQA": 0.3087, + "MUSR": 0.4257, + "MMLU-PRO": 0.4413 + } + }, + { + "model_id": "Tsunami-th/Tsunami-0.5x-7B-Instruct", + "name": "Tsunami-0.5x-7B-Instruct", + "developer": "Tsunami-th", + "scores": { + "IFEval": 0.7099, + "BBH": 0.5593, + "MATH Level 5": 0.4207, + "GPQA": 0.3146, + "MUSR": 0.4667, + "MMLU-PRO": 0.4458 + } + }, + { + "model_id": "Tsunami-th/Tsunami-1.0-14B-Instruct", + "name": "Tsunami-1.0-14B-Instruct", + "developer": "Tsunami-th", + "scores": { + "IFEval": 0.7829, + "BBH": 0.6439, + "MATH Level 5": 0.4585, + "GPQA": 0.3565, + "MUSR": 0.4459, + "MMLU-PRO": 0.5249 + } + }, + { + "model_id": "Tsunami-th/Tsunami-1.0-7B-Instruct", + "name": "Tsunami-1.0-7B-Instruct", + "developer": "Tsunami-th", + "scores": { + "IFEval": 0.7309, + "BBH": 0.5491, + "MATH Level 5": 0.4335, + "GPQA": 0.3129, + "MUSR": 0.4493, + "MMLU-PRO": 0.4424 + } + }, + { + "model_id": "UCLA-AGI/Gemma-2-9B-It-SPPO-Iter1", + "name": "Gemma-2-9B-It-SPPO-Iter1", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.3082, + "BBH": 0.5969, + "MATH Level 5": 0.0899, + "GPQA": 0.3364, + "MUSR": 0.4099, + "MMLU-PRO": 0.3907 + } + }, + { + "model_id": "UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2", + "name": "Gemma-2-9B-It-SPPO-Iter2", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.31, + "BBH": 0.599, + "MATH Level 5": 0.0808, + "GPQA": 0.3347, + "MUSR": 0.4139, + "MMLU-PRO": 0.387 + } + }, + { + "model_id": "UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3", + "name": "Gemma-2-9B-It-SPPO-Iter3", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.3167, + "BBH": 0.6007, + "MATH Level 5": 0.071, + "GPQA": 0.3389, + "MUSR": 0.4166, + "MMLU-PRO": 0.3826 + } + }, + { + "model_id": "UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter1", + "name": "Llama-3-Instruct-8B-SPPO-Iter1", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.7299, + "BBH": 0.5058, + "MATH Level 5": 0.1148, + "GPQA": 0.2676, + "MUSR": 0.3568, + "MMLU-PRO": 0.3711 + } + }, + { + "model_id": "UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter2", + "name": "Llama-3-Instruct-8B-SPPO-Iter2", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.6989, + "BBH": 0.5089, + "MATH Level 5": 0.1035, + "GPQA": 0.2668, + "MUSR": 0.3594, + "MMLU-PRO": 0.3692 + } + }, + { + "model_id": "UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3", + "name": "Llama-3-Instruct-8B-SPPO-Iter3", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.6703, + "BBH": 0.5076, + "MATH Level 5": 0.0718, + "GPQA": 0.2651, + "MUSR": 0.3647, + "MMLU-PRO": 0.3658 + } + }, + { + "model_id": "UCLA-AGI/Mistral7B-PairRM-SPPO", + "name": "Mistral7B-PairRM-SPPO", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.4355, + "BBH": 0.4439, + "MATH Level 5": 0.031, + "GPQA": 0.281, + "MUSR": 0.3965, + "MMLU-PRO": 0.2621 + } + }, + { + "model_id": "UCLA-AGI/Mistral7B-PairRM-SPPO-Iter1", + "name": "Mistral7B-PairRM-SPPO-Iter1", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.5047, + "BBH": 0.4468, + "MATH Level 5": 0.0249, + "GPQA": 0.2836, + "MUSR": 0.3992, + "MMLU-PRO": 0.2695 + } + }, + { + "model_id": "UCLA-AGI/Mistral7B-PairRM-SPPO-Iter2", + "name": "Mistral7B-PairRM-SPPO-Iter2", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.4446, + "BBH": 0.4466, + "MATH Level 5": 0.0219, + "GPQA": 0.2886, + "MUSR": 0.4085, + "MMLU-PRO": 0.2677 + } + }, + { + "model_id": "UCLA-AGI/Mistral7B-PairRM-SPPO-Iter3", + "name": "Mistral7B-PairRM-SPPO-Iter3", + "developer": "UCLA-AGI", + "scores": { + "IFEval": 0.4351, + "BBH": 0.4397, + "MATH Level 5": 0.0234, + "GPQA": 0.2752, + "MUSR": 0.4071, + "MMLU-PRO": 0.2658 + } + }, + { + "model_id": "UKzExecution/LlamaExecutor-8B-3.0.5", + "name": "LlamaExecutor-8B-3.0.5", + "developer": "UKzExecution", + "scores": { + "IFEval": 0.7403, + "BBH": 0.5006, + "MATH Level 5": 0.102, + "GPQA": 0.2559, + "MUSR": 0.3754, + "MMLU-PRO": 0.3625 + } + }, + { + "model_id": "Unbabel/TowerInstruct-Mistral-7B-v0.2", + "name": "TowerInstruct-Mistral-7B-v0.2", + "developer": "Unbabel", + "scores": { + "IFEval": 0.2843, + "BBH": 0.3882, + "MATH Level 5": 0.0204, + "GPQA": 0.2475, + "MUSR": 0.4522, + "MMLU-PRO": 0.1968 + } + }, + { + "model_id": "Undi95/MG-FinalMix-72B", + "name": "MG-FinalMix-72B", + "developer": "Undi95", + "scores": { + "IFEval": 0.8014, + "BBH": 0.6973, + "MATH Level 5": 0.3973, + "GPQA": 0.3851, + "MUSR": 0.4823, + "MMLU-PRO": 0.5427 + } + }, + { + "model_id": "Undi95/Phi4-abliterated", + "name": "Phi4-abliterated", + "developer": "Undi95", + "scores": { + "IFEval": 0.6618, + "BBH": 0.6809, + "MATH Level 5": 0.3701, + "GPQA": 0.3305, + "MUSR": 0.4034, + "MMLU-PRO": 0.5281 + } + }, + { + "model_id": "V3N0M/Jenna-Tiny-2.0", + "name": "Jenna-Tiny-2.0", + "developer": "V3N0M", + "scores": { + "IFEval": 0.2309, + "BBH": 0.3148, + "MATH Level 5": 0.0121, + "GPQA": 0.25, + "MUSR": 0.3367, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "VAGOsolutions/Llama-3-SauerkrautLM-70b-Instruct", + "name": "Llama-3-SauerkrautLM-70b-Instruct", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.8045, + "BBH": 0.6663, + "MATH Level 5": 0.2281, + "GPQA": 0.328, + "MUSR": 0.4339, + "MMLU-PRO": 0.5392 + } + }, + { + "model_id": "VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct", + "name": "Llama-3-SauerkrautLM-8b-Instruct", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.7445, + "BBH": 0.4943, + "MATH Level 5": 0.0665, + "GPQA": 0.3087, + "MUSR": 0.4241, + "MMLU-PRO": 0.3857 + } + }, + { + "model_id": "VAGOsolutions/Llama-3.1-SauerkrautLM-70b-Instruct", + "name": "Llama-3.1-SauerkrautLM-70b-Instruct", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.8656, + "BBH": 0.7006, + "MATH Level 5": 0.3693, + "GPQA": 0.3414, + "MUSR": 0.4711, + "MMLU-PRO": 0.5335 + } + }, + { + "model_id": "VAGOsolutions/Llama-3.1-SauerkrautLM-8b-Instruct", + "name": "Llama-3.1-SauerkrautLM-8b-Instruct", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.8017, + "BBH": 0.5115, + "MATH Level 5": 0.1941, + "GPQA": 0.2903, + "MUSR": 0.4148, + "MMLU-PRO": 0.389 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-1.5b", + "name": "SauerkrautLM-1.5b", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.2404, + "BBH": 0.3704, + "MATH Level 5": 0.0363, + "GPQA": 0.271, + "MUSR": 0.3739, + "MMLU-PRO": 0.2151 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-7b-HerO", + "name": "SauerkrautLM-7b-HerO", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.5346, + "BBH": 0.4904, + "MATH Level 5": 0.0393, + "GPQA": 0.2727, + "MUSR": 0.3924, + "MMLU-PRO": 0.3046 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-7b-LaserChat", + "name": "SauerkrautLM-7b-LaserChat", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.5988, + "BBH": 0.4543, + "MATH Level 5": 0.0778, + "GPQA": 0.3003, + "MUSR": 0.4148, + "MMLU-PRO": 0.3305 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-Gemma-2b", + "name": "SauerkrautLM-Gemma-2b", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.2475, + "BBH": 0.3416, + "MATH Level 5": 0.0279, + "GPQA": 0.2567, + "MUSR": 0.3676, + "MMLU-PRO": 0.1469 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-Gemma-7b", + "name": "SauerkrautLM-Gemma-7b", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.3407, + "BBH": 0.4188, + "MATH Level 5": 0.0672, + "GPQA": 0.2861, + "MUSR": 0.3594, + "MMLU-PRO": 0.2961 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-Mixtral-8x7B-Instruct", + "name": "SauerkrautLM-Mixtral-8x7B-Instruct", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.5602, + "BBH": 0.5277, + "MATH Level 5": 0.0982, + "GPQA": 0.2978, + "MUSR": 0.4204, + "MMLU-PRO": 0.365 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-Nemo-12b-Instruct", + "name": "SauerkrautLM-Nemo-12b-Instruct", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.6113, + "BBH": 0.5214, + "MATH Level 5": 0.1224, + "GPQA": 0.3096, + "MUSR": 0.4469, + "MMLU-PRO": 0.3385 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-Phi-3-medium", + "name": "SauerkrautLM-Phi-3-medium", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.4409, + "BBH": 0.6433, + "MATH Level 5": 0.1601, + "GPQA": 0.3347, + "MUSR": 0.4845, + "MMLU-PRO": 0.4665 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-SOLAR-Instruct", + "name": "SauerkrautLM-SOLAR-Instruct", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.4917, + "BBH": 0.5169, + "MATH Level 5": 0.0634, + "GPQA": 0.3054, + "MUSR": 0.3965, + "MMLU-PRO": 0.3183 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-gemma-2-2b-it", + "name": "SauerkrautLM-gemma-2-2b-it", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.1321, + "BBH": 0.4241, + "MATH Level 5": 0.0219, + "GPQA": 0.2727, + "MUSR": 0.3995, + "MMLU-PRO": 0.2693 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-gemma-2-9b-it", + "name": "SauerkrautLM-gemma-2-9b-it", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.3024, + "BBH": 0.6073, + "MATH Level 5": 0.0838, + "GPQA": 0.3272, + "MUSR": 0.4318, + "MMLU-PRO": 0.4091 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-v2-14b-DPO", + "name": "SauerkrautLM-v2-14b-DPO", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.7412, + "BBH": 0.656, + "MATH Level 5": 0.3165, + "GPQA": 0.3196, + "MUSR": 0.4375, + "MMLU-PRO": 0.5117 + } + }, + { + "model_id": "VAGOsolutions/SauerkrautLM-v2-14b-SFT", + "name": "SauerkrautLM-v2-14b-SFT", + "developer": "VAGOsolutions", + "scores": { + "IFEval": 0.6949, + "BBH": 0.621, + "MATH Level 5": 0.3285, + "GPQA": 0.3356, + "MUSR": 0.4179, + "MMLU-PRO": 0.5205 + } + }, + { + "model_id": "VIRNECT/llama-3-Korean-8B", + "name": "llama-3-Korean-8B", + "developer": "VIRNECT", + "scores": { + "IFEval": 0.5021, + "BBH": 0.4918, + "MATH Level 5": 0.108, + "GPQA": 0.271, + "MUSR": 0.3648, + "MMLU-PRO": 0.3536 + } + }, + { + "model_id": "VIRNECT/llama-3-Korean-8B-r-v-0.1", + "name": "llama-3-Korean-8B-r-v-0.1", + "developer": "VIRNECT", + "scores": { + "IFEval": 0.4916, + "BBH": 0.4806, + "MATH Level 5": 0.0861, + "GPQA": 0.2424, + "MUSR": 0.3675, + "MMLU-PRO": 0.326 + } + }, + { + "model_id": "ValiantLabs/Llama3-70B-Fireplace", + "name": "Llama3-70B-Fireplace", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.7774, + "BBH": 0.6489, + "MATH Level 5": 0.2145, + "GPQA": 0.3549, + "MUSR": 0.4449, + "MMLU-PRO": 0.4893 + } + }, + { + "model_id": "ValiantLabs/Llama3-70B-ShiningValiant2", + "name": "Llama3-70B-ShiningValiant2", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.6122, + "BBH": 0.6338, + "MATH Level 5": 0.2077, + "GPQA": 0.3305, + "MUSR": 0.4326, + "MMLU-PRO": 0.4898 + } + }, + { + "model_id": "ValiantLabs/Llama3.1-70B-ShiningValiant2", + "name": "Llama3.1-70B-ShiningValiant2", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.5355, + "BBH": 0.6738, + "MATH Level 5": 0.2915, + "GPQA": 0.3926, + "MUSR": 0.4681, + "MMLU-PRO": 0.5173 + } + }, + { + "model_id": "ValiantLabs/Llama3.1-8B-Cobalt", + "name": "Llama3.1-8B-Cobalt", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.7168, + "BBH": 0.4911, + "MATH Level 5": 0.1533, + "GPQA": 0.2861, + "MUSR": 0.3512, + "MMLU-PRO": 0.3663 + } + }, + { + "model_id": "ValiantLabs/Llama3.1-8B-Enigma", + "name": "Llama3.1-8B-Enigma", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.2681, + "BBH": 0.4478, + "MATH Level 5": 0.0891, + "GPQA": 0.2878, + "MUSR": 0.4196, + "MMLU-PRO": 0.3409 + } + }, + { + "model_id": "ValiantLabs/Llama3.1-8B-Esper2", + "name": "Llama3.1-8B-Esper2", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.2567, + "BBH": 0.447, + "MATH Level 5": 0.0589, + "GPQA": 0.2727, + "MUSR": 0.3561, + "MMLU-PRO": 0.2904 + } + }, + { + "model_id": "ValiantLabs/Llama3.1-8B-Fireplace2", + "name": "Llama3.1-8B-Fireplace2", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.5483, + "BBH": 0.461, + "MATH Level 5": 0.0582, + "GPQA": 0.2886, + "MUSR": 0.3433, + "MMLU-PRO": 0.2407 + } + }, + { + "model_id": "ValiantLabs/Llama3.1-8B-ShiningValiant2", + "name": "Llama3.1-8B-ShiningValiant2", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.2678, + "BBH": 0.4429, + "MATH Level 5": 0.0521, + "GPQA": 0.302, + "MUSR": 0.3959, + "MMLU-PRO": 0.2927 + } + }, + { + "model_id": "ValiantLabs/Llama3.2-3B-Enigma", + "name": "Llama3.2-3B-Enigma", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.2786, + "BBH": 0.3723, + "MATH Level 5": 0.0438, + "GPQA": 0.2617, + "MUSR": 0.3921, + "MMLU-PRO": 0.2428 + } + }, + { + "model_id": "ValiantLabs/Llama3.2-3B-Esper2", + "name": "Llama3.2-3B-Esper2", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.275, + "BBH": 0.3808, + "MATH Level 5": 0.0363, + "GPQA": 0.2701, + "MUSR": 0.355, + "MMLU-PRO": 0.2257 + } + }, + { + "model_id": "ValiantLabs/Llama3.2-3B-ShiningValiant2", + "name": "Llama3.2-3B-ShiningValiant2", + "developer": "ValiantLabs", + "scores": { + "IFEval": 0.2625, + "BBH": 0.4226, + "MATH Level 5": 0.0823, + "GPQA": 0.2802, + "MUSR": 0.3866, + "MMLU-PRO": 0.2829 + } + }, + { + "model_id": "Vikhrmodels/Vikhr-Llama3.1-8B-Instruct-R-21-09-24", + "name": "Vikhr-Llama3.1-8B-Instruct-R-21-09-24", + "developer": "Vikhrmodels", + "scores": { + "IFEval": 0.6431, + "BBH": 0.5272, + "MATH Level 5": 0.2175, + "GPQA": 0.245, + "MUSR": 0.3754, + "MMLU-PRO": 0.3547 + } + }, + { + "model_id": "Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24", + "name": "Vikhr-Nemo-12B-Instruct-R-21-09-24", + "developer": "Vikhrmodels", + "scores": { + "IFEval": 0.5999, + "BBH": 0.5212, + "MATH Level 5": 0.1715, + "GPQA": 0.2911, + "MUSR": 0.4073, + "MMLU-PRO": 0.3398 + } + }, + { + "model_id": "Weyaxi/Bagel-Hermes-2x34B", + "name": "Bagel-Hermes-2x34B", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.5432, + "BBH": 0.4917, + "MATH Level 5": 0.0604, + "GPQA": 0.328, + "MUSR": 0.4517, + "MMLU-PRO": 0.4589 + } + }, + { + "model_id": "Weyaxi/Bagel-Hermes-34B-Slerp", + "name": "Bagel-Hermes-34B-Slerp", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.4603, + "BBH": 0.5922, + "MATH Level 5": 0.0604, + "GPQA": 0.3347, + "MUSR": 0.4622, + "MMLU-PRO": 0.4703 + } + }, + { + "model_id": "Weyaxi/Einstein-v4-7B", + "name": "Einstein-v4-7B", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.4708, + "BBH": 0.3849, + "MATH Level 5": 0.0189, + "GPQA": 0.2819, + "MUSR": 0.4682, + "MMLU-PRO": 0.2259 + } + }, + { + "model_id": "Weyaxi/Einstein-v6.1-Llama3-8B", + "name": "Einstein-v6.1-Llama3-8B", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.4568, + "BBH": 0.5008, + "MATH Level 5": 0.068, + "GPQA": 0.2819, + "MUSR": 0.4213, + "MMLU-PRO": 0.3131 + } + }, + { + "model_id": "Weyaxi/Einstein-v6.1-developed-by-Weyaxi-Llama3-8B", + "name": "Einstein-v6.1-developed-by-Weyaxi-Llama3-8B", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.3927, + "BBH": 0.5044, + "MATH Level 5": 0.0718, + "GPQA": 0.2735, + "MUSR": 0.4332, + "MMLU-PRO": 0.3093 + } + }, + { + "model_id": "Weyaxi/Einstein-v7-Qwen2-7B", + "name": "Einstein-v7-Qwen2-7B", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.41, + "BBH": 0.5161, + "MATH Level 5": 0.1994, + "GPQA": 0.2995, + "MUSR": 0.44, + "MMLU-PRO": 0.4096 + } + }, + { + "model_id": "Weyaxi/Einstein-v8-Llama3.2-1B", + "name": "Einstein-v8-Llama3.2-1B", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.1862, + "BBH": 0.3018, + "MATH Level 5": 0.0008, + "GPQA": 0.2584, + "MUSR": 0.3618, + "MMLU-PRO": 0.1161 + } + }, + { + "model_id": "Weyaxi/SauerkrautLM-UNA-SOLAR-Instruct", + "name": "SauerkrautLM-UNA-SOLAR-Instruct", + "developer": "Weyaxi", + "scores": { + "IFEval": 0.4573, + "BBH": 0.5166, + "MATH Level 5": 0.0461, + "GPQA": 0.3112, + "MUSR": 0.3979, + "MMLU-PRO": 0.3153 + } + }, + { + "model_id": "WizardLMTeam/WizardLM-13B-V1.0", + "name": "WizardLM-13B-V1.0", + "developer": "WizardLMTeam", + "scores": { + "IFEval": 0.185, + "BBH": 0.2913, + "MATH Level 5": 0.0, + "GPQA": 0.2592, + "MUSR": 0.3497, + "MMLU-PRO": 0.1166 + } + }, + { + "model_id": "WizardLMTeam/WizardLM-13B-V1.2", + "name": "WizardLM-13B-V1.2", + "developer": "WizardLMTeam", + "scores": { + "IFEval": 0.3392, + "BBH": 0.4462, + "MATH Level 5": 0.0189, + "GPQA": 0.2609, + "MUSR": 0.4378, + "MMLU-PRO": 0.2519 + } + }, + { + "model_id": "WizardLMTeam/WizardLM-70B-V1.0", + "name": "WizardLM-70B-V1.0", + "developer": "WizardLMTeam", + "scores": { + "IFEval": 0.4951, + "BBH": 0.559, + "MATH Level 5": 0.0393, + "GPQA": 0.2659, + "MUSR": 0.4391, + "MMLU-PRO": 0.3447 + } + }, + { + "model_id": "Wladastic/Mini-Think-Base-1B", + "name": "Mini-Think-Base-1B", + "developer": "Wladastic", + "scores": { + "IFEval": 0.5588, + "BBH": 0.3574, + "MATH Level 5": 0.0733, + "GPQA": 0.2634, + "MUSR": 0.3275, + "MMLU-PRO": 0.1772 + } + }, + { + "model_id": "Xclbr7/Arcanum-12b", + "name": "Arcanum-12b", + "developer": "Xclbr7", + "scores": { + "IFEval": 0.2907, + "BBH": 0.5265, + "MATH Level 5": 0.1193, + "GPQA": 0.3205, + "MUSR": 0.417, + "MMLU-PRO": 0.3586 + } + }, + { + "model_id": "Xclbr7/Hyena-12b", + "name": "Hyena-12b", + "developer": "Xclbr7", + "scores": { + "IFEval": 0.3404, + "BBH": 0.5457, + "MATH Level 5": 0.1133, + "GPQA": 0.2978, + "MUSR": 0.3984, + "MMLU-PRO": 0.3439 + } + }, + { + "model_id": "Xclbr7/caliburn-12b", + "name": "caliburn-12b", + "developer": "Xclbr7", + "scores": { + "IFEval": 0.3576, + "BBH": 0.5519, + "MATH Level 5": 0.1125, + "GPQA": 0.3364, + "MUSR": 0.4292, + "MMLU-PRO": 0.3675 + } + }, + { + "model_id": "Xclbr7/caliburn-v2-12b", + "name": "caliburn-v2-12b", + "developer": "Xclbr7", + "scores": { + "IFEval": 0.2967, + "BBH": 0.5141, + "MATH Level 5": 0.105, + "GPQA": 0.3263, + "MUSR": 0.437, + "MMLU-PRO": 0.3784 + } + }, + { + "model_id": "Xiaojian9992024/Llama3.2-1B-THREADRIPPER", + "name": "Llama3.2-1B-THREADRIPPER", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.5576, + "BBH": 0.3544, + "MATH Level 5": 0.074, + "GPQA": 0.2609, + "MUSR": 0.313, + "MMLU-PRO": 0.1763 + } + }, + { + "model_id": "Xiaojian9992024/Llama3.2-1B-THREADRIPPER-v0.2", + "name": "Llama3.2-1B-THREADRIPPER-v0.2", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.5318, + "BBH": 0.3528, + "MATH Level 5": 0.0657, + "GPQA": 0.2659, + "MUSR": 0.3316, + "MMLU-PRO": 0.1745 + } + }, + { + "model_id": "Xiaojian9992024/Phi-4-Megatron-Empathetic", + "name": "Phi-4-Megatron-Empathetic", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.0173, + "BBH": 0.6673, + "MATH Level 5": 0.2696, + "GPQA": 0.3859, + "MUSR": 0.5071, + "MMLU-PRO": 0.5082 + } + }, + { + "model_id": "Xiaojian9992024/Phi-4-mini-UNOFFICAL", + "name": "Phi-4-mini-UNOFFICAL", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.1273, + "BBH": 0.2944, + "MATH Level 5": 0.0, + "GPQA": 0.2408, + "MUSR": 0.3368, + "MMLU-PRO": 0.1144 + } + }, + { + "model_id": "Xiaojian9992024/Qwen2.5-7B-MS-Destroyer", + "name": "Qwen2.5-7B-MS-Destroyer", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.7296, + "BBH": 0.547, + "MATH Level 5": 0.4592, + "GPQA": 0.3045, + "MUSR": 0.427, + "MMLU-PRO": 0.4412 + } + }, + { + "model_id": "Xiaojian9992024/Qwen2.5-Dyanka-7B-Preview", + "name": "Qwen2.5-Dyanka-7B-Preview", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.764, + "BBH": 0.5543, + "MATH Level 5": 0.4879, + "GPQA": 0.3171, + "MUSR": 0.4481, + "MMLU-PRO": 0.4376 + } + }, + { + "model_id": "Xiaojian9992024/Qwen2.5-Dyanka-7B-Preview-v0.2", + "name": "Qwen2.5-Dyanka-7B-Preview-v0.2", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.6702, + "BBH": 0.5374, + "MATH Level 5": 0.4721, + "GPQA": 0.2936, + "MUSR": 0.4467, + "MMLU-PRO": 0.4371 + } + }, + { + "model_id": "Xiaojian9992024/Qwen2.5-THREADRIPPER-Medium-Censored", + "name": "Qwen2.5-THREADRIPPER-Medium-Censored", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.8112, + "BBH": 0.6431, + "MATH Level 5": 0.534, + "GPQA": 0.3347, + "MUSR": 0.414, + "MMLU-PRO": 0.4929 + } + }, + { + "model_id": "Xiaojian9992024/Qwen2.5-THREADRIPPER-Small", + "name": "Qwen2.5-THREADRIPPER-Small", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.7689, + "BBH": 0.549, + "MATH Level 5": 0.4736, + "GPQA": 0.3104, + "MUSR": 0.4349, + "MMLU-PRO": 0.4357 + } + }, + { + "model_id": "Xiaojian9992024/Qwen2.5-THREADRIPPER-Small-AnniversaryEdition", + "name": "Qwen2.5-THREADRIPPER-Small-AnniversaryEdition", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.7404, + "BBH": 0.5465, + "MATH Level 5": 0.5076, + "GPQA": 0.2685, + "MUSR": 0.3807, + "MMLU-PRO": 0.4393 + } + }, + { + "model_id": "Xiaojian9992024/Qwen2.5-Ultra-1.5B-25.02-Exp", + "name": "Qwen2.5-Ultra-1.5B-25.02-Exp", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.4073, + "BBH": 0.4066, + "MATH Level 5": 0.0831, + "GPQA": 0.2584, + "MUSR": 0.3383, + "MMLU-PRO": 0.2641 + } + }, + { + "model_id": "Xiaojian9992024/Reflection-L3.2-JametMiniMix-3B", + "name": "Reflection-L3.2-JametMiniMix-3B", + "developer": "Xiaojian9992024", + "scores": { + "IFEval": 0.4619, + "BBH": 0.439, + "MATH Level 5": 0.1193, + "GPQA": 0.2945, + "MUSR": 0.3667, + "MMLU-PRO": 0.2988 + } + }, + { + "model_id": "Xkev/Llama-3.2V-11B-cot", + "name": "Llama-3.2V-11B-cot", + "developer": "Xkev", + "scores": { + "IFEval": 0.4158, + "BBH": 0.4959, + "MATH Level 5": 0.1556, + "GPQA": 0.2953, + "MUSR": 0.4159, + "MMLU-PRO": 0.3587 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-1M-YOYO-V3", + "name": "Qwen2.5-14B-1M-YOYO-V3", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.8398, + "BBH": 0.6448, + "MATH Level 5": 0.5355, + "GPQA": 0.3289, + "MUSR": 0.4141, + "MMLU-PRO": 0.5207 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-0505", + "name": "Qwen2.5-14B-YOYO-0505", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5883, + "BBH": 0.6539, + "MATH Level 5": 0.4434, + "GPQA": 0.3733, + "MUSR": 0.4757, + "MMLU-PRO": 0.5371 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-0510-v2", + "name": "Qwen2.5-14B-YOYO-0510-v2", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5947, + "BBH": 0.6553, + "MATH Level 5": 0.4441, + "GPQA": 0.3817, + "MUSR": 0.4744, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-0805", + "name": "Qwen2.5-14B-YOYO-0805", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5883, + "BBH": 0.6539, + "MATH Level 5": 0.4434, + "GPQA": 0.3733, + "MUSR": 0.4757, + "MMLU-PRO": 0.5371 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-1005", + "name": "Qwen2.5-14B-YOYO-1005", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5972, + "BBH": 0.6542, + "MATH Level 5": 0.4524, + "GPQA": 0.3809, + "MUSR": 0.473, + "MMLU-PRO": 0.5382 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-1005-v2", + "name": "Qwen2.5-14B-YOYO-1005-v2", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5953, + "BBH": 0.6551, + "MATH Level 5": 0.4434, + "GPQA": 0.3842, + "MUSR": 0.4731, + "MMLU-PRO": 0.5372 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-1010", + "name": "Qwen2.5-14B-YOYO-1010", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.7905, + "BBH": 0.6406, + "MATH Level 5": 0.0, + "GPQA": 0.3163, + "MUSR": 0.4181, + "MMLU-PRO": 0.4944 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-1010-v2", + "name": "Qwen2.5-14B-YOYO-1010-v2", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5947, + "BBH": 0.6553, + "MATH Level 5": 0.4441, + "GPQA": 0.3817, + "MUSR": 0.4744, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-SCE", + "name": "Qwen2.5-14B-YOYO-SCE", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5844, + "BBH": 0.6489, + "MATH Level 5": 0.4615, + "GPQA": 0.3742, + "MUSR": 0.4704, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-V4", + "name": "Qwen2.5-14B-YOYO-V4", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.8398, + "BBH": 0.649, + "MATH Level 5": 0.5347, + "GPQA": 0.3221, + "MUSR": 0.4115, + "MMLU-PRO": 0.517 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-V4-p1", + "name": "Qwen2.5-14B-YOYO-V4-p1", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.8203, + "BBH": 0.6516, + "MATH Level 5": 0.5332, + "GPQA": 0.3456, + "MUSR": 0.4194, + "MMLU-PRO": 0.502 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-V4-p2", + "name": "Qwen2.5-14B-YOYO-V4-p2", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.8048, + "BBH": 0.6339, + "MATH Level 5": 0.5166, + "GPQA": 0.3272, + "MUSR": 0.4435, + "MMLU-PRO": 0.4968 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-latest", + "name": "Qwen2.5-14B-YOYO-latest", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5911, + "BBH": 0.6656, + "MATH Level 5": 0.4418, + "GPQA": 0.3826, + "MUSR": 0.4691, + "MMLU-PRO": 0.5371 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-YOYO-latest-V2", + "name": "Qwen2.5-14B-YOYO-latest-V2", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.7771, + "BBH": 0.6299, + "MATH Level 5": 0.5159, + "GPQA": 0.354, + "MUSR": 0.4299, + "MMLU-PRO": 0.5224 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-14B-it-restore", + "name": "Qwen2.5-14B-it-restore", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.8209, + "BBH": 0.6388, + "MATH Level 5": 0.537, + "GPQA": 0.3372, + "MUSR": 0.4087, + "MMLU-PRO": 0.49 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-7B-it-restore", + "name": "Qwen2.5-7B-it-restore", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.7531, + "BBH": 0.5407, + "MATH Level 5": 0.5, + "GPQA": 0.3012, + "MUSR": 0.4007, + "MMLU-PRO": 0.4288 + } + }, + { + "model_id": "YOYO-AI/Qwen2.5-Coder-14B-YOYO-1010", + "name": "Qwen2.5-Coder-14B-YOYO-1010", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5336, + "BBH": 0.6187, + "MATH Level 5": 0.3218, + "GPQA": 0.3523, + "MUSR": 0.4422, + "MMLU-PRO": 0.4075 + } + }, + { + "model_id": "YOYO-AI/ZYH-LLM-Qwen2.5-14B", + "name": "ZYH-LLM-Qwen2.5-14B", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5941, + "BBH": 0.6644, + "MATH Level 5": 0.4116, + "GPQA": 0.3859, + "MUSR": 0.4757, + "MMLU-PRO": 0.5351 + } + }, + { + "model_id": "YOYO-AI/ZYH-LLM-Qwen2.5-14B-V2", + "name": "ZYH-LLM-Qwen2.5-14B-V2", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.5071, + "BBH": 0.6452, + "MATH Level 5": 0.3542, + "GPQA": 0.3792, + "MUSR": 0.4689, + "MMLU-PRO": 0.5372 + } + }, + { + "model_id": "YOYO-AI/ZYH-LLM-Qwen2.5-14B-V3", + "name": "ZYH-LLM-Qwen2.5-14B-V3", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.8578, + "BBH": 0.6359, + "MATH Level 5": 0.5272, + "GPQA": 0.3322, + "MUSR": 0.4022, + "MMLU-PRO": 0.4881 + } + }, + { + "model_id": "YOYO-AI/ZYH-LLM-Qwen2.5-14B-V4", + "name": "ZYH-LLM-Qwen2.5-14B-V4", + "developer": "YOYO-AI", + "scores": { + "IFEval": 0.8365, + "BBH": 0.6515, + "MATH Level 5": 0.5393, + "GPQA": 0.3146, + "MUSR": 0.4434, + "MMLU-PRO": 0.5204 + } + }, + { + "model_id": "Yash21/TinyYi-7B-Test", + "name": "TinyYi-7B-Test", + "developer": "Yash21", + "scores": { + "IFEval": 0.1856, + "BBH": 0.291, + "MATH Level 5": 0.0, + "GPQA": 0.2643, + "MUSR": 0.3364, + "MMLU-PRO": 0.1091 + } + }, + { + "model_id": "Youlln/1PARAMMYL-8B-ModelStock", + "name": "1PARAMMYL-8B-ModelStock", + "developer": "Youlln", + "scores": { + "IFEval": 0.5371, + "BBH": 0.5216, + "MATH Level 5": 0.1488, + "GPQA": 0.3238, + "MUSR": 0.4409, + "MMLU-PRO": 0.4 + } + }, + { + "model_id": "Youlln/2PRYMMAL-Yi1.5-6B-SLERP", + "name": "2PRYMMAL-Yi1.5-6B-SLERP", + "developer": "Youlln", + "scores": { + "IFEval": 0.2826, + "BBH": 0.4665, + "MATH Level 5": 0.1133, + "GPQA": 0.307, + "MUSR": 0.4756, + "MMLU-PRO": 0.317 + } + }, + { + "model_id": "Youlln/3PRYMMAL-PHI3-3B-SLERP", + "name": "3PRYMMAL-PHI3-3B-SLERP", + "developer": "Youlln", + "scores": { + "IFEval": 0.3656, + "BBH": 0.5422, + "MATH Level 5": 0.1715, + "GPQA": 0.3263, + "MUSR": 0.4648, + "MMLU-PRO": 0.4002 + } + }, + { + "model_id": "Youlln/4PRYMMAL-GEMMA2-9B-SLERP", + "name": "4PRYMMAL-GEMMA2-9B-SLERP", + "developer": "Youlln", + "scores": { + "IFEval": 0.2714, + "BBH": 0.5923, + "MATH Level 5": 0.0906, + "GPQA": 0.3305, + "MUSR": 0.4672, + "MMLU-PRO": 0.421 + } + }, + { + "model_id": "Youlln/ECE-MIRAGE-1-12B", + "name": "ECE-MIRAGE-1-12B", + "developer": "Youlln", + "scores": { + "IFEval": 0.207, + "BBH": 0.3011, + "MATH Level 5": 0.0, + "GPQA": 0.2634, + "MUSR": 0.3219, + "MMLU-PRO": 0.111 + } + }, + { + "model_id": "Youlln/ECE-MIRAGE-1-15B", + "name": "ECE-MIRAGE-1-15B", + "developer": "Youlln", + "scores": { + "IFEval": 0.207, + "BBH": 0.3011, + "MATH Level 5": 0.0, + "GPQA": 0.2634, + "MUSR": 0.3219, + "MMLU-PRO": 0.111 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-0.5B-FT-V3", + "name": "ECE-PRYMMAL-0.5B-FT-V3", + "developer": "Youlln", + "scores": { + "IFEval": 0.1642, + "BBH": 0.3093, + "MATH Level 5": 0.003, + "GPQA": 0.2576, + "MUSR": 0.3644, + "MMLU-PRO": 0.1161 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-0.5B-FT-V3-MUSR", + "name": "ECE-PRYMMAL-0.5B-FT-V3-MUSR", + "developer": "Youlln", + "scores": { + "IFEval": 0.1533, + "BBH": 0.3041, + "MATH Level 5": 0.0242, + "GPQA": 0.2492, + "MUSR": 0.366, + "MMLU-PRO": 0.1645 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-0.5B-FT-V4-MUSR", + "name": "ECE-PRYMMAL-0.5B-FT-V4-MUSR", + "developer": "Youlln", + "scores": { + "IFEval": 0.1138, + "BBH": 0.3038, + "MATH Level 5": 0.0121, + "GPQA": 0.2701, + "MUSR": 0.3529, + "MMLU-PRO": 0.1321 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-0.5B-SLERP-V2", + "name": "ECE-PRYMMAL-0.5B-SLERP-V2", + "developer": "Youlln", + "scores": { + "IFEval": 0.1612, + "BBH": 0.2935, + "MATH Level 5": 0.0008, + "GPQA": 0.2743, + "MUSR": 0.3831, + "MMLU-PRO": 0.1095 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-0.5B-SLERP-V3", + "name": "ECE-PRYMMAL-0.5B-SLERP-V3", + "developer": "Youlln", + "scores": { + "IFEval": 0.167, + "BBH": 0.2938, + "MATH Level 5": 0.0, + "GPQA": 0.2517, + "MUSR": 0.3541, + "MMLU-PRO": 0.1087 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-YL-1B-SLERP-V1", + "name": "ECE-PRYMMAL-YL-1B-SLERP-V1", + "developer": "Youlln", + "scores": { + "IFEval": 0.3251, + "BBH": 0.4209, + "MATH Level 5": 0.1073, + "GPQA": 0.2911, + "MUSR": 0.4266, + "MMLU-PRO": 0.2936 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-YL-1B-SLERP-V2", + "name": "ECE-PRYMMAL-YL-1B-SLERP-V2", + "developer": "Youlln", + "scores": { + "IFEval": 0.3251, + "BBH": 0.4209, + "MATH Level 5": 0.1073, + "GPQA": 0.2911, + "MUSR": 0.4266, + "MMLU-PRO": 0.2936 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL-YL-7B-SLERP-V4", + "name": "ECE-PRYMMAL-YL-7B-SLERP-V4", + "developer": "Youlln", + "scores": { + "IFEval": 0.251, + "BBH": 0.377, + "MATH Level 5": 0.0536, + "GPQA": 0.2651, + "MUSR": 0.3745, + "MMLU-PRO": 0.2132 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL0.5-FT", + "name": "ECE-PRYMMAL0.5-FT", + "developer": "Youlln", + "scores": { + "IFEval": 0.1851, + "BBH": 0.3132, + "MATH Level 5": 0.0234, + "GPQA": 0.2559, + "MUSR": 0.3301, + "MMLU-PRO": 0.1477 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL0.5B-Youri", + "name": "ECE-PRYMMAL0.5B-Youri", + "developer": "Youlln", + "scores": { + "IFEval": 0.1446, + "BBH": 0.2817, + "MATH Level 5": 0.0, + "GPQA": 0.2433, + "MUSR": 0.3697, + "MMLU-PRO": 0.1095 + } + }, + { + "model_id": "Youlln/ECE-PRYMMAL1B-FT-V1", + "name": "ECE-PRYMMAL1B-FT-V1", + "developer": "Youlln", + "scores": { + "IFEval": 0.2144, + "BBH": 0.4033, + "MATH Level 5": 0.0642, + "GPQA": 0.2785, + "MUSR": 0.3417, + "MMLU-PRO": 0.2743 + } + }, + { + "model_id": "Youlln/ECE-Qwen0.5B-FT-V2", + "name": "ECE-Qwen0.5B-FT-V2", + "developer": "Youlln", + "scores": { + "IFEval": 0.2526, + "BBH": 0.329, + "MATH Level 5": 0.0204, + "GPQA": 0.2668, + "MUSR": 0.3063, + "MMLU-PRO": 0.1666 + } + }, + { + "model_id": "Youlln/ECE.EIFFEIL.ia-0.5B-SLERP", + "name": "ECE.EIFFEIL.ia-0.5B-SLERP", + "developer": "Youlln", + "scores": { + "IFEval": 0.2561, + "BBH": 0.3306, + "MATH Level 5": 0.0597, + "GPQA": 0.2651, + "MUSR": 0.3102, + "MMLU-PRO": 0.1903 + } + }, + { + "model_id": "YoungPanda/qwenqwen", + "name": "qwenqwen", + "developer": "YoungPanda", + "scores": { + "IFEval": 0.1264, + "BBH": 0.3379, + "MATH Level 5": 0.0355, + "GPQA": 0.25, + "MUSR": 0.3434, + "MMLU-PRO": 0.1168 + } + }, + { + "model_id": "Yuma42/KangalKhan-RawRuby-7B", + "name": "KangalKhan-RawRuby-7B", + "developer": "Yuma42", + "scores": { + "IFEval": 0.5477, + "BBH": 0.4755, + "MATH Level 5": 0.0665, + "GPQA": 0.2878, + "MUSR": 0.395, + "MMLU-PRO": 0.3023 + } + }, + { + "model_id": "Yuma42/Llama3.1-IgneousIguana-8B", + "name": "Llama3.1-IgneousIguana-8B", + "developer": "Yuma42", + "scores": { + "IFEval": 0.8133, + "BBH": 0.5191, + "MATH Level 5": 0.2198, + "GPQA": 0.3104, + "MUSR": 0.4203, + "MMLU-PRO": 0.3974 + } + }, + { + "model_id": "Yuma42/Llama3.1-SuperHawk-8B", + "name": "Llama3.1-SuperHawk-8B", + "developer": "Yuma42", + "scores": { + "IFEval": 0.7986, + "BBH": 0.52, + "MATH Level 5": 0.2349, + "GPQA": 0.3129, + "MUSR": 0.4084, + "MMLU-PRO": 0.3945 + } + }, + { + "model_id": "Z1-Coder/Z1-Coder-7B", + "name": "Z1-Coder-7B", + "developer": "Z1-Coder", + "scores": { + "IFEval": 0.3215, + "BBH": 0.4842, + "MATH Level 5": 0.3248, + "GPQA": 0.2727, + "MUSR": 0.3622, + "MMLU-PRO": 0.3759 + } + }, + { + "model_id": "ZHLiu627/zephyr-7b-gemma-dpo-avg", + "name": "zephyr-7b-gemma-dpo-avg", + "developer": "ZHLiu627", + "scores": { + "IFEval": 0.309, + "BBH": 0.4149, + "MATH Level 5": 0.0453, + "GPQA": 0.2785, + "MUSR": 0.4107, + "MMLU-PRO": 0.2851 + } + }, + { + "model_id": "ZHLiu627/zephyr-7b-gemma-rpo-avg", + "name": "zephyr-7b-gemma-rpo-avg", + "developer": "ZHLiu627", + "scores": { + "IFEval": 0.3006, + "BBH": 0.4183, + "MATH Level 5": 0.0498, + "GPQA": 0.2768, + "MUSR": 0.4081, + "MMLU-PRO": 0.2831 + } + }, + { + "model_id": "ZeroXClem/L3-Aspire-Heart-Matrix-8B", + "name": "L3-Aspire-Heart-Matrix-8B", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.4834, + "BBH": 0.5384, + "MATH Level 5": 0.1828, + "GPQA": 0.3247, + "MUSR": 0.4187, + "MMLU-PRO": 0.3785 + } + }, + { + "model_id": "ZeroXClem/Llama-3.1-8B-AthenaSky-MegaMix", + "name": "Llama-3.1-8B-AthenaSky-MegaMix", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.6301, + "BBH": 0.5163, + "MATH Level 5": 0.2795, + "GPQA": 0.2777, + "MUSR": 0.3538, + "MMLU-PRO": 0.3504 + } + }, + { + "model_id": "ZeroXClem/Llama-3.1-8B-RainbowLight-EtherealMix", + "name": "Llama-3.1-8B-RainbowLight-EtherealMix", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.4973, + "BBH": 0.5155, + "MATH Level 5": 0.1216, + "GPQA": 0.2869, + "MUSR": 0.3947, + "MMLU-PRO": 0.363 + } + }, + { + "model_id": "ZeroXClem/Llama-3.1-8B-SpecialTitanFusion", + "name": "Llama-3.1-8B-SpecialTitanFusion", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.7402, + "BBH": 0.5439, + "MATH Level 5": 0.2334, + "GPQA": 0.2995, + "MUSR": 0.3874, + "MMLU-PRO": 0.3621 + } + }, + { + "model_id": "ZeroXClem/Llama-3.1-8B-SuperNova-EtherealHermes", + "name": "Llama-3.1-8B-SuperNova-EtherealHermes", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.7339, + "BBH": 0.5244, + "MATH Level 5": 0.1745, + "GPQA": 0.2928, + "MUSR": 0.4066, + "MMLU-PRO": 0.3745 + } + }, + { + "model_id": "ZeroXClem/Llama-3.1-8B-SuperTulu-LexiNova", + "name": "Llama-3.1-8B-SuperTulu-LexiNova", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.4165, + "BBH": 0.5079, + "MATH Level 5": 0.253, + "GPQA": 0.2861, + "MUSR": 0.3971, + "MMLU-PRO": 0.3368 + } + }, + { + "model_id": "ZeroXClem/Qwen-2.5-Aether-SlerpFusion-7B", + "name": "Qwen-2.5-Aether-SlerpFusion-7B", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.6262, + "BBH": 0.5462, + "MATH Level 5": 0.2734, + "GPQA": 0.2987, + "MUSR": 0.4178, + "MMLU-PRO": 0.4327 + } + }, + { + "model_id": "ZeroXClem/Qwen2.5-7B-CelestialHarmony-1M", + "name": "Qwen2.5-7B-CelestialHarmony-1M", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.5944, + "BBH": 0.5431, + "MATH Level 5": 0.3474, + "GPQA": 0.3188, + "MUSR": 0.4595, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "ZeroXClem/Qwen2.5-7B-HomerAnvita-NerdMix", + "name": "Qwen2.5-7B-HomerAnvita-NerdMix", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.7708, + "BBH": 0.5541, + "MATH Level 5": 0.3837, + "GPQA": 0.3196, + "MUSR": 0.4391, + "MMLU-PRO": 0.4432 + } + }, + { + "model_id": "ZeroXClem/Qwen2.5-7B-HomerCreative-Mix", + "name": "Qwen2.5-7B-HomerCreative-Mix", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.7835, + "BBH": 0.5548, + "MATH Level 5": 0.3565, + "GPQA": 0.2995, + "MUSR": 0.435, + "MMLU-PRO": 0.4447 + } + }, + { + "model_id": "ZeroXClem/Qwen2.5-7B-Qandora-CySec", + "name": "Qwen2.5-7B-Qandora-CySec", + "developer": "ZeroXClem", + "scores": { + "IFEval": 0.6773, + "BBH": 0.549, + "MATH Level 5": 0.2931, + "GPQA": 0.3003, + "MUSR": 0.4286, + "MMLU-PRO": 0.4485 + } + }, + { + "model_id": "ZeusLabs/L3-Aethora-15B-V2", + "name": "L3-Aethora-15B-V2", + "developer": "ZeusLabs", + "scores": { + "IFEval": 0.7208, + "BBH": 0.5011, + "MATH Level 5": 0.0808, + "GPQA": 0.2878, + "MUSR": 0.3871, + "MMLU-PRO": 0.35 + } + }, + { + "model_id": "ZhangShenao/SELM-Llama-3-8B-Instruct-iter-3", + "name": "SELM-Llama-3-8B-Instruct-iter-3", + "developer": "ZhangShenao", + "scores": { + "IFEval": 0.6903, + "BBH": 0.5046, + "MATH Level 5": 0.0861, + "GPQA": 0.2584, + "MUSR": 0.3845, + "MMLU-PRO": 0.3783 + } + }, + { + "model_id": "aaditya/Llama3-OpenBioLLM-70B", + "name": "Llama3-OpenBioLLM-70B", + "developer": "aaditya", + "scores": { + "IFEval": 0.7597, + "BBH": 0.6399, + "MATH Level 5": 0.1971, + "GPQA": 0.323, + "MUSR": 0.4417, + "MMLU-PRO": 0.4867 + } + }, + { + "model_id": "abacusai/Dracarys-72B-Instruct", + "name": "Dracarys-72B-Instruct", + "developer": "abacusai", + "scores": { + "IFEval": 0.7856, + "BBH": 0.6944, + "MATH Level 5": 0.3965, + "GPQA": 0.3909, + "MUSR": 0.4558, + "MMLU-PRO": 0.5456 + } + }, + { + "model_id": "abacusai/Liberated-Qwen1.5-14B", + "name": "Liberated-Qwen1.5-14B", + "developer": "abacusai", + "scores": { + "IFEval": 0.3631, + "BBH": 0.4948, + "MATH Level 5": 0.1601, + "GPQA": 0.2836, + "MUSR": 0.4175, + "MMLU-PRO": 0.3512 + } + }, + { + "model_id": "abacusai/Llama-3-Smaug-8B", + "name": "Llama-3-Smaug-8B", + "developer": "abacusai", + "scores": { + "IFEval": 0.4867, + "BBH": 0.4931, + "MATH Level 5": 0.0853, + "GPQA": 0.2483, + "MUSR": 0.3622, + "MMLU-PRO": 0.3185 + } + }, + { + "model_id": "abacusai/Smaug-34B-v0.1", + "name": "Smaug-34B-v0.1", + "developer": "abacusai", + "scores": { + "IFEval": 0.5016, + "BBH": 0.5358, + "MATH Level 5": 0.0718, + "GPQA": 0.3297, + "MUSR": 0.3979, + "MMLU-PRO": 0.4543 + } + }, + { + "model_id": "abacusai/Smaug-72B-v0.1", + "name": "Smaug-72B-v0.1", + "developer": "abacusai", + "scores": { + "IFEval": 0.5167, + "BBH": 0.5996, + "MATH Level 5": 0.1911, + "GPQA": 0.3238, + "MUSR": 0.4473, + "MMLU-PRO": 0.4624 + } + }, + { + "model_id": "abacusai/Smaug-Llama-3-70B-Instruct-32K", + "name": "Smaug-Llama-3-70B-Instruct-32K", + "developer": "abacusai", + "scores": { + "IFEval": 0.7761, + "BBH": 0.6493, + "MATH Level 5": 0.2749, + "GPQA": 0.2961, + "MUSR": 0.4208, + "MMLU-PRO": 0.4765 + } + }, + { + "model_id": "abacusai/Smaug-Mixtral-v0.1", + "name": "Smaug-Mixtral-v0.1", + "developer": "abacusai", + "scores": { + "IFEval": 0.5554, + "BBH": 0.5162, + "MATH Level 5": 0.0952, + "GPQA": 0.3012, + "MUSR": 0.4298, + "MMLU-PRO": 0.3352 + } + }, + { + "model_id": "abacusai/Smaug-Qwen2-72B-Instruct", + "name": "Smaug-Qwen2-72B-Instruct", + "developer": "abacusai", + "scores": { + "IFEval": 0.7825, + "BBH": 0.691, + "MATH Level 5": 0.4131, + "GPQA": 0.3616, + "MUSR": 0.4401, + "MMLU-PRO": 0.519 + } + }, + { + "model_id": "abacusai/bigstral-12b-32k", + "name": "bigstral-12b-32k", + "developer": "abacusai", + "scores": { + "IFEval": 0.4194, + "BBH": 0.47, + "MATH Level 5": 0.0151, + "GPQA": 0.2928, + "MUSR": 0.456, + "MMLU-PRO": 0.2641 + } + }, + { + "model_id": "abacusai/bigyi-15b", + "name": "bigyi-15b", + "developer": "abacusai", + "scores": { + "IFEval": 0.2094, + "BBH": 0.4345, + "MATH Level 5": 0.0295, + "GPQA": 0.3096, + "MUSR": 0.3538, + "MMLU-PRO": 0.3003 + } + }, + { + "model_id": "abhishek/autotrain-0tmgq-5tpbg", + "name": "autotrain-0tmgq-5tpbg", + "developer": "abhishek", + "scores": { + "IFEval": 0.1957, + "BBH": 0.3135, + "MATH Level 5": 0.0, + "GPQA": 0.2517, + "MUSR": 0.365, + "MMLU-PRO": 0.1151 + } + }, + { + "model_id": "abhishek/autotrain-llama3-70b-orpo-v1", + "name": "autotrain-llama3-70b-orpo-v1", + "developer": "abhishek", + "scores": { + "IFEval": 0.4233, + "BBH": 0.5998, + "MATH Level 5": 0.0106, + "GPQA": 0.2441, + "MUSR": 0.3579, + "MMLU-PRO": 0.1122 + } + }, + { + "model_id": "abhishek/autotrain-llama3-70b-orpo-v2", + "name": "autotrain-llama3-70b-orpo-v2", + "developer": "abhishek", + "scores": { + "IFEval": 0.5406, + "BBH": 0.5899, + "MATH Level 5": 0.2107, + "GPQA": 0.2936, + "MUSR": 0.4113, + "MMLU-PRO": 0.4818 + } + }, + { + "model_id": "abhishek/autotrain-llama3-orpo-v2", + "name": "autotrain-llama3-orpo-v2", + "developer": "abhishek", + "scores": { + "IFEval": 0.4372, + "BBH": 0.3159, + "MATH Level 5": 0.0468, + "GPQA": 0.2668, + "MUSR": 0.3792, + "MMLU-PRO": 0.2218 + } + }, + { + "model_id": "abhishek/autotrain-vr4a1-e5mms", + "name": "autotrain-vr4a1-e5mms", + "developer": "abhishek", + "scores": { + "IFEval": 0.2142, + "BBH": 0.5001, + "MATH Level 5": 0.1412, + "GPQA": 0.3196, + "MUSR": 0.3891, + "MMLU-PRO": 0.3667 + } + }, + { + "model_id": "abideen/MedPhi-4-14B-v1", + "name": "MedPhi-4-14B-v1", + "developer": "abideen", + "scores": { + "IFEval": 0.6277, + "BBH": 0.6897, + "MATH Level 5": 0.2931, + "GPQA": 0.344, + "MUSR": 0.4155, + "MMLU-PRO": 0.5338 + } + }, + { + "model_id": "adamo1139/Yi-34B-200K-AEZAKMI-v2", + "name": "Yi-34B-200K-AEZAKMI-v2", + "developer": "adamo1139", + "scores": { + "IFEval": 0.4555, + "BBH": 0.5384, + "MATH Level 5": 0.0566, + "GPQA": 0.3322, + "MUSR": 0.3886, + "MMLU-PRO": 0.4513 + } + }, + { + "model_id": "adriszmar/QAIMath-Qwen2.5-7B-TIES", + "name": "QAIMath-Qwen2.5-7B-TIES", + "developer": "adriszmar", + "scores": { + "IFEval": 0.1685, + "BBH": 0.3124, + "MATH Level 5": 0.0015, + "GPQA": 0.2492, + "MUSR": 0.3963, + "MMLU-PRO": 0.1066 + } + }, + { + "model_id": "aevalone/distill_qw_test", + "name": "distill_qw_test", + "developer": "aevalone", + "scores": { + "IFEval": 0.7409, + "BBH": 0.5246, + "MATH Level 5": 0.4781, + "GPQA": 0.3003, + "MUSR": 0.386, + "MMLU-PRO": 0.4092 + } + }, + { + "model_id": "agentlans/Gemma2-9B-AdvancedFuse", + "name": "Gemma2-9B-AdvancedFuse", + "developer": "agentlans", + "scores": { + "IFEval": 0.1543, + "BBH": 0.5859, + "MATH Level 5": 0.1005, + "GPQA": 0.3347, + "MUSR": 0.4231, + "MMLU-PRO": 0.4 + } + }, + { + "model_id": "agentlans/Llama-3.2-1B-Instruct-CrashCourse12K", + "name": "Llama-3.2-1B-Instruct-CrashCourse12K", + "developer": "agentlans", + "scores": { + "IFEval": 0.5395, + "BBH": 0.3548, + "MATH Level 5": 0.071, + "GPQA": 0.2408, + "MUSR": 0.321, + "MMLU-PRO": 0.1809 + } + }, + { + "model_id": "agentlans/Llama3.1-8B-drill", + "name": "Llama3.1-8B-drill", + "developer": "agentlans", + "scores": { + "IFEval": 0.7652, + "BBH": 0.5016, + "MATH Level 5": 0.1715, + "GPQA": 0.2676, + "MUSR": 0.3672, + "MMLU-PRO": 0.3776 + } + }, + { + "model_id": "agentlans/Llama3.1-Daredevilish", + "name": "Llama3.1-Daredevilish", + "developer": "agentlans", + "scores": { + "IFEval": 0.6292, + "BBH": 0.5013, + "MATH Level 5": 0.1292, + "GPQA": 0.3012, + "MUSR": 0.4091, + "MMLU-PRO": 0.3697 + } + }, + { + "model_id": "agentlans/Llama3.1-Daredevilish-Instruct", + "name": "Llama3.1-Daredevilish-Instruct", + "developer": "agentlans", + "scores": { + "IFEval": 0.7926, + "BBH": 0.5235, + "MATH Level 5": 0.1722, + "GPQA": 0.307, + "MUSR": 0.3911, + "MMLU-PRO": 0.3877 + } + }, + { + "model_id": "agentlans/Llama3.1-LexiHermes-SuperStorm", + "name": "Llama3.1-LexiHermes-SuperStorm", + "developer": "agentlans", + "scores": { + "IFEval": 0.7835, + "BBH": 0.5266, + "MATH Level 5": 0.1616, + "GPQA": 0.323, + "MUSR": 0.3963, + "MMLU-PRO": 0.3844 + } + }, + { + "model_id": "agentlans/Llama3.1-SuperDeepFuse", + "name": "Llama3.1-SuperDeepFuse", + "developer": "agentlans", + "scores": { + "IFEval": 0.7762, + "BBH": 0.5049, + "MATH Level 5": 0.1828, + "GPQA": 0.2743, + "MUSR": 0.3699, + "MMLU-PRO": 0.3775 + } + }, + { + "model_id": "agentlans/Llama3.1-SuperDeepFuse-CrashCourse12K", + "name": "Llama3.1-SuperDeepFuse-CrashCourse12K", + "developer": "agentlans", + "scores": { + "IFEval": 0.7187, + "BBH": 0.5216, + "MATH Level 5": 0.1805, + "GPQA": 0.3129, + "MUSR": 0.4026, + "MMLU-PRO": 0.3631 + } + }, + { + "model_id": "agentlans/Qwen2.5-0.5B-Instruct-CrashCourse-dropout", + "name": "Qwen2.5-0.5B-Instruct-CrashCourse-dropout", + "developer": "agentlans", + "scores": { + "IFEval": 0.2949, + "BBH": 0.3312, + "MATH Level 5": 0.0423, + "GPQA": 0.2634, + "MUSR": 0.3342, + "MMLU-PRO": 0.1608 + } + }, + { + "model_id": "ahmeda335/13_outOf_32_pruned_layers_llama3.1-8b", + "name": "13_outOf_32_pruned_layers_llama3.1-8b", + "developer": "ahmeda335", + "scores": { + "IFEval": 0.1748, + "BBH": 0.2883, + "MATH Level 5": 0.0, + "GPQA": 0.2592, + "MUSR": 0.3803, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "ai21labs/Jamba-v0.1", + "name": "Jamba-v0.1", + "developer": "ai21labs", + "scores": { + "IFEval": 0.2026, + "BBH": 0.3602, + "MATH Level 5": 0.0159, + "GPQA": 0.2685, + "MUSR": 0.359, + "MMLU-PRO": 0.2492 + } + }, + { + "model_id": "ai4bharat/Airavata", + "name": "Airavata", + "developer": "ai4bharat", + "scores": { + "IFEval": 0.0559, + "BBH": 0.3628, + "MATH Level 5": 0.0181, + "GPQA": 0.2743, + "MUSR": 0.3763, + "MMLU-PRO": 0.1635 + } + }, + { + "model_id": "aixonlab/Aether-12b", + "name": "Aether-12b", + "developer": "aixonlab", + "scores": { + "IFEval": 0.2347, + "BBH": 0.5179, + "MATH Level 5": 0.1065, + "GPQA": 0.3163, + "MUSR": 0.3829, + "MMLU-PRO": 0.341 + } + }, + { + "model_id": "aixonlab/Grey-12b", + "name": "Grey-12b", + "developer": "aixonlab", + "scores": { + "IFEval": 0.3968, + "BBH": 0.5699, + "MATH Level 5": 0.0982, + "GPQA": 0.3003, + "MUSR": 0.4516, + "MMLU-PRO": 0.3779 + } + }, + { + "model_id": "aixonlab/Zara-14b-v1.2", + "name": "Zara-14b-v1.2", + "developer": "aixonlab", + "scores": { + "IFEval": 0.6197, + "BBH": 0.6405, + "MATH Level 5": 0.3535, + "GPQA": 0.3817, + "MUSR": 0.4675, + "MMLU-PRO": 0.5263 + } + }, + { + "model_id": "akhadangi/Llama3.2.1B.0.01-First", + "name": "Llama3.2.1B.0.01-First", + "developer": "akhadangi", + "scores": { + "IFEval": 0.0814, + "BBH": 0.3189, + "MATH Level 5": 0.0181, + "GPQA": 0.2483, + "MUSR": 0.3194, + "MMLU-PRO": 0.1197 + } + }, + { + "model_id": "akhadangi/Llama3.2.1B.0.01-Last", + "name": "Llama3.2.1B.0.01-Last", + "developer": "akhadangi", + "scores": { + "IFEval": 0.0917, + "BBH": 0.3159, + "MATH Level 5": 0.0136, + "GPQA": 0.2433, + "MUSR": 0.3206, + "MMLU-PRO": 0.1227 + } + }, + { + "model_id": "akhadangi/Llama3.2.1B.0.1-First", + "name": "Llama3.2.1B.0.1-First", + "developer": "akhadangi", + "scores": { + "IFEval": 0.1001, + "BBH": 0.312, + "MATH Level 5": 0.0211, + "GPQA": 0.245, + "MUSR": 0.3301, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "akhadangi/Llama3.2.1B.0.1-Last", + "name": "Llama3.2.1B.0.1-Last", + "developer": "akhadangi", + "scores": { + "IFEval": 0.095, + "BBH": 0.3164, + "MATH Level 5": 0.0211, + "GPQA": 0.2383, + "MUSR": 0.3341, + "MMLU-PRO": 0.1178 + } + }, + { + "model_id": "akhadangi/Llama3.2.1B.BaseFiT", + "name": "Llama3.2.1B.BaseFiT", + "developer": "akhadangi", + "scores": { + "IFEval": 0.0883, + "BBH": 0.3175, + "MATH Level 5": 0.0242, + "GPQA": 0.2534, + "MUSR": 0.3221, + "MMLU-PRO": 0.1172 + } + }, + { + "model_id": "akjindal53244/Llama-3.1-Storm-8B", + "name": "Llama-3.1-Storm-8B", + "developer": "akjindal53244", + "scores": { + "IFEval": 0.8033, + "BBH": 0.5196, + "MATH Level 5": 0.1624, + "GPQA": 0.3096, + "MUSR": 0.4028, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "alcholjung/llama3_medical_tuned", + "name": "llama3_medical_tuned", + "developer": "alcholjung", + "scores": { + "IFEval": 0.0106, + "BBH": 0.4513, + "MATH Level 5": 0.0468, + "GPQA": 0.2861, + "MUSR": 0.466, + "MMLU-PRO": 0.2946 + } + }, + { + "model_id": "allenai/Llama-3.1-Tulu-3-70B", + "name": "Llama-3.1-Tulu-3-70B", + "developer": "allenai", + "scores": { + "IFEval": 0.8379, + "BBH": 0.6157, + "MATH Level 5": 0.3829, + "GPQA": 0.3733, + "MUSR": 0.4988, + "MMLU-PRO": 0.4656 + } + }, + { + "model_id": "allenai/Llama-3.1-Tulu-3-70B-DPO", + "name": "Llama-3.1-Tulu-3-70B-DPO", + "developer": "allenai", + "scores": { + "IFEval": 0.8282, + "BBH": 0.6146, + "MATH Level 5": 0.4494, + "GPQA": 0.3758, + "MUSR": 0.4923, + "MMLU-PRO": 0.4633 + } + }, + { + "model_id": "allenai/Llama-3.1-Tulu-3-70B-SFT", + "name": "Llama-3.1-Tulu-3-70B-SFT", + "developer": "allenai", + "scores": { + "IFEval": 0.8051, + "BBH": 0.5951, + "MATH Level 5": 0.3316, + "GPQA": 0.3448, + "MUSR": 0.5026, + "MMLU-PRO": 0.4624 + } + }, + { + "model_id": "allenai/Llama-3.1-Tulu-3-8B", + "name": "Llama-3.1-Tulu-3-8B", + "developer": "allenai", + "scores": { + "IFEval": 0.8267, + "BBH": 0.405, + "MATH Level 5": 0.1964, + "GPQA": 0.2987, + "MUSR": 0.4175, + "MMLU-PRO": 0.2827 + } + }, + { + "model_id": "allenai/Llama-3.1-Tulu-3-8B-DPO", + "name": "Llama-3.1-Tulu-3-8B-DPO", + "developer": "allenai", + "scores": { + "IFEval": 0.8029, + "BBH": 0.4079, + "MATH Level 5": 0.2364, + "GPQA": 0.2936, + "MUSR": 0.4161, + "MMLU-PRO": 0.2898 + } + }, + { + "model_id": "allenai/Llama-3.1-Tulu-3-8B-RM", + "name": "Llama-3.1-Tulu-3-8B-RM", + "developer": "allenai", + "scores": { + "IFEval": 0.167, + "BBH": 0.295, + "MATH Level 5": 0.0, + "GPQA": 0.2567, + "MUSR": 0.3764, + "MMLU-PRO": 0.1082 + } + }, + { + "model_id": "allenai/Llama-3.1-Tulu-3-8B-SFT", + "name": "Llama-3.1-Tulu-3-8B-SFT", + "developer": "allenai", + "scores": { + "IFEval": 0.7403, + "BBH": 0.3872, + "MATH Level 5": 0.1178, + "GPQA": 0.2777, + "MUSR": 0.4268, + "MMLU-PRO": 0.2812 + } + }, + { + "model_id": "allenai/OLMo-1.7-7B-hf", + "name": "OLMo-1.7-7B-hf", + "developer": "allenai", + "scores": { + "IFEval": 0.1569, + "BBH": 0.3014, + "MATH Level 5": 0.0023, + "GPQA": 0.255, + "MUSR": 0.3475, + "MMLU-PRO": 0.1124 + } + }, + { + "model_id": "allenai/OLMo-1B-hf", + "name": "OLMo-1B-hf", + "developer": "allenai", + "scores": { + "IFEval": 0.2182, + "BBH": 0.3052, + "MATH Level 5": 0.0174, + "GPQA": 0.2617, + "MUSR": 0.4098, + "MMLU-PRO": 0.1174 + } + }, + { + "model_id": "allenai/OLMo-2-1124-7B-Instruct", + "name": "OLMo-2-1124-7B-Instruct", + "developer": "allenai", + "scores": { + "IFEval": 0.7244, + "BBH": 0.4022, + "MATH Level 5": 0.1488, + "GPQA": 0.2785, + "MUSR": 0.3508, + "MMLU-PRO": 0.2672 + } + }, + { + "model_id": "allenai/OLMo-7B-Instruct-hf", + "name": "OLMo-7B-Instruct-hf", + "developer": "allenai", + "scores": { + "IFEval": 0.3473, + "BBH": 0.3706, + "MATH Level 5": 0.0136, + "GPQA": 0.271, + "MUSR": 0.3765, + "MMLU-PRO": 0.1785 + } + }, + { + "model_id": "allenai/OLMo-7B-hf", + "name": "OLMo-7B-hf", + "developer": "allenai", + "scores": { + "IFEval": 0.2719, + "BBH": 0.3279, + "MATH Level 5": 0.0121, + "GPQA": 0.2727, + "MUSR": 0.3487, + "MMLU-PRO": 0.1173 + } + }, + { + "model_id": "allenai/OLMoE-1B-7B-0125-Instruct", + "name": "OLMoE-1B-7B-0125-Instruct", + "developer": "allenai", + "scores": { + "IFEval": 0.6757, + "BBH": 0.3825, + "MATH Level 5": 0.0899, + "GPQA": 0.2601, + "MUSR": 0.3636, + "MMLU-PRO": 0.1915 + } + }, + { + "model_id": "allenai/OLMoE-1B-7B-0924", + "name": "OLMoE-1B-7B-0924", + "developer": "allenai", + "scores": { + "IFEval": 0.2185, + "BBH": 0.3393, + "MATH Level 5": 0.0166, + "GPQA": 0.2475, + "MUSR": 0.3488, + "MMLU-PRO": 0.174 + } + }, + { + "model_id": "allenai/OLMoE-1B-7B-0924-Instruct", + "name": "OLMoE-1B-7B-0924-Instruct", + "developer": "allenai", + "scores": { + "IFEval": 0.4667, + "BBH": 0.3902, + "MATH Level 5": 0.0279, + "GPQA": 0.2676, + "MUSR": 0.3848, + "MMLU-PRO": 0.1876 + } + }, + { + "model_id": "allknowingroger/Chocolatine-24B", + "name": "Chocolatine-24B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1958, + "BBH": 0.6191, + "MATH Level 5": 0.0008, + "GPQA": 0.3255, + "MUSR": 0.4323, + "MMLU-PRO": 0.4566 + } + }, + { + "model_id": "allknowingroger/Gemma2Slerp1-2.6B", + "name": "Gemma2Slerp1-2.6B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5354, + "BBH": 0.4343, + "MATH Level 5": 0.1065, + "GPQA": 0.2836, + "MUSR": 0.4562, + "MMLU-PRO": 0.2689 + } + }, + { + "model_id": "allknowingroger/Gemma2Slerp1-27B", + "name": "Gemma2Slerp1-27B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7186, + "BBH": 0.6399, + "MATH Level 5": 0.2583, + "GPQA": 0.3641, + "MUSR": 0.4767, + "MMLU-PRO": 0.4456 + } + }, + { + "model_id": "allknowingroger/Gemma2Slerp2-2.6B", + "name": "Gemma2Slerp2-2.6B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5747, + "BBH": 0.4308, + "MATH Level 5": 0.0906, + "GPQA": 0.3054, + "MUSR": 0.4468, + "MMLU-PRO": 0.2696 + } + }, + { + "model_id": "allknowingroger/Gemma2Slerp2-27B", + "name": "Gemma2Slerp2-27B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7546, + "BBH": 0.6557, + "MATH Level 5": 0.2787, + "GPQA": 0.37, + "MUSR": 0.4621, + "MMLU-PRO": 0.4623 + } + }, + { + "model_id": "allknowingroger/Gemma2Slerp3-27B", + "name": "Gemma2Slerp3-27B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7426, + "BBH": 0.65, + "MATH Level 5": 0.2742, + "GPQA": 0.3549, + "MUSR": 0.474, + "MMLU-PRO": 0.4641 + } + }, + { + "model_id": "allknowingroger/Gemma2Slerp4-27B", + "name": "Gemma2Slerp4-27B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7497, + "BBH": 0.653, + "MATH Level 5": 0.2719, + "GPQA": 0.3666, + "MUSR": 0.4502, + "MMLU-PRO": 0.4649 + } + }, + { + "model_id": "allknowingroger/GemmaSlerp-9B", + "name": "GemmaSlerp-9B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7043, + "BBH": 0.5921, + "MATH Level 5": 0.216, + "GPQA": 0.344, + "MUSR": 0.4673, + "MMLU-PRO": 0.4161 + } + }, + { + "model_id": "allknowingroger/GemmaSlerp2-9B", + "name": "GemmaSlerp2-9B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7281, + "BBH": 0.5983, + "MATH Level 5": 0.2107, + "GPQA": 0.3523, + "MUSR": 0.4767, + "MMLU-PRO": 0.4239 + } + }, + { + "model_id": "allknowingroger/GemmaSlerp4-10B", + "name": "GemmaSlerp4-10B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7326, + "BBH": 0.6028, + "MATH Level 5": 0.2243, + "GPQA": 0.3532, + "MUSR": 0.454, + "MMLU-PRO": 0.425 + } + }, + { + "model_id": "allknowingroger/GemmaSlerp5-10B", + "name": "GemmaSlerp5-10B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7353, + "BBH": 0.6054, + "MATH Level 5": 0.2183, + "GPQA": 0.3523, + "MUSR": 0.4608, + "MMLU-PRO": 0.4328 + } + }, + { + "model_id": "allknowingroger/GemmaStock1-27B", + "name": "GemmaStock1-27B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7509, + "BBH": 0.6566, + "MATH Level 5": 0.2636, + "GPQA": 0.3641, + "MUSR": 0.4527, + "MMLU-PRO": 0.473 + } + }, + { + "model_id": "allknowingroger/HomerSlerp1-7B", + "name": "HomerSlerp1-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4621, + "BBH": 0.5518, + "MATH Level 5": 0.2719, + "GPQA": 0.318, + "MUSR": 0.4359, + "MMLU-PRO": 0.4504 + } + }, + { + "model_id": "allknowingroger/HomerSlerp2-7B", + "name": "HomerSlerp2-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4487, + "BBH": 0.5649, + "MATH Level 5": 0.2968, + "GPQA": 0.3196, + "MUSR": 0.4356, + "MMLU-PRO": 0.4515 + } + }, + { + "model_id": "allknowingroger/HomerSlerp3-7B", + "name": "HomerSlerp3-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4363, + "BBH": 0.5598, + "MATH Level 5": 0.3021, + "GPQA": 0.3171, + "MUSR": 0.4462, + "MMLU-PRO": 0.4535 + } + }, + { + "model_id": "allknowingroger/HomerSlerp4-7B", + "name": "HomerSlerp4-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4374, + "BBH": 0.5571, + "MATH Level 5": 0.327, + "GPQA": 0.3196, + "MUSR": 0.4408, + "MMLU-PRO": 0.4472 + } + }, + { + "model_id": "allknowingroger/LimyQstar-7B-slerp", + "name": "LimyQstar-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3491, + "BBH": 0.5024, + "MATH Level 5": 0.0687, + "GPQA": 0.2987, + "MUSR": 0.4146, + "MMLU-PRO": 0.3103 + } + }, + { + "model_id": "allknowingroger/Llama3.1-60B", + "name": "Llama3.1-60B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1815, + "BBH": 0.3242, + "MATH Level 5": 0.0, + "GPQA": 0.2945, + "MUSR": 0.3596, + "MMLU-PRO": 0.331 + } + }, + { + "model_id": "allknowingroger/Marco-01-slerp1-7B", + "name": "Marco-01-slerp1-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4681, + "BBH": 0.5541, + "MATH Level 5": 0.3157, + "GPQA": 0.3171, + "MUSR": 0.4452, + "MMLU-PRO": 0.4483 + } + }, + { + "model_id": "allknowingroger/Meme-7B-slerp", + "name": "Meme-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5164, + "BBH": 0.4661, + "MATH Level 5": 0.0438, + "GPQA": 0.2861, + "MUSR": 0.4223, + "MMLU-PRO": 0.281 + } + }, + { + "model_id": "allknowingroger/Ministral-8B-slerp", + "name": "Ministral-8B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1961, + "BBH": 0.4686, + "MATH Level 5": 0.0038, + "GPQA": 0.3121, + "MUSR": 0.4285, + "MMLU-PRO": 0.3119 + } + }, + { + "model_id": "allknowingroger/MistralPhi3-11B", + "name": "MistralPhi3-11B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1943, + "BBH": 0.6234, + "MATH Level 5": 0.0, + "GPQA": 0.3322, + "MUSR": 0.4267, + "MMLU-PRO": 0.4688 + } + }, + { + "model_id": "allknowingroger/Mistralmash1-7B-s", + "name": "Mistralmash1-7B-s", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3961, + "BBH": 0.5277, + "MATH Level 5": 0.0921, + "GPQA": 0.2945, + "MUSR": 0.4267, + "MMLU-PRO": 0.3293 + } + }, + { + "model_id": "allknowingroger/Mistralmash2-7B-s", + "name": "Mistralmash2-7B-s", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4102, + "BBH": 0.5305, + "MATH Level 5": 0.0793, + "GPQA": 0.2978, + "MUSR": 0.4372, + "MMLU-PRO": 0.3345 + } + }, + { + "model_id": "allknowingroger/MixTAO-19B-pass", + "name": "MixTAO-19B-pass", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3814, + "BBH": 0.5128, + "MATH Level 5": 0.0612, + "GPQA": 0.2844, + "MUSR": 0.4783, + "MMLU-PRO": 0.3105 + } + }, + { + "model_id": "allknowingroger/MixTaoTruthful-13B-slerp", + "name": "MixTaoTruthful-13B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4139, + "BBH": 0.5207, + "MATH Level 5": 0.0665, + "GPQA": 0.2844, + "MUSR": 0.4292, + "MMLU-PRO": 0.31 + } + }, + { + "model_id": "allknowingroger/MultiCalm-7B-slerp", + "name": "MultiCalm-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3927, + "BBH": 0.5122, + "MATH Level 5": 0.0619, + "GPQA": 0.2827, + "MUSR": 0.4319, + "MMLU-PRO": 0.3033 + } + }, + { + "model_id": "allknowingroger/MultiMash-12B-slerp", + "name": "MultiMash-12B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3974, + "BBH": 0.5142, + "MATH Level 5": 0.0808, + "GPQA": 0.2768, + "MUSR": 0.4438, + "MMLU-PRO": 0.3068 + } + }, + { + "model_id": "allknowingroger/MultiMash10-13B-slerp", + "name": "MultiMash10-13B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4163, + "BBH": 0.5186, + "MATH Level 5": 0.0718, + "GPQA": 0.2861, + "MUSR": 0.4318, + "MMLU-PRO": 0.3117 + } + }, + { + "model_id": "allknowingroger/MultiMash11-13B-slerp", + "name": "MultiMash11-13B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4251, + "BBH": 0.5194, + "MATH Level 5": 0.0702, + "GPQA": 0.2827, + "MUSR": 0.4373, + "MMLU-PRO": 0.3085 + } + }, + { + "model_id": "allknowingroger/MultiMash2-12B-slerp", + "name": "MultiMash2-12B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4261, + "BBH": 0.5134, + "MATH Level 5": 0.0642, + "GPQA": 0.2794, + "MUSR": 0.4228, + "MMLU-PRO": 0.3043 + } + }, + { + "model_id": "allknowingroger/MultiMash5-12B-slerp", + "name": "MultiMash5-12B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4142, + "BBH": 0.5145, + "MATH Level 5": 0.0634, + "GPQA": 0.2777, + "MUSR": 0.4203, + "MMLU-PRO": 0.3028 + } + }, + { + "model_id": "allknowingroger/MultiMash6-12B-slerp", + "name": "MultiMash6-12B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.43, + "BBH": 0.5196, + "MATH Level 5": 0.0725, + "GPQA": 0.2743, + "MUSR": 0.4306, + "MMLU-PRO": 0.3091 + } + }, + { + "model_id": "allknowingroger/MultiMash7-12B-slerp", + "name": "MultiMash7-12B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4213, + "BBH": 0.5111, + "MATH Level 5": 0.0695, + "GPQA": 0.2785, + "MUSR": 0.4279, + "MMLU-PRO": 0.3029 + } + }, + { + "model_id": "allknowingroger/MultiMash8-13B-slerp", + "name": "MultiMash8-13B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4321, + "BBH": 0.5178, + "MATH Level 5": 0.077, + "GPQA": 0.2886, + "MUSR": 0.4424, + "MMLU-PRO": 0.3126 + } + }, + { + "model_id": "allknowingroger/MultiMash9-13B-slerp", + "name": "MultiMash9-13B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4188, + "BBH": 0.5194, + "MATH Level 5": 0.0785, + "GPQA": 0.2802, + "MUSR": 0.4398, + "MMLU-PRO": 0.31 + } + }, + { + "model_id": "allknowingroger/MultiMerge-7B-slerp", + "name": "MultiMerge-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3948, + "BBH": 0.514, + "MATH Level 5": 0.0665, + "GPQA": 0.2827, + "MUSR": 0.428, + "MMLU-PRO": 0.3037 + } + }, + { + "model_id": "allknowingroger/Multimash3-12B-slerp", + "name": "Multimash3-12B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4437, + "BBH": 0.5177, + "MATH Level 5": 0.0627, + "GPQA": 0.2802, + "MUSR": 0.4344, + "MMLU-PRO": 0.3068 + } + }, + { + "model_id": "allknowingroger/Multimerge-19B-pass", + "name": "Multimerge-19B-pass", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1773, + "BBH": 0.2892, + "MATH Level 5": 0.0, + "GPQA": 0.2592, + "MUSR": 0.343, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "allknowingroger/MultiverseEx26-7B-slerp", + "name": "MultiverseEx26-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3939, + "BBH": 0.5134, + "MATH Level 5": 0.0755, + "GPQA": 0.2827, + "MUSR": 0.4293, + "MMLU-PRO": 0.3035 + } + }, + { + "model_id": "allknowingroger/NeuralWestSeverus-7B-slerp", + "name": "NeuralWestSeverus-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4136, + "BBH": 0.5244, + "MATH Level 5": 0.0733, + "GPQA": 0.271, + "MUSR": 0.4529, + "MMLU-PRO": 0.3137 + } + }, + { + "model_id": "allknowingroger/Neuralcoven-7B-slerp", + "name": "Neuralcoven-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3859, + "BBH": 0.5303, + "MATH Level 5": 0.0785, + "GPQA": 0.2852, + "MUSR": 0.429, + "MMLU-PRO": 0.3294 + } + }, + { + "model_id": "allknowingroger/Neuralmultiverse-7B-slerp", + "name": "Neuralmultiverse-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3769, + "BBH": 0.5166, + "MATH Level 5": 0.065, + "GPQA": 0.2844, + "MUSR": 0.428, + "MMLU-PRO": 0.3042 + } + }, + { + "model_id": "allknowingroger/Ph3della5-14B", + "name": "Ph3della5-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4799, + "BBH": 0.6332, + "MATH Level 5": 0.1767, + "GPQA": 0.3423, + "MUSR": 0.4386, + "MMLU-PRO": 0.4787 + } + }, + { + "model_id": "allknowingroger/Ph3merge-14B", + "name": "Ph3merge-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.2701, + "BBH": 0.6381, + "MATH Level 5": 0.0106, + "GPQA": 0.3381, + "MUSR": 0.4334, + "MMLU-PRO": 0.4611 + } + }, + { + "model_id": "allknowingroger/Ph3merge2-14B", + "name": "Ph3merge2-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1706, + "BBH": 0.3607, + "MATH Level 5": 0.0, + "GPQA": 0.2911, + "MUSR": 0.3911, + "MMLU-PRO": 0.1723 + } + }, + { + "model_id": "allknowingroger/Ph3merge3-14B", + "name": "Ph3merge3-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1645, + "BBH": 0.3597, + "MATH Level 5": 0.0, + "GPQA": 0.2852, + "MUSR": 0.4082, + "MMLU-PRO": 0.1647 + } + }, + { + "model_id": "allknowingroger/Ph3task1-14B", + "name": "Ph3task1-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4695, + "BBH": 0.6318, + "MATH Level 5": 0.1669, + "GPQA": 0.3507, + "MUSR": 0.4508, + "MMLU-PRO": 0.4734 + } + }, + { + "model_id": "allknowingroger/Ph3task2-14B", + "name": "Ph3task2-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4713, + "BBH": 0.6098, + "MATH Level 5": 0.1465, + "GPQA": 0.3305, + "MUSR": 0.4535, + "MMLU-PRO": 0.446 + } + }, + { + "model_id": "allknowingroger/Ph3task3-14B", + "name": "Ph3task3-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4962, + "BBH": 0.6298, + "MATH Level 5": 0.176, + "GPQA": 0.3414, + "MUSR": 0.4426, + "MMLU-PRO": 0.4771 + } + }, + { + "model_id": "allknowingroger/Ph3unsloth-3B-slerp", + "name": "Ph3unsloth-3B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1894, + "BBH": 0.5468, + "MATH Level 5": 0.1012, + "GPQA": 0.3247, + "MUSR": 0.4528, + "MMLU-PRO": 0.3701 + } + }, + { + "model_id": "allknowingroger/Phi3mash1-17B-pass", + "name": "Phi3mash1-17B-pass", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1884, + "BBH": 0.6129, + "MATH Level 5": 0.0, + "GPQA": 0.3196, + "MUSR": 0.4451, + "MMLU-PRO": 0.4589 + } + }, + { + "model_id": "allknowingroger/Quen2-65B", + "name": "Quen2-65B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1758, + "BBH": 0.2757, + "MATH Level 5": 0.0, + "GPQA": 0.2357, + "MUSR": 0.3209, + "MMLU-PRO": 0.1114 + } + }, + { + "model_id": "allknowingroger/Qwen2.5-42B-AGI", + "name": "Qwen2.5-42B-AGI", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1913, + "BBH": 0.2942, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.362, + "MMLU-PRO": 0.1168 + } + }, + { + "model_id": "allknowingroger/Qwen2.5-7B-task2", + "name": "Qwen2.5-7B-task2", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4527, + "BBH": 0.5626, + "MATH Level 5": 0.355, + "GPQA": 0.3163, + "MUSR": 0.437, + "MMLU-PRO": 0.4517 + } + }, + { + "model_id": "allknowingroger/Qwen2.5-7B-task3", + "name": "Qwen2.5-7B-task3", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5129, + "BBH": 0.5398, + "MATH Level 5": 0.2606, + "GPQA": 0.3171, + "MUSR": 0.4356, + "MMLU-PRO": 0.4501 + } + }, + { + "model_id": "allknowingroger/Qwen2.5-7B-task4", + "name": "Qwen2.5-7B-task4", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5005, + "BBH": 0.5583, + "MATH Level 5": 0.3112, + "GPQA": 0.3205, + "MUSR": 0.4395, + "MMLU-PRO": 0.4561 + } + }, + { + "model_id": "allknowingroger/Qwen2.5-7B-task7", + "name": "Qwen2.5-7B-task7", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4284, + "BBH": 0.5552, + "MATH Level 5": 0.065, + "GPQA": 0.3205, + "MUSR": 0.4326, + "MMLU-PRO": 0.4133 + } + }, + { + "model_id": "allknowingroger/Qwen2.5-7B-task8", + "name": "Qwen2.5-7B-task8", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4645, + "BBH": 0.5525, + "MATH Level 5": 0.3527, + "GPQA": 0.3205, + "MUSR": 0.4514, + "MMLU-PRO": 0.4433 + } + }, + { + "model_id": "allknowingroger/Qwen2.5-slerp-14B", + "name": "Qwen2.5-slerp-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4928, + "BBH": 0.6512, + "MATH Level 5": 0.4622, + "GPQA": 0.3674, + "MUSR": 0.4744, + "MMLU-PRO": 0.5379 + } + }, + { + "model_id": "allknowingroger/QwenSlerp12-7B", + "name": "QwenSlerp12-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5076, + "BBH": 0.5556, + "MATH Level 5": 0.2946, + "GPQA": 0.3154, + "MUSR": 0.4595, + "MMLU-PRO": 0.4461 + } + }, + { + "model_id": "allknowingroger/QwenSlerp4-14B", + "name": "QwenSlerp4-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.6328, + "BBH": 0.6483, + "MATH Level 5": 0.3693, + "GPQA": 0.3725, + "MUSR": 0.465, + "MMLU-PRO": 0.5436 + } + }, + { + "model_id": "allknowingroger/QwenSlerp5-14B", + "name": "QwenSlerp5-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.7119, + "BBH": 0.6357, + "MATH Level 5": 0.3565, + "GPQA": 0.3649, + "MUSR": 0.4675, + "MMLU-PRO": 0.5391 + } + }, + { + "model_id": "allknowingroger/QwenSlerp6-14B", + "name": "QwenSlerp6-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.6867, + "BBH": 0.6384, + "MATH Level 5": 0.3724, + "GPQA": 0.3733, + "MUSR": 0.469, + "MMLU-PRO": 0.5406 + } + }, + { + "model_id": "allknowingroger/QwenStock1-14B", + "name": "QwenStock1-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5634, + "BBH": 0.6528, + "MATH Level 5": 0.3769, + "GPQA": 0.3767, + "MUSR": 0.473, + "MMLU-PRO": 0.5418 + } + }, + { + "model_id": "allknowingroger/QwenStock2-14B", + "name": "QwenStock2-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5563, + "BBH": 0.6569, + "MATH Level 5": 0.3882, + "GPQA": 0.3792, + "MUSR": 0.4756, + "MMLU-PRO": 0.5406 + } + }, + { + "model_id": "allknowingroger/QwenStock3-14B", + "name": "QwenStock3-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5615, + "BBH": 0.6565, + "MATH Level 5": 0.3776, + "GPQA": 0.3784, + "MUSR": 0.4756, + "MMLU-PRO": 0.5428 + } + }, + { + "model_id": "allknowingroger/Qwenslerp2-14B", + "name": "Qwenslerp2-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5007, + "BBH": 0.6555, + "MATH Level 5": 0.4456, + "GPQA": 0.3683, + "MUSR": 0.4729, + "MMLU-PRO": 0.5403 + } + }, + { + "model_id": "allknowingroger/Qwenslerp2-7B", + "name": "Qwenslerp2-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5294, + "BBH": 0.5609, + "MATH Level 5": 0.3421, + "GPQA": 0.3129, + "MUSR": 0.4356, + "MMLU-PRO": 0.4515 + } + }, + { + "model_id": "allknowingroger/Qwenslerp3-14B", + "name": "Qwenslerp3-14B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5052, + "BBH": 0.6521, + "MATH Level 5": 0.4464, + "GPQA": 0.375, + "MUSR": 0.4676, + "MMLU-PRO": 0.5395 + } + }, + { + "model_id": "allknowingroger/Qwenslerp3-7B", + "name": "Qwenslerp3-7B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.5018, + "BBH": 0.558, + "MATH Level 5": 0.3218, + "GPQA": 0.3247, + "MUSR": 0.4515, + "MMLU-PRO": 0.4542 + } + }, + { + "model_id": "allknowingroger/ROGERphi-7B-slerp", + "name": "ROGERphi-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3861, + "BBH": 0.5196, + "MATH Level 5": 0.0733, + "GPQA": 0.2886, + "MUSR": 0.4685, + "MMLU-PRO": 0.3053 + } + }, + { + "model_id": "allknowingroger/RogerMerge-7B-slerp", + "name": "RogerMerge-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3933, + "BBH": 0.516, + "MATH Level 5": 0.0687, + "GPQA": 0.2802, + "MUSR": 0.432, + "MMLU-PRO": 0.303 + } + }, + { + "model_id": "allknowingroger/Rombos-LLM-V2.5-Qwen-42b", + "name": "Rombos-LLM-V2.5-Qwen-42b", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1879, + "BBH": 0.2969, + "MATH Level 5": 0.0, + "GPQA": 0.2626, + "MUSR": 0.3633, + "MMLU-PRO": 0.1168 + } + }, + { + "model_id": "allknowingroger/Strangecoven-7B-slerp", + "name": "Strangecoven-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3746, + "BBH": 0.5368, + "MATH Level 5": 0.0763, + "GPQA": 0.2894, + "MUSR": 0.4199, + "MMLU-PRO": 0.3364 + } + }, + { + "model_id": "allknowingroger/Weirdslerp2-25B", + "name": "Weirdslerp2-25B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1754, + "BBH": 0.2874, + "MATH Level 5": 0.0, + "GPQA": 0.2492, + "MUSR": 0.3524, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "allknowingroger/WestlakeMaziyar-7B-slerp", + "name": "WestlakeMaziyar-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4838, + "BBH": 0.5245, + "MATH Level 5": 0.0665, + "GPQA": 0.3037, + "MUSR": 0.4474, + "MMLU-PRO": 0.3078 + } + }, + { + "model_id": "allknowingroger/YamMaths-7B-slerp", + "name": "YamMaths-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4148, + "BBH": 0.5156, + "MATH Level 5": 0.0853, + "GPQA": 0.2802, + "MUSR": 0.4384, + "MMLU-PRO": 0.3131 + } + }, + { + "model_id": "allknowingroger/Yi-1.5-34B", + "name": "Yi-1.5-34B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1639, + "BBH": 0.2827, + "MATH Level 5": 0.0, + "GPQA": 0.2584, + "MUSR": 0.3857, + "MMLU-PRO": 0.1095 + } + }, + { + "model_id": "allknowingroger/Yi-blossom-40B", + "name": "Yi-blossom-40B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.2009, + "BBH": 0.3215, + "MATH Level 5": 0.0, + "GPQA": 0.2743, + "MUSR": 0.3843, + "MMLU-PRO": 0.108 + } + }, + { + "model_id": "allknowingroger/Yibuddy-35B", + "name": "Yibuddy-35B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4235, + "BBH": 0.5916, + "MATH Level 5": 0.1571, + "GPQA": 0.3557, + "MUSR": 0.4505, + "MMLU-PRO": 0.4489 + } + }, + { + "model_id": "allknowingroger/Yillama-40B", + "name": "Yillama-40B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1697, + "BBH": 0.4063, + "MATH Level 5": 0.0, + "GPQA": 0.2827, + "MUSR": 0.3501, + "MMLU-PRO": 0.1981 + } + }, + { + "model_id": "allknowingroger/Yislerp-34B", + "name": "Yislerp-34B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3692, + "BBH": 0.6159, + "MATH Level 5": 0.216, + "GPQA": 0.3582, + "MUSR": 0.4566, + "MMLU-PRO": 0.4751 + } + }, + { + "model_id": "allknowingroger/Yislerp2-34B", + "name": "Yislerp2-34B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.3999, + "BBH": 0.6246, + "MATH Level 5": 0.2296, + "GPQA": 0.3641, + "MUSR": 0.453, + "MMLU-PRO": 0.4724 + } + }, + { + "model_id": "allknowingroger/Yunconglong-13B-slerp", + "name": "Yunconglong-13B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4242, + "BBH": 0.5166, + "MATH Level 5": 0.0544, + "GPQA": 0.281, + "MUSR": 0.4161, + "MMLU-PRO": 0.3036 + } + }, + { + "model_id": "allknowingroger/limyClown-7B-slerp", + "name": "limyClown-7B-slerp", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.4017, + "BBH": 0.5148, + "MATH Level 5": 0.0687, + "GPQA": 0.281, + "MUSR": 0.4293, + "MMLU-PRO": 0.3038 + } + }, + { + "model_id": "allknowingroger/llama3-Jallabi-40B-s", + "name": "llama3-Jallabi-40B-s", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1921, + "BBH": 0.3252, + "MATH Level 5": 0.0, + "GPQA": 0.2374, + "MUSR": 0.375, + "MMLU-PRO": 0.1088 + } + }, + { + "model_id": "allknowingroger/llama3AnFeng-40B", + "name": "llama3AnFeng-40B", + "developer": "allknowingroger", + "scores": { + "IFEval": 0.1742, + "BBH": 0.3794, + "MATH Level 5": 0.0, + "GPQA": 0.3062, + "MUSR": 0.394, + "MMLU-PRO": 0.198 + } + }, + { + "model_id": "allura-org/L3.1-8b-RP-Ink", + "name": "L3.1-8b-RP-Ink", + "developer": "allura-org", + "scores": { + "IFEval": 0.7811, + "BBH": 0.4828, + "MATH Level 5": 0.148, + "GPQA": 0.2643, + "MUSR": 0.3608, + "MMLU-PRO": 0.3428 + } + }, + { + "model_id": "allura-org/MN-12b-RP-Ink", + "name": "MN-12b-RP-Ink", + "developer": "allura-org", + "scores": { + "IFEval": 0.7186, + "BBH": 0.4834, + "MATH Level 5": 0.1186, + "GPQA": 0.2852, + "MUSR": 0.3818, + "MMLU-PRO": 0.3514 + } + }, + { + "model_id": "allura-org/MS-Meadowlark-22B", + "name": "MS-Meadowlark-22B", + "developer": "allura-org", + "scores": { + "IFEval": 0.6697, + "BBH": 0.5163, + "MATH Level 5": 0.1835, + "GPQA": 0.3255, + "MUSR": 0.3843, + "MMLU-PRO": 0.3823 + } + }, + { + "model_id": "allura-org/Mistral-Small-24b-Sertraline-0304", + "name": "Mistral-Small-24b-Sertraline-0304", + "developer": "allura-org", + "scores": { + "IFEval": 0.68, + "BBH": 0.6525, + "MATH Level 5": 0.2228, + "GPQA": 0.3515, + "MUSR": 0.4395, + "MMLU-PRO": 0.5106 + } + }, + { + "model_id": "allura-org/Mistral-Small-Sisyphus-24b-2503", + "name": "Mistral-Small-Sisyphus-24b-2503", + "developer": "allura-org", + "scores": { + "IFEval": 0.6848, + "BBH": 0.627, + "MATH Level 5": 0.25, + "GPQA": 0.2626, + "MUSR": 0.3977, + "MMLU-PRO": 0.5127 + } + }, + { + "model_id": "allura-org/MoE-Girl-1BA-7BT", + "name": "MoE-Girl-1BA-7BT", + "developer": "allura-org", + "scores": { + "IFEval": 0.2705, + "BBH": 0.3139, + "MATH Level 5": 0.0151, + "GPQA": 0.2584, + "MUSR": 0.3436, + "MMLU-PRO": 0.1218 + } + }, + { + "model_id": "allura-org/TQ2.5-14B-Aletheia-v1", + "name": "TQ2.5-14B-Aletheia-v1", + "developer": "allura-org", + "scores": { + "IFEval": 0.753, + "BBH": 0.6585, + "MATH Level 5": 0.3399, + "GPQA": 0.3624, + "MUSR": 0.4452, + "MMLU-PRO": 0.5241 + } + }, + { + "model_id": "allura-org/TQ2.5-14B-Neon-v1", + "name": "TQ2.5-14B-Neon-v1", + "developer": "allura-org", + "scores": { + "IFEval": 0.6754, + "BBH": 0.6553, + "MATH Level 5": 0.3603, + "GPQA": 0.3716, + "MUSR": 0.461, + "MMLU-PRO": 0.5253 + } + }, + { + "model_id": "allura-org/Teleut-7b", + "name": "Teleut-7b", + "developer": "allura-org", + "scores": { + "IFEval": 0.6379, + "BBH": 0.5141, + "MATH Level 5": 0.2409, + "GPQA": 0.3263, + "MUSR": 0.464, + "MMLU-PRO": 0.4131 + } + }, + { + "model_id": "aloobun/Meta-Llama-3-7B-28Layers", + "name": "Meta-Llama-3-7B-28Layers", + "developer": "aloobun", + "scores": { + "IFEval": 0.1964, + "BBH": 0.4437, + "MATH Level 5": 0.0279, + "GPQA": 0.2945, + "MUSR": 0.3589, + "MMLU-PRO": 0.316 + } + }, + { + "model_id": "aloobun/d-SmolLM2-360M", + "name": "d-SmolLM2-360M", + "developer": "aloobun", + "scores": { + "IFEval": 0.2097, + "BBH": 0.3196, + "MATH Level 5": 0.0128, + "GPQA": 0.2534, + "MUSR": 0.3981, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "alpindale/WizardLM-2-8x22B", + "name": "WizardLM-2-8x22B", + "developer": "alpindale", + "scores": { + "IFEval": 0.5272, + "BBH": 0.6377, + "MATH Level 5": 0.25, + "GPQA": 0.3817, + "MUSR": 0.4387, + "MMLU-PRO": 0.4596 + } + }, + { + "model_id": "alpindale/magnum-72b-v1", + "name": "magnum-72b-v1", + "developer": "alpindale", + "scores": { + "IFEval": 0.7606, + "BBH": 0.6982, + "MATH Level 5": 0.398, + "GPQA": 0.3909, + "MUSR": 0.4489, + "MMLU-PRO": 0.5468 + } + }, + { + "model_id": "altomek/YiSM-34B-0rn", + "name": "YiSM-34B-0rn", + "developer": "altomek", + "scores": { + "IFEval": 0.4284, + "BBH": 0.614, + "MATH Level 5": 0.2281, + "GPQA": 0.3716, + "MUSR": 0.445, + "MMLU-PRO": 0.4696 + } + }, + { + "model_id": "amazon/MegaBeam-Mistral-7B-300k", + "name": "MegaBeam-Mistral-7B-300k", + "developer": "amazon", + "scores": { + "IFEval": 0.5203, + "BBH": 0.4228, + "MATH Level 5": 0.0211, + "GPQA": 0.2735, + "MUSR": 0.398, + "MMLU-PRO": 0.2549 + } + }, + { + "model_id": "amd/AMD-Llama-135m", + "name": "AMD-Llama-135m", + "developer": "amd", + "scores": { + "IFEval": 0.1918, + "BBH": 0.2969, + "MATH Level 5": 0.0076, + "GPQA": 0.2584, + "MUSR": 0.3846, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "anakin87/gemma-2b-orpo", + "name": "gemma-2b-orpo", + "developer": "anakin87", + "scores": { + "IFEval": 0.2478, + "BBH": 0.3426, + "MATH Level 5": 0.0189, + "GPQA": 0.2617, + "MUSR": 0.3728, + "MMLU-PRO": 0.1306 + } + }, + { + "model_id": "anthracite-org/magnum-v1-72b", + "name": "magnum-v1-72b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.7606, + "BBH": 0.6982, + "MATH Level 5": 0.398, + "GPQA": 0.3909, + "MUSR": 0.4489, + "MMLU-PRO": 0.5486 + } + }, + { + "model_id": "anthracite-org/magnum-v2-12b", + "name": "magnum-v2-12b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.3762, + "BBH": 0.5021, + "MATH Level 5": 0.0544, + "GPQA": 0.2911, + "MUSR": 0.4179, + "MMLU-PRO": 0.3167 + } + }, + { + "model_id": "anthracite-org/magnum-v2-72b", + "name": "magnum-v2-72b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.756, + "BBH": 0.7005, + "MATH Level 5": 0.3542, + "GPQA": 0.3859, + "MUSR": 0.4372, + "MMLU-PRO": 0.5456 + } + }, + { + "model_id": "anthracite-org/magnum-v2.5-12b-kto", + "name": "magnum-v2.5-12b-kto", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.3866, + "BBH": 0.5077, + "MATH Level 5": 0.0521, + "GPQA": 0.2936, + "MUSR": 0.4086, + "MMLU-PRO": 0.3215 + } + }, + { + "model_id": "anthracite-org/magnum-v3-27b-kto", + "name": "magnum-v3-27b-kto", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.5675, + "BBH": 0.586, + "MATH Level 5": 0.1813, + "GPQA": 0.3557, + "MUSR": 0.3855, + "MMLU-PRO": 0.4238 + } + }, + { + "model_id": "anthracite-org/magnum-v3-34b", + "name": "magnum-v3-34b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.5115, + "BBH": 0.6088, + "MATH Level 5": 0.1949, + "GPQA": 0.3607, + "MUSR": 0.3872, + "MMLU-PRO": 0.4752 + } + }, + { + "model_id": "anthracite-org/magnum-v3-9b-chatml", + "name": "magnum-v3-9b-chatml", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.1275, + "BBH": 0.5428, + "MATH Level 5": 0.0695, + "GPQA": 0.3456, + "MUSR": 0.4432, + "MMLU-PRO": 0.4242 + } + }, + { + "model_id": "anthracite-org/magnum-v3-9b-customgemma2", + "name": "magnum-v3-9b-customgemma2", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.1273, + "BBH": 0.534, + "MATH Level 5": 0.0718, + "GPQA": 0.3289, + "MUSR": 0.4565, + "MMLU-PRO": 0.4205 + } + }, + { + "model_id": "anthracite-org/magnum-v4-12b", + "name": "magnum-v4-12b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.3393, + "BBH": 0.5177, + "MATH Level 5": 0.1178, + "GPQA": 0.2961, + "MUSR": 0.4093, + "MMLU-PRO": 0.3604 + } + }, + { + "model_id": "anthracite-org/magnum-v4-22b", + "name": "magnum-v4-22b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.5629, + "BBH": 0.5486, + "MATH Level 5": 0.2002, + "GPQA": 0.328, + "MUSR": 0.4408, + "MMLU-PRO": 0.383 + } + }, + { + "model_id": "anthracite-org/magnum-v4-27b", + "name": "magnum-v4-27b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.3454, + "BBH": 0.5867, + "MATH Level 5": 0.1798, + "GPQA": 0.37, + "MUSR": 0.438, + "MMLU-PRO": 0.4376 + } + }, + { + "model_id": "anthracite-org/magnum-v4-9b", + "name": "magnum-v4-9b", + "developer": "anthracite-org", + "scores": { + "IFEval": 0.3503, + "BBH": 0.5336, + "MATH Level 5": 0.1307, + "GPQA": 0.3473, + "MUSR": 0.4516, + "MMLU-PRO": 0.3953 + } + }, + { + "model_id": "apple/DCLM-7B", + "name": "DCLM-7B", + "developer": "apple", + "scores": { + "IFEval": 0.2173, + "BBH": 0.4232, + "MATH Level 5": 0.037, + "GPQA": 0.3154, + "MUSR": 0.3921, + "MMLU-PRO": 0.3111 + } + }, + { + "model_id": "appvoid/arco-2", + "name": "arco-2", + "developer": "appvoid", + "scores": { + "IFEval": 0.1991, + "BBH": 0.3146, + "MATH Level 5": 0.0136, + "GPQA": 0.2391, + "MUSR": 0.3536, + "MMLU-PRO": 0.1116 + } + }, + { + "model_id": "appvoid/arco-2-instruct", + "name": "arco-2-instruct", + "developer": "appvoid", + "scores": { + "IFEval": 0.2164, + "BBH": 0.3133, + "MATH Level 5": 0.0128, + "GPQA": 0.2383, + "MUSR": 0.3496, + "MMLU-PRO": 0.1113 + } + }, + { + "model_id": "arcee-ai/Arcee-Blitz", + "name": "Arcee-Blitz", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.5543, + "BBH": 0.6607, + "MATH Level 5": 0.3482, + "GPQA": 0.3851, + "MUSR": 0.5047, + "MMLU-PRO": 0.6154 + } + }, + { + "model_id": "arcee-ai/Arcee-Maestro-7B-Preview", + "name": "Arcee-Maestro-7B-Preview", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.275, + "BBH": 0.4648, + "MATH Level 5": 0.4992, + "GPQA": 0.3322, + "MUSR": 0.3885, + "MMLU-PRO": 0.3039 + } + }, + { + "model_id": "arcee-ai/Arcee-Nova", + "name": "Arcee-Nova", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.7907, + "BBH": 0.6942, + "MATH Level 5": 0.4381, + "GPQA": 0.3851, + "MUSR": 0.4562, + "MMLU-PRO": 0.5452 + } + }, + { + "model_id": "arcee-ai/Arcee-Spark", + "name": "Arcee-Spark", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.5621, + "BBH": 0.5489, + "MATH Level 5": 0.2953, + "GPQA": 0.307, + "MUSR": 0.4021, + "MMLU-PRO": 0.3822 + } + }, + { + "model_id": "arcee-ai/Llama-3.1-SuperNova-Lite", + "name": "Llama-3.1-SuperNova-Lite", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.8017, + "BBH": 0.5152, + "MATH Level 5": 0.1828, + "GPQA": 0.3062, + "MUSR": 0.4163, + "MMLU-PRO": 0.3877 + } + }, + { + "model_id": "arcee-ai/Llama-Spark", + "name": "Llama-Spark", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.7911, + "BBH": 0.5054, + "MATH Level 5": 0.139, + "GPQA": 0.2995, + "MUSR": 0.3593, + "MMLU-PRO": 0.3721 + } + }, + { + "model_id": "arcee-ai/SuperNova-Medius", + "name": "SuperNova-Medius", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.7184, + "BBH": 0.6377, + "MATH Level 5": 0.469, + "GPQA": 0.3331, + "MUSR": 0.4233, + "MMLU-PRO": 0.5035 + } + }, + { + "model_id": "arcee-ai/Virtuoso-Lite", + "name": "Virtuoso-Lite", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.81, + "BBH": 0.6099, + "MATH Level 5": 0.253, + "GPQA": 0.344, + "MUSR": 0.4595, + "MMLU-PRO": 0.4441 + } + }, + { + "model_id": "arcee-ai/Virtuoso-Small", + "name": "Virtuoso-Small", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.7935, + "BBH": 0.6518, + "MATH Level 5": 0.4094, + "GPQA": 0.3364, + "MUSR": 0.4339, + "MMLU-PRO": 0.5191 + } + }, + { + "model_id": "arcee-ai/Virtuoso-Small-v2", + "name": "Virtuoso-Small-v2", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.8273, + "BBH": 0.6554, + "MATH Level 5": 0.466, + "GPQA": 0.3532, + "MUSR": 0.4313, + "MMLU-PRO": 0.5188 + } + }, + { + "model_id": "arcee-ai/raspberry-3B", + "name": "raspberry-3B", + "developer": "arcee-ai", + "scores": { + "IFEval": 0.3154, + "BBH": 0.4269, + "MATH Level 5": 0.1035, + "GPQA": 0.2777, + "MUSR": 0.4123, + "MMLU-PRO": 0.2854 + } + }, + { + "model_id": "argilla-warehouse/Llama-3.1-8B-MagPie-Ultra", + "name": "Llama-3.1-8B-MagPie-Ultra", + "developer": "argilla-warehouse", + "scores": { + "IFEval": 0.5757, + "BBH": 0.462, + "MATH Level 5": 0.077, + "GPQA": 0.2668, + "MUSR": 0.3543, + "MMLU-PRO": 0.3144 + } + }, + { + "model_id": "argilla/notus-7b-v1", + "name": "notus-7b-v1", + "developer": "argilla", + "scores": { + "IFEval": 0.5082, + "BBH": 0.4512, + "MATH Level 5": 0.0317, + "GPQA": 0.2894, + "MUSR": 0.3364, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "argilla/notux-8x7b-v1", + "name": "notux-8x7b-v1", + "developer": "argilla", + "scores": { + "IFEval": 0.5422, + "BBH": 0.5363, + "MATH Level 5": 0.0997, + "GPQA": 0.3087, + "MUSR": 0.4176, + "MMLU-PRO": 0.366 + } + }, + { + "model_id": "arisin/orca-platypus-13B-slerp", + "name": "orca-platypus-13B-slerp", + "developer": "arisin", + "scores": { + "IFEval": 0.2672, + "BBH": 0.4631, + "MATH Level 5": 0.0159, + "GPQA": 0.2987, + "MUSR": 0.4253, + "MMLU-PRO": 0.2592 + } + }, + { + "model_id": "arshiaafshani/Arsh-V1", + "name": "Arsh-V1", + "developer": "arshiaafshani", + "scores": { + "IFEval": 0.6043, + "BBH": 0.674, + "MATH Level 5": 0.2621, + "GPQA": 0.3733, + "MUSR": 0.4899, + "MMLU-PRO": 0.5257 + } + }, + { + "model_id": "asharsha30/LLAMA_Harsha_8_B_ORDP_10k", + "name": "LLAMA_Harsha_8_B_ORDP_10k", + "developer": "asharsha30", + "scores": { + "IFEval": 0.3464, + "BBH": 0.4669, + "MATH Level 5": 0.0665, + "GPQA": 0.2735, + "MUSR": 0.3697, + "MMLU-PRO": 0.281 + } + }, + { + "model_id": "ashercn97/a1-v0.0.1", + "name": "a1-v0.0.1", + "developer": "ashercn97", + "scores": { + "IFEval": 0.2198, + "BBH": 0.5188, + "MATH Level 5": 0.2145, + "GPQA": 0.3112, + "MUSR": 0.412, + "MMLU-PRO": 0.4165 + } + }, + { + "model_id": "ashercn97/a1-v002", + "name": "a1-v002", + "developer": "ashercn97", + "scores": { + "IFEval": 0.2585, + "BBH": 0.5261, + "MATH Level 5": 0.2341, + "GPQA": 0.3188, + "MUSR": 0.4159, + "MMLU-PRO": 0.4175 + } + }, + { + "model_id": "assskelad/smollm2-360M-sft_SmallThoughts", + "name": "smollm2-360M-sft_SmallThoughts", + "developer": "assskelad", + "scores": { + "IFEval": 0.2007, + "BBH": 0.315, + "MATH Level 5": 0.0166, + "GPQA": 0.2592, + "MUSR": 0.3395, + "MMLU-PRO": 0.1182 + } + }, + { + "model_id": "athirdpath/Llama-3.1-Instruct_NSFW-pretrained_e1-plus_reddit", + "name": "Llama-3.1-Instruct_NSFW-pretrained_e1-plus_reddit", + "developer": "athirdpath", + "scores": { + "IFEval": 0.4521, + "BBH": 0.4939, + "MATH Level 5": 0.102, + "GPQA": 0.2919, + "MUSR": 0.3864, + "MMLU-PRO": 0.3565 + } + }, + { + "model_id": "automerger/YamshadowExperiment28-7B", + "name": "YamshadowExperiment28-7B", + "developer": "automerger", + "scores": { + "IFEval": 0.407, + "BBH": 0.515, + "MATH Level 5": 0.0612, + "GPQA": 0.2869, + "MUSR": 0.4306, + "MMLU-PRO": 0.306 + } + }, + { + "model_id": "avemio/GRAG-NEMO-12B-ORPO-HESSIAN-AI", + "name": "GRAG-NEMO-12B-ORPO-HESSIAN-AI", + "developer": "avemio", + "scores": { + "IFEval": 0.0, + "BBH": 0.2607, + "MATH Level 5": 0.0, + "GPQA": 0.2592, + "MUSR": 0.3447, + "MMLU-PRO": 0.1061 + } + }, + { + "model_id": "awnr/Mistral-7B-v0.1-signtensors-1-over-2", + "name": "Mistral-7B-v0.1-signtensors-1-over-2", + "developer": "awnr", + "scores": { + "IFEval": 0.2179, + "BBH": 0.4423, + "MATH Level 5": 0.034, + "GPQA": 0.307, + "MUSR": 0.4006, + "MMLU-PRO": 0.3 + } + }, + { + "model_id": "awnr/Mistral-7B-v0.1-signtensors-1-over-4", + "name": "Mistral-7B-v0.1-signtensors-1-over-4", + "developer": "awnr", + "scores": { + "IFEval": 0.2133, + "BBH": 0.3507, + "MATH Level 5": 0.0249, + "GPQA": 0.2701, + "MUSR": 0.346, + "MMLU-PRO": 0.2311 + } + }, + { + "model_id": "awnr/Mistral-7B-v0.1-signtensors-3-over-8", + "name": "Mistral-7B-v0.1-signtensors-3-over-8", + "developer": "awnr", + "scores": { + "IFEval": 0.2394, + "BBH": 0.43, + "MATH Level 5": 0.0332, + "GPQA": 0.3037, + "MUSR": 0.3818, + "MMLU-PRO": 0.3001 + } + }, + { + "model_id": "awnr/Mistral-7B-v0.1-signtensors-5-over-16", + "name": "Mistral-7B-v0.1-signtensors-5-over-16", + "developer": "awnr", + "scores": { + "IFEval": 0.2118, + "BBH": 0.4124, + "MATH Level 5": 0.0295, + "GPQA": 0.281, + "MUSR": 0.3686, + "MMLU-PRO": 0.2958 + } + }, + { + "model_id": "awnr/Mistral-7B-v0.1-signtensors-7-over-16", + "name": "Mistral-7B-v0.1-signtensors-7-over-16", + "developer": "awnr", + "scores": { + "IFEval": 0.2294, + "BBH": 0.4316, + "MATH Level 5": 0.0385, + "GPQA": 0.3037, + "MUSR": 0.3952, + "MMLU-PRO": 0.303 + } + }, + { + "model_id": "aws-prototyping/MegaBeam-Mistral-7B-512k", + "name": "MegaBeam-Mistral-7B-512k", + "developer": "aws-prototyping", + "scores": { + "IFEval": 0.5973, + "BBH": 0.3662, + "MATH Level 5": 0.0287, + "GPQA": 0.2827, + "MUSR": 0.3994, + "MMLU-PRO": 0.2589 + } + }, + { + "model_id": "axolotl-ai-co/romulus-mistral-nemo-12b-simpo", + "name": "romulus-mistral-nemo-12b-simpo", + "developer": "axolotl-ai-co", + "scores": { + "IFEval": 0.6079, + "BBH": 0.5395, + "MATH Level 5": 0.114, + "GPQA": 0.2785, + "MUSR": 0.4233, + "MMLU-PRO": 0.3469 + } + }, + { + "model_id": "baconnier/Napoleon_24B_V0.0", + "name": "Napoleon_24B_V0.0", + "developer": "baconnier", + "scores": { + "IFEval": 0.1801, + "BBH": 0.6367, + "MATH Level 5": 0.2273, + "GPQA": 0.3792, + "MUSR": 0.442, + "MMLU-PRO": 0.504 + } + }, + { + "model_id": "baconnier/Napoleon_24B_V0.2", + "name": "Napoleon_24B_V0.2", + "developer": "baconnier", + "scores": { + "IFEval": 0.2527, + "BBH": 0.5911, + "MATH Level 5": 0.1435, + "GPQA": 0.3381, + "MUSR": 0.446, + "MMLU-PRO": 0.4357 + } + }, + { + "model_id": "baebee/7B-Cetacea", + "name": "7B-Cetacea", + "developer": "baebee", + "scores": { + "IFEval": 0.5279, + "BBH": 0.4757, + "MATH Level 5": 0.0468, + "GPQA": 0.2861, + "MUSR": 0.4136, + "MMLU-PRO": 0.2955 + } + }, + { + "model_id": "baebee/mergekit-model_stock-nzjnheg", + "name": "mergekit-model_stock-nzjnheg", + "developer": "baebee", + "scores": { + "IFEval": 0.4844, + "BBH": 0.5287, + "MATH Level 5": 0.1677, + "GPQA": 0.2802, + "MUSR": 0.3847, + "MMLU-PRO": 0.3699 + } + }, + { + "model_id": "baebee/mergekit-ties-fnjenli", + "name": "mergekit-ties-fnjenli", + "developer": "baebee", + "scores": { + "IFEval": 0.1988, + "BBH": 0.3024, + "MATH Level 5": 0.0023, + "GPQA": 0.245, + "MUSR": 0.4019, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B", + "name": "MISCHIEVOUS-12B", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3852, + "BBH": 0.5405, + "MATH Level 5": 0.1276, + "GPQA": 0.3205, + "MUSR": 0.4145, + "MMLU-PRO": 0.3672 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_0.1v", + "name": "MISCHIEVOUS-12B-Mix_0.1v", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3636, + "BBH": 0.5436, + "MATH Level 5": 0.1329, + "GPQA": 0.328, + "MUSR": 0.4132, + "MMLU-PRO": 0.3674 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_0.2v", + "name": "MISCHIEVOUS-12B-Mix_0.2v", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3624, + "BBH": 0.5434, + "MATH Level 5": 0.1261, + "GPQA": 0.3255, + "MUSR": 0.4158, + "MMLU-PRO": 0.3663 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_0.3v", + "name": "MISCHIEVOUS-12B-Mix_0.3v", + "developer": "bamec66557", + "scores": { + "IFEval": 0.387, + "BBH": 0.5431, + "MATH Level 5": 0.1337, + "GPQA": 0.3196, + "MUSR": 0.4131, + "MMLU-PRO": 0.3664 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_0.4v", + "name": "MISCHIEVOUS-12B-Mix_0.4v", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6508, + "BBH": 0.5094, + "MATH Level 5": 0.1352, + "GPQA": 0.3171, + "MUSR": 0.4176, + "MMLU-PRO": 0.3683 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_0.5v", + "name": "MISCHIEVOUS-12B-Mix_0.5v", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3746, + "BBH": 0.5422, + "MATH Level 5": 0.1367, + "GPQA": 0.3205, + "MUSR": 0.4132, + "MMLU-PRO": 0.3661 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_0.6v", + "name": "MISCHIEVOUS-12B-Mix_0.6v", + "developer": "bamec66557", + "scores": { + "IFEval": 0.4366, + "BBH": 0.5449, + "MATH Level 5": 0.1254, + "GPQA": 0.328, + "MUSR": 0.4185, + "MMLU-PRO": 0.3662 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_III_IV_V", + "name": "MISCHIEVOUS-12B-Mix_III_IV_V", + "developer": "bamec66557", + "scores": { + "IFEval": 0.4031, + "BBH": 0.5465, + "MATH Level 5": 0.1292, + "GPQA": 0.3205, + "MUSR": 0.4198, + "MMLU-PRO": 0.3664 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_III_ex_V", + "name": "MISCHIEVOUS-12B-Mix_III_ex_V", + "developer": "bamec66557", + "scores": { + "IFEval": 0.4316, + "BBH": 0.5449, + "MATH Level 5": 0.1322, + "GPQA": 0.3205, + "MUSR": 0.4198, + "MMLU-PRO": 0.3649 + } + }, + { + "model_id": "bamec66557/MISCHIEVOUS-12B-Mix_Neo", + "name": "MISCHIEVOUS-12B-Mix_Neo", + "developer": "bamec66557", + "scores": { + "IFEval": 0.625, + "BBH": 0.5078, + "MATH Level 5": 0.1329, + "GPQA": 0.3163, + "MUSR": 0.415, + "MMLU-PRO": 0.3685 + } + }, + { + "model_id": "bamec66557/Mistral-Nemo-VICIOUS_MESH-12B-2407", + "name": "Mistral-Nemo-VICIOUS_MESH-12B-2407", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6706, + "BBH": 0.5156, + "MATH Level 5": 0.1367, + "GPQA": 0.3154, + "MUSR": 0.431, + "MMLU-PRO": 0.3677 + } + }, + { + "model_id": "bamec66557/NameLess-12B-prob", + "name": "NameLess-12B-prob", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6602, + "BBH": 0.5158, + "MATH Level 5": 0.1261, + "GPQA": 0.3146, + "MUSR": 0.4336, + "MMLU-PRO": 0.3684 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B", + "name": "VICIOUS_MESH-12B", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3716, + "BBH": 0.5436, + "MATH Level 5": 0.1344, + "GPQA": 0.328, + "MUSR": 0.4105, + "MMLU-PRO": 0.3679 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-0.1v", + "name": "VICIOUS_MESH-12B-0.1v", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3657, + "BBH": 0.5412, + "MATH Level 5": 0.1322, + "GPQA": 0.3247, + "MUSR": 0.4158, + "MMLU-PRO": 0.3683 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-0.X.ver", + "name": "VICIOUS_MESH-12B-0.X.ver", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3776, + "BBH": 0.5416, + "MATH Level 5": 0.1201, + "GPQA": 0.3213, + "MUSR": 0.4198, + "MMLU-PRO": 0.3671 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-ALPHA", + "name": "VICIOUS_MESH-12B-ALPHA", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6365, + "BBH": 0.5094, + "MATH Level 5": 0.1367, + "GPQA": 0.3138, + "MUSR": 0.4203, + "MMLU-PRO": 0.3697 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-BETA", + "name": "VICIOUS_MESH-12B-BETA", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6721, + "BBH": 0.5156, + "MATH Level 5": 0.1329, + "GPQA": 0.3163, + "MUSR": 0.431, + "MMLU-PRO": 0.3679 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-DELTA", + "name": "VICIOUS_MESH-12B-DELTA", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6469, + "BBH": 0.5055, + "MATH Level 5": 0.1375, + "GPQA": 0.3121, + "MUSR": 0.4057, + "MMLU-PRO": 0.3651 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-DIGAMMA", + "name": "VICIOUS_MESH-12B-DIGAMMA", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6429, + "BBH": 0.5061, + "MATH Level 5": 0.1337, + "GPQA": 0.3129, + "MUSR": 0.4097, + "MMLU-PRO": 0.3659 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-EPSILON", + "name": "VICIOUS_MESH-12B-EPSILON", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6305, + "BBH": 0.5038, + "MATH Level 5": 0.1261, + "GPQA": 0.3146, + "MUSR": 0.407, + "MMLU-PRO": 0.3648 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-GAMMA", + "name": "VICIOUS_MESH-12B-GAMMA", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6362, + "BBH": 0.5182, + "MATH Level 5": 0.1307, + "GPQA": 0.3138, + "MUSR": 0.4363, + "MMLU-PRO": 0.3666 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-NEMO", + "name": "VICIOUS_MESH-12B-NEMO", + "developer": "bamec66557", + "scores": { + "IFEval": 0.4022, + "BBH": 0.5442, + "MATH Level 5": 0.1269, + "GPQA": 0.3238, + "MUSR": 0.4251, + "MMLU-PRO": 0.3716 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-OMEGA", + "name": "VICIOUS_MESH-12B-OMEGA", + "developer": "bamec66557", + "scores": { + "IFEval": 0.67, + "BBH": 0.5166, + "MATH Level 5": 0.1344, + "GPQA": 0.3154, + "MUSR": 0.4323, + "MMLU-PRO": 0.3677 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B-UNION", + "name": "VICIOUS_MESH-12B-UNION", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6429, + "BBH": 0.5107, + "MATH Level 5": 0.139, + "GPQA": 0.3121, + "MUSR": 0.4257, + "MMLU-PRO": 0.3672 + } + }, + { + "model_id": "bamec66557/VICIOUS_MESH-12B_Razor", + "name": "VICIOUS_MESH-12B_Razor", + "developer": "bamec66557", + "scores": { + "IFEval": 0.3736, + "BBH": 0.5447, + "MATH Level 5": 0.1299, + "GPQA": 0.323, + "MUSR": 0.4092, + "MMLU-PRO": 0.3669 + } + }, + { + "model_id": "bamec66557/mergekit-model_stock-zdaysvi", + "name": "mergekit-model_stock-zdaysvi", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6426, + "BBH": 0.5063, + "MATH Level 5": 0.1352, + "GPQA": 0.3138, + "MUSR": 0.4124, + "MMLU-PRO": 0.3688 + } + }, + { + "model_id": "bamec66557/mergekit-ties-sinbkow", + "name": "mergekit-ties-sinbkow", + "developer": "bamec66557", + "scores": { + "IFEval": 0.6432, + "BBH": 0.5092, + "MATH Level 5": 0.145, + "GPQA": 0.3196, + "MUSR": 0.4045, + "MMLU-PRO": 0.3603 + } + }, + { + "model_id": "belztjti/dffghgjh", + "name": "dffghgjh", + "developer": "belztjti", + "scores": { + "IFEval": 0.5784, + "BBH": 0.3582, + "MATH Level 5": 0.0234, + "GPQA": 0.2634, + "MUSR": 0.3475, + "MMLU-PRO": 0.3422 + } + }, + { + "model_id": "belztjti/dtfgv", + "name": "dtfgv", + "developer": "belztjti", + "scores": { + "IFEval": 0.3345, + "BBH": 0.3282, + "MATH Level 5": 0.0181, + "GPQA": 0.2693, + "MUSR": 0.3794, + "MMLU-PRO": 0.1504 + } + }, + { + "model_id": "benhaotang/phi4-qwq-sky-t1", + "name": "phi4-qwq-sky-t1", + "developer": "benhaotang", + "scores": { + "IFEval": 0.046, + "BBH": 0.6711, + "MATH Level 5": 0.4101, + "GPQA": 0.3951, + "MUSR": 0.49, + "MMLU-PRO": 0.5244 + } + }, + { + "model_id": "beomi/gemma-mling-7b", + "name": "gemma-mling-7b", + "developer": "beomi", + "scores": { + "IFEval": 0.2029, + "BBH": 0.4068, + "MATH Level 5": 0.0544, + "GPQA": 0.25, + "MUSR": 0.3759, + "MMLU-PRO": 0.2633 + } + }, + { + "model_id": "beowolx/CodeNinja-1.0-OpenChat-7B", + "name": "CodeNinja-1.0-OpenChat-7B", + "developer": "beowolx", + "scores": { + "IFEval": 0.5447, + "BBH": 0.4441, + "MATH Level 5": 0.0672, + "GPQA": 0.2945, + "MUSR": 0.4243, + "MMLU-PRO": 0.3015 + } + }, + { + "model_id": "berkeley-nest/Starling-LM-7B-alpha", + "name": "Starling-LM-7B-alpha", + "developer": "berkeley-nest", + "scores": { + "IFEval": 0.548, + "BBH": 0.444, + "MATH Level 5": 0.0838, + "GPQA": 0.297, + "MUSR": 0.412, + "MMLU-PRO": 0.3172 + } + }, + { + "model_id": "bfuzzy1/Gunny", + "name": "Gunny", + "developer": "bfuzzy1", + "scores": { + "IFEval": 0.7129, + "BBH": 0.4546, + "MATH Level 5": 0.173, + "GPQA": 0.2785, + "MUSR": 0.3583, + "MMLU-PRO": 0.3039 + } + }, + { + "model_id": "bfuzzy1/acheron", + "name": "acheron", + "developer": "bfuzzy1", + "scores": { + "IFEval": 0.1983, + "BBH": 0.3108, + "MATH Level 5": 0.0166, + "GPQA": 0.2391, + "MUSR": 0.3511, + "MMLU-PRO": 0.1096 + } + }, + { + "model_id": "bfuzzy1/acheron-c", + "name": "acheron-c", + "developer": "bfuzzy1", + "scores": { + "IFEval": 0.1929, + "BBH": 0.3026, + "MATH Level 5": 0.003, + "GPQA": 0.2475, + "MUSR": 0.3382, + "MMLU-PRO": 0.1172 + } + }, + { + "model_id": "bfuzzy1/acheron-d", + "name": "acheron-d", + "developer": "bfuzzy1", + "scores": { + "IFEval": 0.1925, + "BBH": 0.314, + "MATH Level 5": 0.0151, + "GPQA": 0.2366, + "MUSR": 0.3497, + "MMLU-PRO": 0.1134 + } + }, + { + "model_id": "bfuzzy1/acheron-m", + "name": "acheron-m", + "developer": "bfuzzy1", + "scores": { + "IFEval": 0.1758, + "BBH": 0.2928, + "MATH Level 5": 0.0091, + "GPQA": 0.2601, + "MUSR": 0.3487, + "MMLU-PRO": 0.1113 + } + }, + { + "model_id": "bfuzzy1/acheron-m1a-llama", + "name": "acheron-m1a-llama", + "developer": "bfuzzy1", + "scores": { + "IFEval": 0.1125, + "BBH": 0.2956, + "MATH Level 5": 0.0076, + "GPQA": 0.2601, + "MUSR": 0.3633, + "MMLU-PRO": 0.1146 + } + }, + { + "model_id": "bfuzzy1/llambses-1", + "name": "llambses-1", + "developer": "bfuzzy1", + "scores": { + "IFEval": 0.3554, + "BBH": 0.5047, + "MATH Level 5": 0.0687, + "GPQA": 0.2978, + "MUSR": 0.4529, + "MMLU-PRO": 0.314 + } + }, + { + "model_id": "bhuvneshsaini/merged_model", + "name": "merged_model", + "developer": "bhuvneshsaini", + "scores": { + "IFEval": 0.1813, + "BBH": 0.336, + "MATH Level 5": 0.0, + "GPQA": 0.25, + "MUSR": 0.3497, + "MMLU-PRO": 0.1445 + } + }, + { + "model_id": "bigcode/starcoder2-15b", + "name": "starcoder2-15b", + "developer": "bigcode", + "scores": { + "IFEval": 0.278, + "BBH": 0.4448, + "MATH Level 5": 0.0597, + "GPQA": 0.2735, + "MUSR": 0.3501, + "MMLU-PRO": 0.2353 + } + }, + { + "model_id": "bigcode/starcoder2-3b", + "name": "starcoder2-3b", + "developer": "bigcode", + "scores": { + "IFEval": 0.2037, + "BBH": 0.3509, + "MATH Level 5": 0.0151, + "GPQA": 0.2441, + "MUSR": 0.3435, + "MMLU-PRO": 0.1636 + } + }, + { + "model_id": "bigcode/starcoder2-7b", + "name": "starcoder2-7b", + "developer": "bigcode", + "scores": { + "IFEval": 0.2209, + "BBH": 0.3661, + "MATH Level 5": 0.031, + "GPQA": 0.2517, + "MUSR": 0.3793, + "MMLU-PRO": 0.1642 + } + }, + { + "model_id": "bigscience/bloom-1b1", + "name": "bloom-1b1", + "developer": "bigscience", + "scores": { + "IFEval": 0.1373, + "BBH": 0.3107, + "MATH Level 5": 0.0053, + "GPQA": 0.2592, + "MUSR": 0.37, + "MMLU-PRO": 0.1108 + } + }, + { + "model_id": "bigscience/bloom-1b7", + "name": "bloom-1b7", + "developer": "bigscience", + "scores": { + "IFEval": 0.1044, + "BBH": 0.3141, + "MATH Level 5": 0.0053, + "GPQA": 0.2584, + "MUSR": 0.3886, + "MMLU-PRO": 0.1086 + } + }, + { + "model_id": "bigscience/bloom-3b", + "name": "bloom-3b", + "developer": "bigscience", + "scores": { + "IFEval": 0.1271, + "BBH": 0.3063, + "MATH Level 5": 0.0083, + "GPQA": 0.2399, + "MUSR": 0.3981, + "MMLU-PRO": 0.1133 + } + }, + { + "model_id": "bigscience/bloom-560m", + "name": "bloom-560m", + "developer": "bigscience", + "scores": { + "IFEval": 0.062, + "BBH": 0.3026, + "MATH Level 5": 0.0038, + "GPQA": 0.2617, + "MUSR": 0.4031, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "bigscience/bloom-7b1", + "name": "bloom-7b1", + "developer": "bigscience", + "scores": { + "IFEval": 0.1322, + "BBH": 0.3114, + "MATH Level 5": 0.0053, + "GPQA": 0.2643, + "MUSR": 0.3487, + "MMLU-PRO": 0.1105 + } + }, + { + "model_id": "bluuwhale/L3-SthenoMaid-8B-V1", + "name": "L3-SthenoMaid-8B-V1", + "developer": "bluuwhale", + "scores": { + "IFEval": 0.7345, + "BBH": 0.5219, + "MATH Level 5": 0.108, + "GPQA": 0.2802, + "MUSR": 0.3687, + "MMLU-PRO": 0.3656 + } + }, + { + "model_id": "bond005/meno-tiny-0.1", + "name": "meno-tiny-0.1", + "developer": "bond005", + "scores": { + "IFEval": 0.455, + "BBH": 0.4263, + "MATH Level 5": 0.139, + "GPQA": 0.2819, + "MUSR": 0.4185, + "MMLU-PRO": 0.2786 + } + }, + { + "model_id": "bosonai/Higgs-Llama-3-70B", + "name": "Higgs-Llama-3-70B", + "developer": "bosonai", + "scores": { + "IFEval": 0.5561, + "BBH": 0.6258, + "MATH Level 5": 0.2523, + "GPQA": 0.3666, + "MUSR": 0.4471, + "MMLU-PRO": 0.4902 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-1.5B-Blunt", + "name": "DeepSeek-R1-Distill-Qwen-1.5B-Blunt", + "developer": "braindao", + "scores": { + "IFEval": 0.2611, + "BBH": 0.2774, + "MATH Level 5": 0.1382, + "GPQA": 0.2475, + "MUSR": 0.3595, + "MMLU-PRO": 0.1184 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-1.5B-Reflective", + "name": "DeepSeek-R1-Distill-Qwen-1.5B-Reflective", + "developer": "braindao", + "scores": { + "IFEval": 0.3033, + "BBH": 0.2908, + "MATH Level 5": 0.1631, + "GPQA": 0.2609, + "MUSR": 0.3356, + "MMLU-PRO": 0.113 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B", + "name": "DeepSeek-R1-Distill-Qwen-14B", + "developer": "braindao", + "scores": { + "IFEval": 0.4172, + "BBH": 0.3033, + "MATH Level 5": 0.176, + "GPQA": 0.2802, + "MUSR": 0.4488, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B-ABUB-ST", + "name": "DeepSeek-R1-Distill-Qwen-14B-ABUB-ST", + "developer": "braindao", + "scores": { + "IFEval": 0.3752, + "BBH": 0.4927, + "MATH Level 5": 0.5015, + "GPQA": 0.3448, + "MUSR": 0.4221, + "MMLU-PRO": 0.4243 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B-Blunt", + "name": "DeepSeek-R1-Distill-Qwen-14B-Blunt", + "developer": "braindao", + "scores": { + "IFEval": 0.5612, + "BBH": 0.3283, + "MATH Level 5": 0.1639, + "GPQA": 0.3029, + "MUSR": 0.4554, + "MMLU-PRO": 0.1447 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored", + "name": "DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored", + "developer": "braindao", + "scores": { + "IFEval": 0.5422, + "BBH": 0.317, + "MATH Level 5": 0.1631, + "GPQA": 0.2827, + "MUSR": 0.4487, + "MMLU-PRO": 0.1431 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored-Blunt", + "name": "DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored-Blunt", + "developer": "braindao", + "scores": { + "IFEval": 0.5221, + "BBH": 0.3199, + "MATH Level 5": 0.2508, + "GPQA": 0.2785, + "MUSR": 0.4527, + "MMLU-PRO": 0.1484 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored-Blunt-Reflective", + "name": "DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored-Blunt-Reflective", + "developer": "braindao", + "scores": { + "IFEval": 0.554, + "BBH": 0.3371, + "MATH Level 5": 0.2372, + "GPQA": 0.2777, + "MUSR": 0.4248, + "MMLU-PRO": 0.1504 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored-Reflective", + "name": "DeepSeek-R1-Distill-Qwen-14B-Blunt-Uncensored-Reflective", + "developer": "braindao", + "scores": { + "IFEval": 0.5139, + "BBH": 0.3013, + "MATH Level 5": 0.1473, + "GPQA": 0.2878, + "MUSR": 0.4433, + "MMLU-PRO": 0.1289 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-14B-Reflective", + "name": "DeepSeek-R1-Distill-Qwen-14B-Reflective", + "developer": "braindao", + "scores": { + "IFEval": 0.429, + "BBH": 0.3012, + "MATH Level 5": 0.1918, + "GPQA": 0.2727, + "MUSR": 0.4554, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-7B", + "name": "DeepSeek-R1-Distill-Qwen-7B", + "developer": "braindao", + "scores": { + "IFEval": 0.3968, + "BBH": 0.2887, + "MATH Level 5": 0.1918, + "GPQA": 0.2617, + "MUSR": 0.3767, + "MMLU-PRO": 0.1141 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-7B-Blunt", + "name": "DeepSeek-R1-Distill-Qwen-7B-Blunt", + "developer": "braindao", + "scores": { + "IFEval": 0.4266, + "BBH": 0.2902, + "MATH Level 5": 0.2145, + "GPQA": 0.271, + "MUSR": 0.3885, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-7B-ORPO-Uncensored", + "name": "DeepSeek-R1-Distill-Qwen-7B-ORPO-Uncensored", + "developer": "braindao", + "scores": { + "IFEval": 0.3655, + "BBH": 0.2958, + "MATH Level 5": 0.1737, + "GPQA": 0.2534, + "MUSR": 0.3846, + "MMLU-PRO": 0.1133 + } + }, + { + "model_id": "braindao/DeepSeek-R1-Distill-Qwen-7B-Reflective", + "name": "DeepSeek-R1-Distill-Qwen-7B-Reflective", + "developer": "braindao", + "scores": { + "IFEval": 0.3922, + "BBH": 0.2907, + "MATH Level 5": 0.2024, + "GPQA": 0.2542, + "MUSR": 0.39, + "MMLU-PRO": 0.1155 + } + }, + { + "model_id": "braindao/Qwen2.5-14B", + "name": "Qwen2.5-14B", + "developer": "braindao", + "scores": { + "IFEval": 0.5409, + "BBH": 0.5853, + "MATH Level 5": 0.2923, + "GPQA": 0.3733, + "MUSR": 0.4124, + "MMLU-PRO": 0.4884 + } + }, + { + "model_id": "braindao/Qwen2.5-14B-Instruct", + "name": "Qwen2.5-14B-Instruct", + "developer": "braindao", + "scores": { + "IFEval": 0.8143, + "BBH": 0.6404, + "MATH Level 5": 0.5529, + "GPQA": 0.3289, + "MUSR": 0.414, + "MMLU-PRO": 0.4889 + } + }, + { + "model_id": "braindao/iq-code-evmind-0.5b", + "name": "iq-code-evmind-0.5b", + "developer": "braindao", + "scores": { + "IFEval": 0.3216, + "BBH": 0.3164, + "MATH Level 5": 0.0242, + "GPQA": 0.2416, + "MUSR": 0.3304, + "MMLU-PRO": 0.1189 + } + }, + { + "model_id": "brgx53/3Bgeneral-ECE-PRYMMAL-Martial", + "name": "3Bgeneral-ECE-PRYMMAL-Martial", + "developer": "brgx53", + "scores": { + "IFEval": 0.3289, + "BBH": 0.5458, + "MATH Level 5": 0.1314, + "GPQA": 0.3247, + "MUSR": 0.4373, + "MMLU-PRO": 0.3934 + } + }, + { + "model_id": "brgx53/3Bgeneralv2-ECE-PRYMMAL-Martial", + "name": "3Bgeneralv2-ECE-PRYMMAL-Martial", + "developer": "brgx53", + "scores": { + "IFEval": 0.5677, + "BBH": 0.5607, + "MATH Level 5": 0.3497, + "GPQA": 0.3112, + "MUSR": 0.4356, + "MMLU-PRO": 0.4505 + } + }, + { + "model_id": "brgx53/3Blareneg-ECE-PRYMMAL-Martial", + "name": "3Blareneg-ECE-PRYMMAL-Martial", + "developer": "brgx53", + "scores": { + "IFEval": 0.2876, + "BBH": 0.5358, + "MATH Level 5": 0.1208, + "GPQA": 0.3347, + "MUSR": 0.4429, + "MMLU-PRO": 0.4016 + } + }, + { + "model_id": "brgx53/3Blarenegv2-ECE-PRYMMAL-Martial", + "name": "3Blarenegv2-ECE-PRYMMAL-Martial", + "developer": "brgx53", + "scores": { + "IFEval": 0.5662, + "BBH": 0.5607, + "MATH Level 5": 0.3497, + "GPQA": 0.3112, + "MUSR": 0.4356, + "MMLU-PRO": 0.4505 + } + }, + { + "model_id": "brgx53/Barracuda-PRYMMAL-ECE-TW3", + "name": "Barracuda-PRYMMAL-ECE-TW3", + "developer": "brgx53", + "scores": { + "IFEval": 0.164, + "BBH": 0.3002, + "MATH Level 5": 0.0023, + "GPQA": 0.2534, + "MUSR": 0.3609, + "MMLU-PRO": 0.1093 + } + }, + { + "model_id": "brgx53/LaConfiance-PRYMMAL-ECE-TW3", + "name": "LaConfiance-PRYMMAL-ECE-TW3", + "developer": "brgx53", + "scores": { + "IFEval": 0.1579, + "BBH": 0.2962, + "MATH Level 5": 0.0, + "GPQA": 0.2517, + "MUSR": 0.3846, + "MMLU-PRO": 0.1146 + } + }, + { + "model_id": "bunnycore/Best-Mix-Llama-3.1-8B", + "name": "Best-Mix-Llama-3.1-8B", + "developer": "bunnycore", + "scores": { + "IFEval": 0.2067, + "BBH": 0.3432, + "MATH Level 5": 0.2054, + "GPQA": 0.2651, + "MUSR": 0.2929, + "MMLU-PRO": 0.1565 + } + }, + { + "model_id": "bunnycore/Blabbertron-1.0", + "name": "Blabbertron-1.0", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7433, + "BBH": 0.5497, + "MATH Level 5": 0.4924, + "GPQA": 0.302, + "MUSR": 0.4337, + "MMLU-PRO": 0.4354 + } + }, + { + "model_id": "bunnycore/Blabbertron-1.1", + "name": "Blabbertron-1.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7265, + "BBH": 0.5534, + "MATH Level 5": 0.4804, + "GPQA": 0.3029, + "MUSR": 0.4416, + "MMLU-PRO": 0.4431 + } + }, + { + "model_id": "bunnycore/CyberCore-Qwen-2.1-7B", + "name": "CyberCore-Qwen-2.1-7B", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5766, + "BBH": 0.5572, + "MATH Level 5": 0.3588, + "GPQA": 0.3079, + "MUSR": 0.4145, + "MMLU-PRO": 0.4445 + } + }, + { + "model_id": "bunnycore/DeepQwen-3B-LCoT-SCE", + "name": "DeepQwen-3B-LCoT-SCE", + "developer": "bunnycore", + "scores": { + "IFEval": 0.449, + "BBH": 0.4512, + "MATH Level 5": 0.247, + "GPQA": 0.2626, + "MUSR": 0.3514, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "bunnycore/DeepSeek-R1-Distill-Qwen-7B-RRP-Ex", + "name": "DeepSeek-R1-Distill-Qwen-7B-RRP-Ex", + "developer": "bunnycore", + "scores": { + "IFEval": 0.3901, + "BBH": 0.3494, + "MATH Level 5": 0.1654, + "GPQA": 0.2785, + "MUSR": 0.3663, + "MMLU-PRO": 0.2508 + } + }, + { + "model_id": "bunnycore/DeepThinker-7B-Sce-v1", + "name": "DeepThinker-7B-Sce-v1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1218, + "BBH": 0.3018, + "MATH Level 5": 0.0098, + "GPQA": 0.2517, + "MUSR": 0.4194, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "bunnycore/DeepThinker-7B-Sce-v2", + "name": "DeepThinker-7B-Sce-v2", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1631, + "BBH": 0.3057, + "MATH Level 5": 0.0113, + "GPQA": 0.2584, + "MUSR": 0.4101, + "MMLU-PRO": 0.1146 + } + }, + { + "model_id": "bunnycore/FuseCyberMix-Qwen-2.5-7B-Instruct", + "name": "FuseCyberMix-Qwen-2.5-7B-Instruct", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7019, + "BBH": 0.5518, + "MATH Level 5": 0.4841, + "GPQA": 0.297, + "MUSR": 0.402, + "MMLU-PRO": 0.4337 + } + }, + { + "model_id": "bunnycore/FuseQwQen-7B", + "name": "FuseQwQen-7B", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7275, + "BBH": 0.5504, + "MATH Level 5": 0.4366, + "GPQA": 0.2945, + "MUSR": 0.4217, + "MMLU-PRO": 0.4407 + } + }, + { + "model_id": "bunnycore/FwF-Qwen-7B-0.1", + "name": "FwF-Qwen-7B-0.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.3005, + "BBH": 0.5019, + "MATH Level 5": 0.2764, + "GPQA": 0.271, + "MUSR": 0.3952, + "MMLU-PRO": 0.4061 + } + }, + { + "model_id": "bunnycore/FwF-Qwen-7B-0.2", + "name": "FwF-Qwen-7B-0.2", + "developer": "bunnycore", + "scores": { + "IFEval": 0.4479, + "BBH": 0.5596, + "MATH Level 5": 0.426, + "GPQA": 0.2903, + "MUSR": 0.4218, + "MMLU-PRO": 0.4382 + } + }, + { + "model_id": "bunnycore/Gemma-2-2B-Smart", + "name": "Gemma-2-2B-Smart", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1321, + "BBH": 0.3974, + "MATH Level 5": 0.0332, + "GPQA": 0.2827, + "MUSR": 0.4249, + "MMLU-PRO": 0.2426 + } + }, + { + "model_id": "bunnycore/Gemma2-9B-TitanFusion", + "name": "Gemma2-9B-TitanFusion", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1618, + "BBH": 0.5712, + "MATH Level 5": 0.077, + "GPQA": 0.3322, + "MUSR": 0.4136, + "MMLU-PRO": 0.396 + } + }, + { + "model_id": "bunnycore/HyperLlama-3.1-8B", + "name": "HyperLlama-3.1-8B", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7883, + "BBH": 0.5103, + "MATH Level 5": 0.1828, + "GPQA": 0.2869, + "MUSR": 0.3829, + "MMLU-PRO": 0.3783 + } + }, + { + "model_id": "bunnycore/Llama-3.1-8B-TitanFusion-Mix", + "name": "Llama-3.1-8B-TitanFusion-Mix", + "developer": "bunnycore", + "scores": { + "IFEval": 0.4925, + "BBH": 0.5756, + "MATH Level 5": 0.1284, + "GPQA": 0.2953, + "MUSR": 0.4317, + "MMLU-PRO": 0.3695 + } + }, + { + "model_id": "bunnycore/Llama-3.1-8B-TitanFusion-v3", + "name": "Llama-3.1-8B-TitanFusion-v3", + "developer": "bunnycore", + "scores": { + "IFEval": 0.481, + "BBH": 0.5262, + "MATH Level 5": 0.142, + "GPQA": 0.3087, + "MUSR": 0.4302, + "MMLU-PRO": 0.3806 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-All-Mix", + "name": "Llama-3.2-3B-All-Mix", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7226, + "BBH": 0.4508, + "MATH Level 5": 0.1503, + "GPQA": 0.2626, + "MUSR": 0.3287, + "MMLU-PRO": 0.316 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-Bespoke-Thought", + "name": "Llama-3.2-3B-Bespoke-Thought", + "developer": "bunnycore", + "scores": { + "IFEval": 0.4113, + "BBH": 0.4522, + "MATH Level 5": 0.1647, + "GPQA": 0.2659, + "MUSR": 0.3302, + "MMLU-PRO": 0.311 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-Booval", + "name": "Llama-3.2-3B-Booval", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6669, + "BBH": 0.4514, + "MATH Level 5": 0.1269, + "GPQA": 0.2668, + "MUSR": 0.3394, + "MMLU-PRO": 0.3058 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-Deep-Test", + "name": "Llama-3.2-3B-Deep-Test", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1775, + "BBH": 0.295, + "MATH Level 5": 0.0, + "GPQA": 0.2517, + "MUSR": 0.3647, + "MMLU-PRO": 0.1049 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-Della", + "name": "Llama-3.2-3B-Della", + "developer": "bunnycore", + "scores": { + "IFEval": 0.3561, + "BBH": 0.3683, + "MATH Level 5": 0.0302, + "GPQA": 0.276, + "MUSR": 0.3902, + "MMLU-PRO": 0.2128 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-Long-Think", + "name": "Llama-3.2-3B-Long-Think", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5473, + "BBH": 0.461, + "MATH Level 5": 0.1458, + "GPQA": 0.2609, + "MUSR": 0.3396, + "MMLU-PRO": 0.3048 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-Mix-Skill", + "name": "Llama-3.2-3B-Mix-Skill", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6404, + "BBH": 0.4582, + "MATH Level 5": 0.1473, + "GPQA": 0.2617, + "MUSR": 0.3396, + "MMLU-PRO": 0.3121 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-ProdigyPlus", + "name": "Llama-3.2-3B-ProdigyPlus", + "developer": "bunnycore", + "scores": { + "IFEval": 0.4015, + "BBH": 0.4392, + "MATH Level 5": 0.1156, + "GPQA": 0.2685, + "MUSR": 0.358, + "MMLU-PRO": 0.2817 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-ProdigyPlusPlus", + "name": "Llama-3.2-3B-ProdigyPlusPlus", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1645, + "BBH": 0.369, + "MATH Level 5": 0.0453, + "GPQA": 0.2534, + "MUSR": 0.3541, + "MMLU-PRO": 0.15 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-RP-DeepThink", + "name": "Llama-3.2-3B-RP-DeepThink", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7144, + "BBH": 0.4563, + "MATH Level 5": 0.1609, + "GPQA": 0.2659, + "MUSR": 0.3302, + "MMLU-PRO": 0.3242 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-RRStock", + "name": "Llama-3.2-3B-RRStock", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6657, + "BBH": 0.4568, + "MATH Level 5": 0.1699, + "GPQA": 0.2659, + "MUSR": 0.3314, + "MMLU-PRO": 0.3236 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3B-ToxicKod", + "name": "Llama-3.2-3B-ToxicKod", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6319, + "BBH": 0.4525, + "MATH Level 5": 0.1699, + "GPQA": 0.2659, + "MUSR": 0.3475, + "MMLU-PRO": 0.288 + } + }, + { + "model_id": "bunnycore/Llama-3.2-3b-RP-Toxic-Fuse", + "name": "Llama-3.2-3b-RP-Toxic-Fuse", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6834, + "BBH": 0.465, + "MATH Level 5": 0.2402, + "GPQA": 0.2777, + "MUSR": 0.3954, + "MMLU-PRO": 0.3106 + } + }, + { + "model_id": "bunnycore/Maestro-S1k-7B-Sce", + "name": "Maestro-S1k-7B-Sce", + "developer": "bunnycore", + "scores": { + "IFEval": 0.2523, + "BBH": 0.3104, + "MATH Level 5": 0.0279, + "GPQA": 0.2609, + "MUSR": 0.3768, + "MMLU-PRO": 0.117 + } + }, + { + "model_id": "bunnycore/Phi-3.5-mini-TitanFusion-0.1", + "name": "Phi-3.5-mini-TitanFusion-0.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5228, + "BBH": 0.5374, + "MATH Level 5": 0.1186, + "GPQA": 0.3314, + "MUSR": 0.4453, + "MMLU-PRO": 0.3807 + } + }, + { + "model_id": "bunnycore/Phi-4-Model-Stock", + "name": "Phi-4-Model-Stock", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6879, + "BBH": 0.689, + "MATH Level 5": 0.4298, + "GPQA": 0.3549, + "MUSR": 0.4441, + "MMLU-PRO": 0.5368 + } + }, + { + "model_id": "bunnycore/Phi-4-Model-Stock-v2", + "name": "Phi-4-Model-Stock-v2", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6375, + "BBH": 0.6825, + "MATH Level 5": 0.3754, + "GPQA": 0.349, + "MUSR": 0.4662, + "MMLU-PRO": 0.5331 + } + }, + { + "model_id": "bunnycore/Phi-4-Model-Stock-v3", + "name": "Phi-4-Model-Stock-v3", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5912, + "BBH": 0.6726, + "MATH Level 5": 0.4902, + "GPQA": 0.2894, + "MUSR": 0.4166, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "bunnycore/Phi-4-Model-Stock-v4", + "name": "Phi-4-Model-Stock-v4", + "developer": "bunnycore", + "scores": { + "IFEval": 0.711, + "BBH": 0.6924, + "MATH Level 5": 0.3829, + "GPQA": 0.3691, + "MUSR": 0.4611, + "MMLU-PRO": 0.5394 + } + }, + { + "model_id": "bunnycore/Phi-4-RP-v0", + "name": "Phi-4-RP-v0", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6827, + "BBH": 0.6856, + "MATH Level 5": 0.3316, + "GPQA": 0.3523, + "MUSR": 0.4141, + "MMLU-PRO": 0.5364 + } + }, + { + "model_id": "bunnycore/Phi-4-RR-Shoup", + "name": "Phi-4-RR-Shoup", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6587, + "BBH": 0.6947, + "MATH Level 5": 0.4992, + "GPQA": 0.3372, + "MUSR": 0.444, + "MMLU-PRO": 0.5429 + } + }, + { + "model_id": "bunnycore/Phi-4-RStock-v0.1", + "name": "Phi-4-RStock-v0.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7019, + "BBH": 0.6928, + "MATH Level 5": 0.395, + "GPQA": 0.3649, + "MUSR": 0.4584, + "MMLU-PRO": 0.5401 + } + }, + { + "model_id": "bunnycore/Phi-4-ReasoningRP", + "name": "Phi-4-ReasoningRP", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6736, + "BBH": 0.6922, + "MATH Level 5": 0.4569, + "GPQA": 0.344, + "MUSR": 0.4491, + "MMLU-PRO": 0.5421 + } + }, + { + "model_id": "bunnycore/Phi-4-Sce-exp-v0.1", + "name": "Phi-4-Sce-exp-v0.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6595, + "BBH": 0.6943, + "MATH Level 5": 0.503, + "GPQA": 0.3356, + "MUSR": 0.4441, + "MMLU-PRO": 0.5423 + } + }, + { + "model_id": "bunnycore/Phi-4-Stock-Ex", + "name": "Phi-4-Stock-Ex", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6575, + "BBH": 0.6864, + "MATH Level 5": 0.4086, + "GPQA": 0.3507, + "MUSR": 0.4624, + "MMLU-PRO": 0.5375 + } + }, + { + "model_id": "bunnycore/Phi-4-Stock-RP", + "name": "Phi-4-Stock-RP", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6399, + "BBH": 0.686, + "MATH Level 5": 0.3414, + "GPQA": 0.3582, + "MUSR": 0.4715, + "MMLU-PRO": 0.5317 + } + }, + { + "model_id": "bunnycore/Phi-4-Trim-Exp1", + "name": "Phi-4-Trim-Exp1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1219, + "BBH": 0.2852, + "MATH Level 5": 0.0053, + "GPQA": 0.255, + "MUSR": 0.4177, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "bunnycore/Phi-Seek-4-Sce-V1", + "name": "Phi-Seek-4-Sce-V1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.2935, + "BBH": 0.6459, + "MATH Level 5": 0.2145, + "GPQA": 0.276, + "MUSR": 0.3982, + "MMLU-PRO": 0.5123 + } + }, + { + "model_id": "bunnycore/Qandora-2.5-7B-Creative", + "name": "Qandora-2.5-7B-Creative", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6803, + "BBH": 0.5542, + "MATH Level 5": 0.3059, + "GPQA": 0.3104, + "MUSR": 0.4212, + "MMLU-PRO": 0.448 + } + }, + { + "model_id": "bunnycore/QandoraExp-7B", + "name": "QandoraExp-7B", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7509, + "BBH": 0.5478, + "MATH Level 5": 0.4743, + "GPQA": 0.3104, + "MUSR": 0.4312, + "MMLU-PRO": 0.441 + } + }, + { + "model_id": "bunnycore/QandoraExp-7B-Persona", + "name": "QandoraExp-7B-Persona", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6247, + "BBH": 0.5558, + "MATH Level 5": 0.3104, + "GPQA": 0.3146, + "MUSR": 0.4372, + "MMLU-PRO": 0.4407 + } + }, + { + "model_id": "bunnycore/QandoraExp-7B-v2", + "name": "QandoraExp-7B-v2", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5607, + "BBH": 0.5445, + "MATH Level 5": 0.4713, + "GPQA": 0.3029, + "MUSR": 0.4045, + "MMLU-PRO": 0.3909 + } + }, + { + "model_id": "bunnycore/QwQen-3B-LCoT", + "name": "QwQen-3B-LCoT", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6025, + "BBH": 0.4899, + "MATH Level 5": 0.3618, + "GPQA": 0.2668, + "MUSR": 0.4178, + "MMLU-PRO": 0.3699 + } + }, + { + "model_id": "bunnycore/QwQen-3B-LCoT-R1", + "name": "QwQen-3B-LCoT-R1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5342, + "BBH": 0.4799, + "MATH Level 5": 0.3353, + "GPQA": 0.2617, + "MUSR": 0.4138, + "MMLU-PRO": 0.3723 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7B-Deep-Sky-T1", + "name": "Qwen-2.5-7B-Deep-Sky-T1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.4208, + "BBH": 0.414, + "MATH Level 5": 0.0551, + "GPQA": 0.281, + "MUSR": 0.4018, + "MMLU-PRO": 0.2104 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7B-Deep-Stock-v1", + "name": "Qwen-2.5-7B-Deep-Stock-v1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5695, + "BBH": 0.5361, + "MATH Level 5": 0.2644, + "GPQA": 0.2777, + "MUSR": 0.4109, + "MMLU-PRO": 0.4066 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7B-Deep-Stock-v4", + "name": "Qwen-2.5-7B-Deep-Stock-v4", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7753, + "BBH": 0.5453, + "MATH Level 5": 0.4894, + "GPQA": 0.3003, + "MUSR": 0.4127, + "MMLU-PRO": 0.4342 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7B-Deep-Stock-v5", + "name": "Qwen-2.5-7B-Deep-Stock-v5", + "developer": "bunnycore", + "scores": { + "IFEval": 0.4509, + "BBH": 0.4672, + "MATH Level 5": 0.1473, + "GPQA": 0.2701, + "MUSR": 0.3648, + "MMLU-PRO": 0.2832 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7B-Exp-Sce", + "name": "Qwen-2.5-7B-Exp-Sce", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7652, + "BBH": 0.5506, + "MATH Level 5": 0.3255, + "GPQA": 0.2987, + "MUSR": 0.443, + "MMLU-PRO": 0.4259 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7B-R1-Stock", + "name": "Qwen-2.5-7B-R1-Stock", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7573, + "BBH": 0.5393, + "MATH Level 5": 0.5008, + "GPQA": 0.2995, + "MUSR": 0.3994, + "MMLU-PRO": 0.4294 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7B-Stock-Deep-Bespoke", + "name": "Qwen-2.5-7B-Stock-Deep-Bespoke", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5206, + "BBH": 0.492, + "MATH Level 5": 0.1888, + "GPQA": 0.281, + "MUSR": 0.4068, + "MMLU-PRO": 0.358 + } + }, + { + "model_id": "bunnycore/Qwen-2.5-7b-S1k", + "name": "Qwen-2.5-7b-S1k", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7162, + "BBH": 0.5563, + "MATH Level 5": 0.4781, + "GPQA": 0.2844, + "MUSR": 0.4071, + "MMLU-PRO": 0.4382 + } + }, + { + "model_id": "bunnycore/Qwen2.5-1.5B-Model-Stock", + "name": "Qwen2.5-1.5B-Model-Stock", + "developer": "bunnycore", + "scores": { + "IFEval": 0.1829, + "BBH": 0.2874, + "MATH Level 5": 0.0, + "GPQA": 0.2592, + "MUSR": 0.3674, + "MMLU-PRO": 0.11 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-Model-Stock", + "name": "Qwen2.5-3B-Model-Stock", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6381, + "BBH": 0.4712, + "MATH Level 5": 0.3799, + "GPQA": 0.2886, + "MUSR": 0.3942, + "MMLU-PRO": 0.325 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-Model-Stock-v2", + "name": "Qwen2.5-3B-Model-Stock-v2", + "developer": "bunnycore", + "scores": { + "IFEval": 0.649, + "BBH": 0.4677, + "MATH Level 5": 0.3867, + "GPQA": 0.2869, + "MUSR": 0.3915, + "MMLU-PRO": 0.327 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-Model-Stock-v3.1", + "name": "Qwen2.5-3B-Model-Stock-v3.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6481, + "BBH": 0.4737, + "MATH Level 5": 0.3897, + "GPQA": 0.2844, + "MUSR": 0.3968, + "MMLU-PRO": 0.329 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-Model-Stock-v3.2", + "name": "Qwen2.5-3B-Model-Stock-v3.2", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6353, + "BBH": 0.4727, + "MATH Level 5": 0.3754, + "GPQA": 0.2836, + "MUSR": 0.3928, + "MMLU-PRO": 0.3294 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-Model-Stock-v4.1", + "name": "Qwen2.5-3B-Model-Stock-v4.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6381, + "BBH": 0.482, + "MATH Level 5": 0.3769, + "GPQA": 0.2794, + "MUSR": 0.3941, + "MMLU-PRO": 0.3387 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-RP-Mix", + "name": "Qwen2.5-3B-RP-Mix", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5721, + "BBH": 0.4894, + "MATH Level 5": 0.2153, + "GPQA": 0.2735, + "MUSR": 0.4284, + "MMLU-PRO": 0.3728 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-RP-Thinker", + "name": "Qwen2.5-3B-RP-Thinker", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5894, + "BBH": 0.4164, + "MATH Level 5": 0.3353, + "GPQA": 0.2643, + "MUSR": 0.3287, + "MMLU-PRO": 0.315 + } + }, + { + "model_id": "bunnycore/Qwen2.5-3B-RP-Thinker-V2", + "name": "Qwen2.5-3B-RP-Thinker-V2", + "developer": "bunnycore", + "scores": { + "IFEval": 0.642, + "BBH": 0.4678, + "MATH Level 5": 0.3829, + "GPQA": 0.2852, + "MUSR": 0.3981, + "MMLU-PRO": 0.3271 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-CyberRombos", + "name": "Qwen2.5-7B-CyberRombos", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7518, + "BBH": 0.5465, + "MATH Level 5": 0.4962, + "GPQA": 0.3045, + "MUSR": 0.4125, + "MMLU-PRO": 0.4391 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-Fuse-Exp", + "name": "Qwen2.5-7B-Fuse-Exp", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5469, + "BBH": 0.5109, + "MATH Level 5": 0.3142, + "GPQA": 0.276, + "MUSR": 0.4573, + "MMLU-PRO": 0.3309 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-Instruct-Fusion", + "name": "Qwen2.5-7B-Instruct-Fusion", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6962, + "BBH": 0.5492, + "MATH Level 5": 0.3406, + "GPQA": 0.3045, + "MUSR": 0.4297, + "MMLU-PRO": 0.4467 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-Instruct-Merge-Stock-v0.1", + "name": "Qwen2.5-7B-Instruct-Merge-Stock-v0.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7509, + "BBH": 0.5529, + "MATH Level 5": 0.4894, + "GPQA": 0.3037, + "MUSR": 0.4231, + "MMLU-PRO": 0.4383 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-MixStock-Sce-V0.3", + "name": "Qwen2.5-7B-MixStock-Sce-V0.3", + "developer": "bunnycore", + "scores": { + "IFEval": 0.212, + "BBH": 0.3479, + "MATH Level 5": 0.2576, + "GPQA": 0.2576, + "MUSR": 0.3714, + "MMLU-PRO": 0.1779 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-MixStock-V0.1", + "name": "Qwen2.5-7B-MixStock-V0.1", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7673, + "BBH": 0.5479, + "MATH Level 5": 0.3172, + "GPQA": 0.3003, + "MUSR": 0.4416, + "MMLU-PRO": 0.4256 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-R1-Bespoke-Stock", + "name": "Qwen2.5-7B-R1-Bespoke-Stock", + "developer": "bunnycore", + "scores": { + "IFEval": 0.3726, + "BBH": 0.4822, + "MATH Level 5": 0.2047, + "GPQA": 0.2785, + "MUSR": 0.3926, + "MMLU-PRO": 0.3472 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-R1-Bespoke-Task", + "name": "Qwen2.5-7B-R1-Bespoke-Task", + "developer": "bunnycore", + "scores": { + "IFEval": 0.3787, + "BBH": 0.415, + "MATH Level 5": 0.1782, + "GPQA": 0.2534, + "MUSR": 0.3569, + "MMLU-PRO": 0.2688 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-RRP-1M", + "name": "Qwen2.5-7B-RRP-1M", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7481, + "BBH": 0.5452, + "MATH Level 5": 0.3248, + "GPQA": 0.3029, + "MUSR": 0.4483, + "MMLU-PRO": 0.4266 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-RRP-1M-Thinker", + "name": "Qwen2.5-7B-RRP-1M-Thinker", + "developer": "bunnycore", + "scores": { + "IFEval": 0.2308, + "BBH": 0.3482, + "MATH Level 5": 0.2719, + "GPQA": 0.2576, + "MUSR": 0.3767, + "MMLU-PRO": 0.1769 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-RRP-ID", + "name": "Qwen2.5-7B-RRP-ID", + "developer": "bunnycore", + "scores": { + "IFEval": 0.7473, + "BBH": 0.548, + "MATH Level 5": 0.4864, + "GPQA": 0.2827, + "MUSR": 0.418, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "bunnycore/Qwen2.5-7B-Sky-R1-Mini", + "name": "Qwen2.5-7B-Sky-R1-Mini", + "developer": "bunnycore", + "scores": { + "IFEval": 0.2305, + "BBH": 0.3503, + "MATH Level 5": 0.0295, + "GPQA": 0.2894, + "MUSR": 0.3448, + "MMLU-PRO": 0.1253 + } + }, + { + "model_id": "bunnycore/QwenMosaic-7B", + "name": "QwenMosaic-7B", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5819, + "BBH": 0.5564, + "MATH Level 5": 0.4441, + "GPQA": 0.2609, + "MUSR": 0.4164, + "MMLU-PRO": 0.431 + } + }, + { + "model_id": "bunnycore/Smol-Llama-3.2-3B", + "name": "Smol-Llama-3.2-3B", + "developer": "bunnycore", + "scores": { + "IFEval": 0.6679, + "BBH": 0.4539, + "MATH Level 5": 0.1382, + "GPQA": 0.2768, + "MUSR": 0.346, + "MMLU-PRO": 0.3228 + } + }, + { + "model_id": "bunnycore/SmolLM2-1.7-Persona", + "name": "SmolLM2-1.7-Persona", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5465, + "BBH": 0.3623, + "MATH Level 5": 0.0566, + "GPQA": 0.2634, + "MUSR": 0.3341, + "MMLU-PRO": 0.1974 + } + }, + { + "model_id": "bunnycore/SmolLM2-1.7B-roleplay-lora", + "name": "SmolLM2-1.7B-roleplay-lora", + "developer": "bunnycore", + "scores": { + "IFEval": 0.5382, + "BBH": 0.361, + "MATH Level 5": 0.0529, + "GPQA": 0.2752, + "MUSR": 0.3395, + "MMLU-PRO": 0.1966 + } + }, + { + "model_id": "bunnycore/Tulu-3.1-8B-SuperNova", + "name": "Tulu-3.1-8B-SuperNova", + "developer": "bunnycore", + "scores": { + "IFEval": 0.8194, + "BBH": 0.5254, + "MATH Level 5": 0.2462, + "GPQA": 0.302, + "MUSR": 0.3935, + "MMLU-PRO": 0.3814 + } + }, + { + "model_id": "byroneverson/Mistral-Small-Instruct-2409-abliterated", + "name": "Mistral-Small-Instruct-2409-abliterated", + "developer": "byroneverson", + "scores": { + "IFEval": 0.6971, + "BBH": 0.5238, + "MATH Level 5": 0.2477, + "GPQA": 0.3331, + "MUSR": 0.3697, + "MMLU-PRO": 0.3923 + } + }, + { + "model_id": "byroneverson/Yi-1.5-9B-Chat-16K-abliterated", + "name": "Yi-1.5-9B-Chat-16K-abliterated", + "developer": "byroneverson", + "scores": { + "IFEval": 0.5528, + "BBH": 0.5282, + "MATH Level 5": 0.1412, + "GPQA": 0.3129, + "MUSR": 0.4734, + "MMLU-PRO": 0.3823 + } + }, + { + "model_id": "byroneverson/Yi-1.5-9B-Chat-abliterated", + "name": "Yi-1.5-9B-Chat-abliterated", + "developer": "byroneverson", + "scores": { + "IFEval": 0.5723, + "BBH": 0.5401, + "MATH Level 5": 0.1662, + "GPQA": 0.2919, + "MUSR": 0.4389, + "MMLU-PRO": 0.3715 + } + }, + { + "model_id": "c10x/Q-Pluse", + "name": "Q-Pluse", + "developer": "c10x", + "scores": { + "IFEval": 0.1123, + "BBH": 0.2875, + "MATH Level 5": 0.0, + "GPQA": 0.2466, + "MUSR": 0.3938, + "MMLU-PRO": 0.1135 + } + }, + { + "model_id": "c10x/longthinker", + "name": "longthinker", + "developer": "c10x", + "scores": { + "IFEval": 0.3609, + "BBH": 0.4927, + "MATH Level 5": 0.2319, + "GPQA": 0.2643, + "MUSR": 0.391, + "MMLU-PRO": 0.3527 + } + }, + { + "model_id": "carsenk/flippa-v6", + "name": "flippa-v6", + "developer": "carsenk", + "scores": { + "IFEval": 0.3439, + "BBH": 0.5047, + "MATH Level 5": 0.1405, + "GPQA": 0.2928, + "MUSR": 0.4089, + "MMLU-PRO": 0.3668 + } + }, + { + "model_id": "carsenk/phi3.5_mini_exp_825_uncensored", + "name": "phi3.5_mini_exp_825_uncensored", + "developer": "carsenk", + "scores": { + "IFEval": 0.1364, + "BBH": 0.2965, + "MATH Level 5": 0.0106, + "GPQA": 0.2492, + "MUSR": 0.3644, + "MMLU-PRO": 0.1175 + } + }, + { + "model_id": "cat-searcher/gemma-2-9b-it-sppo-iter-1", + "name": "gemma-2-9b-it-sppo-iter-1", + "developer": "cat-searcher", + "scores": { + "IFEval": 0.3015, + "BBH": 0.5972, + "MATH Level 5": 0.0831, + "GPQA": 0.3448, + "MUSR": 0.3927, + "MMLU-PRO": 0.3854 + } + }, + { + "model_id": "cat-searcher/gemma-2-9b-it-sppo-iter-1-evol-1", + "name": "gemma-2-9b-it-sppo-iter-1-evol-1", + "developer": "cat-searcher", + "scores": { + "IFEval": 0.2942, + "BBH": 0.5939, + "MATH Level 5": 0.0853, + "GPQA": 0.3406, + "MUSR": 0.3926, + "MMLU-PRO": 0.38 + } + }, + { + "model_id": "cckm/tinymistral_950m", + "name": "tinymistral_950m", + "developer": "cckm", + "scores": { + "IFEval": 0.2395, + "BBH": 0.2969, + "MATH Level 5": 0.0053, + "GPQA": 0.2601, + "MUSR": 0.3554, + "MMLU-PRO": 0.1096 + } + }, + { + "model_id": "cgato/TheSalt-L3-8b-v0.3.2", + "name": "TheSalt-L3-8b-v0.3.2", + "developer": "cgato", + "scores": { + "IFEval": 0.2705, + "BBH": 0.2968, + "MATH Level 5": 0.0476, + "GPQA": 0.2659, + "MUSR": 0.3896, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "chargoddard/prometheus-2-llama-3-8b", + "name": "prometheus-2-llama-3-8b", + "developer": "chargoddard", + "scores": { + "IFEval": 0.5289, + "BBH": 0.4931, + "MATH Level 5": 0.0823, + "GPQA": 0.2727, + "MUSR": 0.3396, + "MMLU-PRO": 0.3087 + } + }, + { + "model_id": "chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO", + "name": "Llama-3-Instruct-8B-SimPO-ExPO", + "developer": "chujiezheng", + "scores": { + "IFEval": 0.6434, + "BBH": 0.4765, + "MATH Level 5": 0.0702, + "GPQA": 0.2869, + "MUSR": 0.392, + "MMLU-PRO": 0.3401 + } + }, + { + "model_id": "chujiezheng/Mistral7B-PairRM-SPPO-ExPO", + "name": "Mistral7B-PairRM-SPPO-ExPO", + "developer": "chujiezheng", + "scores": { + "IFEval": 0.3673, + "BBH": 0.3882, + "MATH Level 5": 0.0181, + "GPQA": 0.2768, + "MUSR": 0.4055, + "MMLU-PRO": 0.2552 + } + }, + { + "model_id": "cjvt/GaMS-1B", + "name": "GaMS-1B", + "developer": "cjvt", + "scores": { + "IFEval": 0.1635, + "BBH": 0.3075, + "MATH Level 5": 0.0136, + "GPQA": 0.2584, + "MUSR": 0.3684, + "MMLU-PRO": 0.1149 + } + }, + { + "model_id": "cloudyu/Llama-3-70Bx2-MOE", + "name": "Llama-3-70Bx2-MOE", + "developer": "cloudyu", + "scores": { + "IFEval": 0.5482, + "BBH": 0.6636, + "MATH Level 5": 0.2175, + "GPQA": 0.3935, + "MUSR": 0.4812, + "MMLU-PRO": 0.5142 + } + }, + { + "model_id": "cloudyu/Llama-3.2-3Bx4", + "name": "Llama-3.2-3Bx4", + "developer": "cloudyu", + "scores": { + "IFEval": 0.5069, + "BBH": 0.4332, + "MATH Level 5": 0.1073, + "GPQA": 0.2777, + "MUSR": 0.3496, + "MMLU-PRO": 0.2985 + } + }, + { + "model_id": "cloudyu/Mixtral_11Bx2_MoE_19B", + "name": "Mixtral_11Bx2_MoE_19B", + "developer": "cloudyu", + "scores": { + "IFEval": 0.3851, + "BBH": 0.5209, + "MATH Level 5": 0.0672, + "GPQA": 0.2903, + "MUSR": 0.4297, + "MMLU-PRO": 0.3311 + } + }, + { + "model_id": "cloudyu/Mixtral_34Bx2_MoE_60B", + "name": "Mixtral_34Bx2_MoE_60B", + "developer": "cloudyu", + "scores": { + "IFEval": 0.4538, + "BBH": 0.587, + "MATH Level 5": 0.077, + "GPQA": 0.3381, + "MUSR": 0.4625, + "MMLU-PRO": 0.4766 + } + }, + { + "model_id": "cloudyu/Mixtral_7Bx2_MoE", + "name": "Mixtral_7Bx2_MoE", + "developer": "cloudyu", + "scores": { + "IFEval": 0.448, + "BBH": 0.516, + "MATH Level 5": 0.0687, + "GPQA": 0.3054, + "MUSR": 0.4473, + "MMLU-PRO": 0.3044 + } + }, + { + "model_id": "cloudyu/S1-Llama-3.2-3Bx4-MoE", + "name": "S1-Llama-3.2-3Bx4-MoE", + "developer": "cloudyu", + "scores": { + "IFEval": 0.5302, + "BBH": 0.4358, + "MATH Level 5": 0.1201, + "GPQA": 0.2936, + "MUSR": 0.3456, + "MMLU-PRO": 0.3044 + } + }, + { + "model_id": "cloudyu/Yi-34Bx2-MoE-60B-DPO", + "name": "Yi-34Bx2-MoE-60B-DPO", + "developer": "cloudyu", + "scores": { + "IFEval": 0.5319, + "BBH": 0.5168, + "MATH Level 5": 0.0702, + "GPQA": 0.3221, + "MUSR": 0.4375, + "MMLU-PRO": 0.4677 + } + }, + { + "model_id": "cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-ipo", + "name": "Llama-3.1-8B-paraphrase-type-generation-apty-ipo", + "developer": "cluebbers", + "scores": { + "IFEval": 0.1327, + "BBH": 0.38, + "MATH Level 5": 0.0249, + "GPQA": 0.2634, + "MUSR": 0.4332, + "MMLU-PRO": 0.2591 + } + }, + { + "model_id": "cluebbers/Llama-3.1-8B-paraphrase-type-generation-apty-sigmoid", + "name": "Llama-3.1-8B-paraphrase-type-generation-apty-sigmoid", + "developer": "cluebbers", + "scores": { + "IFEval": 0.1318, + "BBH": 0.3789, + "MATH Level 5": 0.0264, + "GPQA": 0.2685, + "MUSR": 0.4306, + "MMLU-PRO": 0.2562 + } + }, + { + "model_id": "cluebbers/Llama-3.1-8B-paraphrase-type-generation-etpc", + "name": "Llama-3.1-8B-paraphrase-type-generation-etpc", + "developer": "cluebbers", + "scores": { + "IFEval": 0.1209, + "BBH": 0.3781, + "MATH Level 5": 0.0196, + "GPQA": 0.2651, + "MUSR": 0.4319, + "MMLU-PRO": 0.2556 + } + }, + { + "model_id": "cognitivecomputations/Dolphin3.0-Llama3.1-8B", + "name": "Dolphin3.0-Llama3.1-8B", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.7621, + "BBH": 0.4916, + "MATH Level 5": 0.1231, + "GPQA": 0.2827, + "MUSR": 0.3653, + "MMLU-PRO": 0.2992 + } + }, + { + "model_id": "cognitivecomputations/Dolphin3.0-Llama3.2-1B", + "name": "Dolphin3.0-Llama3.2-1B", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.5428, + "BBH": 0.3122, + "MATH Level 5": 0.0279, + "GPQA": 0.2299, + "MUSR": 0.3249, + "MMLU-PRO": 0.1375 + } + }, + { + "model_id": "cognitivecomputations/Dolphin3.0-Qwen2.5-0.5B", + "name": "Dolphin3.0-Qwen2.5-0.5B", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.4697, + "BBH": 0.3114, + "MATH Level 5": 0.0514, + "GPQA": 0.2349, + "MUSR": 0.3555, + "MMLU-PRO": 0.1413 + } + }, + { + "model_id": "cognitivecomputations/Dolphin3.0-R1-Mistral-24B", + "name": "Dolphin3.0-R1-Mistral-24B", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.4068, + "BBH": 0.536, + "MATH Level 5": 0.3119, + "GPQA": 0.2945, + "MUSR": 0.3952, + "MMLU-PRO": 0.3005 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9-llama3-8b", + "name": "dolphin-2.9-llama3-8b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.385, + "BBH": 0.495, + "MATH Level 5": 0.0574, + "GPQA": 0.2869, + "MUSR": 0.4375, + "MMLU-PRO": 0.2771 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.1-llama-3-70b", + "name": "dolphin-2.9.1-llama-3-70b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.376, + "BBH": 0.5205, + "MATH Level 5": 0.182, + "GPQA": 0.3087, + "MUSR": 0.4976, + "MMLU-PRO": 0.413 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.1-yi-1.5-34b", + "name": "dolphin-2.9.1-yi-1.5-34b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.3853, + "BBH": 0.6076, + "MATH Level 5": 0.1866, + "GPQA": 0.3431, + "MUSR": 0.4598, + "MMLU-PRO": 0.4519 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.1-yi-1.5-9b", + "name": "dolphin-2.9.1-yi-1.5-9b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.4465, + "BBH": 0.5484, + "MATH Level 5": 0.1518, + "GPQA": 0.3381, + "MUSR": 0.4348, + "MMLU-PRO": 0.3967 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.2-Phi-3-Medium", + "name": "dolphin-2.9.2-Phi-3-Medium", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.4248, + "BBH": 0.6457, + "MATH Level 5": 0.1828, + "GPQA": 0.3272, + "MUSR": 0.4191, + "MMLU-PRO": 0.4555 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.2-Phi-3-Medium-abliterated", + "name": "dolphin-2.9.2-Phi-3-Medium-abliterated", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.3613, + "BBH": 0.6123, + "MATH Level 5": 0.1239, + "GPQA": 0.328, + "MUSR": 0.4112, + "MMLU-PRO": 0.4494 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b", + "name": "dolphin-2.9.2-qwen2-72b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.6344, + "BBH": 0.6296, + "MATH Level 5": 0.2802, + "GPQA": 0.37, + "MUSR": 0.4521, + "MMLU-PRO": 0.5471 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.2-qwen2-7b", + "name": "dolphin-2.9.2-qwen2-7b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.3535, + "BBH": 0.4894, + "MATH Level 5": 0.1344, + "GPQA": 0.2903, + "MUSR": 0.4191, + "MMLU-PRO": 0.4051 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.3-Yi-1.5-34B-32k", + "name": "dolphin-2.9.3-Yi-1.5-34B-32k", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.3639, + "BBH": 0.6047, + "MATH Level 5": 0.1669, + "GPQA": 0.3431, + "MUSR": 0.4311, + "MMLU-PRO": 0.463 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.3-mistral-7B-32k", + "name": "dolphin-2.9.3-mistral-7B-32k", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.4126, + "BBH": 0.4813, + "MATH Level 5": 0.0506, + "GPQA": 0.2852, + "MUSR": 0.4643, + "MMLU-PRO": 0.2821 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.3-mistral-nemo-12b", + "name": "dolphin-2.9.3-mistral-nemo-12b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.5601, + "BBH": 0.548, + "MATH Level 5": 0.074, + "GPQA": 0.3154, + "MUSR": 0.443, + "MMLU-PRO": 0.3377 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.4-gemma2-2b", + "name": "dolphin-2.9.4-gemma2-2b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.0896, + "BBH": 0.4081, + "MATH Level 5": 0.0491, + "GPQA": 0.2844, + "MUSR": 0.418, + "MMLU-PRO": 0.2105 + } + }, + { + "model_id": "cognitivecomputations/dolphin-2.9.4-llama3.1-8b", + "name": "dolphin-2.9.4-llama3.1-8b", + "developer": "cognitivecomputations", + "scores": { + "IFEval": 0.2757, + "BBH": 0.3524, + "MATH Level 5": 0.0121, + "GPQA": 0.2634, + "MUSR": 0.3236, + "MMLU-PRO": 0.1237 + } + }, + { + "model_id": "collaiborateorg/Collaiborator-MEDLLM-Llama-3-8B-v2", + "name": "Collaiborator-MEDLLM-Llama-3-8B-v2", + "developer": "collaiborateorg", + "scores": { + "IFEval": 0.3809, + "BBH": 0.4648, + "MATH Level 5": 0.0566, + "GPQA": 0.3331, + "MUSR": 0.3434, + "MMLU-PRO": 0.3481 + } + }, + { + "model_id": "cpayne1303/cp2024", + "name": "cp2024", + "developer": "cpayne1303", + "scores": { + "IFEval": 0.1658, + "BBH": 0.2985, + "MATH Level 5": 0.0053, + "GPQA": 0.2559, + "MUSR": 0.3383, + "MMLU-PRO": 0.1101 + } + }, + { + "model_id": "cpayne1303/cp2024-instruct", + "name": "cp2024-instruct", + "developer": "cpayne1303", + "scores": { + "IFEval": 0.1706, + "BBH": 0.2947, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3686, + "MMLU-PRO": 0.1167 + } + }, + { + "model_id": "cpayne1303/llama-43m-beta", + "name": "llama-43m-beta", + "developer": "cpayne1303", + "scores": { + "IFEval": 0.1949, + "BBH": 0.2965, + "MATH Level 5": 0.0045, + "GPQA": 0.2685, + "MUSR": 0.3885, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "cpayne1303/smallcp2024", + "name": "smallcp2024", + "developer": "cpayne1303", + "scores": { + "IFEval": 0.1582, + "BBH": 0.3027, + "MATH Level 5": 0.0053, + "GPQA": 0.2307, + "MUSR": 0.3425, + "MMLU-PRO": 0.1114 + } + }, + { + "model_id": "crestf411/MN-Slush", + "name": "MN-Slush", + "developer": "crestf411", + "scores": { + "IFEval": 0.4077, + "BBH": 0.534, + "MATH Level 5": 0.1269, + "GPQA": 0.3238, + "MUSR": 0.3933, + "MMLU-PRO": 0.3508 + } + }, + { + "model_id": "cstr/llama3.1-8b-spaetzle-v90", + "name": "llama3.1-8b-spaetzle-v90", + "developer": "cstr", + "scores": { + "IFEval": 0.7356, + "BBH": 0.5303, + "MATH Level 5": 0.1495, + "GPQA": 0.2827, + "MUSR": 0.4134, + "MMLU-PRO": 0.3731 + } + }, + { + "model_id": "cyberagent/calm3-22b-chat", + "name": "calm3-22b-chat", + "developer": "cyberagent", + "scores": { + "IFEval": 0.5091, + "BBH": 0.4992, + "MATH Level 5": 0.0695, + "GPQA": 0.2768, + "MUSR": 0.4553, + "MMLU-PRO": 0.295 + } + }, + { + "model_id": "darkc0de/BuddyGlassNeverSleeps", + "name": "BuddyGlassNeverSleeps", + "developer": "darkc0de", + "scores": { + "IFEval": 0.4239, + "BBH": 0.4977, + "MATH Level 5": 0.0627, + "GPQA": 0.2945, + "MUSR": 0.3993, + "MMLU-PRO": 0.3452 + } + }, + { + "model_id": "darkc0de/BuddyGlassUncensored2025.2", + "name": "BuddyGlassUncensored2025.2", + "developer": "darkc0de", + "scores": { + "IFEval": 0.7731, + "BBH": 0.6095, + "MATH Level 5": 0.2402, + "GPQA": 0.328, + "MUSR": 0.4071, + "MMLU-PRO": 0.4336 + } + }, + { + "model_id": "darkc0de/BuddyGlass_v0.3_Xortron7MethedUpSwitchedUp", + "name": "BuddyGlass_v0.3_Xortron7MethedUpSwitchedUp", + "developer": "darkc0de", + "scores": { + "IFEval": 0.4358, + "BBH": 0.5243, + "MATH Level 5": 0.1284, + "GPQA": 0.2987, + "MUSR": 0.4143, + "MMLU-PRO": 0.3673 + } + }, + { + "model_id": "databricks/dbrx-base", + "name": "dbrx-base", + "developer": "databricks", + "scores": { + "IFEval": 0.0821, + "BBH": 0.5196, + "MATH Level 5": 0.1, + "GPQA": 0.3267, + "MUSR": 0.4067, + "MMLU-PRO": 0.35 + } + }, + { + "model_id": "databricks/dbrx-instruct", + "name": "DBRX Instruct", + "developer": "databricks", + "scores": { + "IFEval": 0.5416, + "BBH": 0.5429, + "MATH Level 5": 0.0687, + "GPQA": 0.3414, + "MUSR": 0.4269, + "MMLU-PRO": 0.3683 + } + }, + { + "model_id": "databricks/dolly-v1-6b", + "name": "dolly-v1-6b", + "developer": "databricks", + "scores": { + "IFEval": 0.2224, + "BBH": 0.3172, + "MATH Level 5": 0.0189, + "GPQA": 0.2643, + "MUSR": 0.4004, + "MMLU-PRO": 0.1266 + } + }, + { + "model_id": "databricks/dolly-v2-12b", + "name": "dolly-v2-12b", + "developer": "databricks", + "scores": { + "IFEval": 0.2355, + "BBH": 0.332, + "MATH Level 5": 0.0136, + "GPQA": 0.2408, + "MUSR": 0.3739, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "databricks/dolly-v2-3b", + "name": "dolly-v2-3b", + "developer": "databricks", + "scores": { + "IFEval": 0.2247, + "BBH": 0.3079, + "MATH Level 5": 0.0151, + "GPQA": 0.2609, + "MUSR": 0.3338, + "MMLU-PRO": 0.1145 + } + }, + { + "model_id": "databricks/dolly-v2-7b", + "name": "dolly-v2-7b", + "developer": "databricks", + "scores": { + "IFEval": 0.201, + "BBH": 0.3173, + "MATH Level 5": 0.0144, + "GPQA": 0.2685, + "MUSR": 0.3553, + "MMLU-PRO": 0.1149 + } + }, + { + "model_id": "davidkim205/Rhea-72b-v0.5", + "name": "Rhea-72b-v0.5", + "developer": "davidkim205", + "scores": { + "IFEval": 0.0145, + "BBH": 0.3078, + "MATH Level 5": 0.1737, + "GPQA": 0.2525, + "MUSR": 0.4241, + "MMLU-PRO": 0.1166 + } + }, + { + "model_id": "davidkim205/nox-solar-10.7b-v4", + "name": "nox-solar-10.7b-v4", + "developer": "davidkim205", + "scores": { + "IFEval": 0.3753, + "BBH": 0.4814, + "MATH Level 5": 0.0083, + "GPQA": 0.307, + "MUSR": 0.4298, + "MMLU-PRO": 0.3333 + } + }, + { + "model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "DeepSeek-R1-Distill-Llama-70B", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.4336, + "BBH": 0.5635, + "MATH Level 5": 0.3074, + "GPQA": 0.2651, + "MUSR": 0.4342, + "MMLU-PRO": 0.4748 + } + }, + { + "model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "name": "DeepSeek-R1-Distill-Llama-8B", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.3782, + "BBH": 0.3239, + "MATH Level 5": 0.2198, + "GPQA": 0.255, + "MUSR": 0.325, + "MMLU-PRO": 0.2089 + } + }, + { + "model_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", + "name": "DeepSeek-R1-Distill-Qwen-1.5B", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.3463, + "BBH": 0.3241, + "MATH Level 5": 0.1692, + "GPQA": 0.2559, + "MUSR": 0.3635, + "MMLU-PRO": 0.1187 + } + }, + { + "model_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "DeepSeek-R1-Distill-Qwen-14B", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.4382, + "BBH": 0.5906, + "MATH Level 5": 0.5702, + "GPQA": 0.3876, + "MUSR": 0.5366, + "MMLU-PRO": 0.4667 + } + }, + { + "model_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "DeepSeek-R1-Distill-Qwen-32B", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.4186, + "BBH": 0.4197, + "MATH Level 5": 0.1707, + "GPQA": 0.2844, + "MUSR": 0.4526, + "MMLU-PRO": 0.4687 + } + }, + { + "model_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "DeepSeek-R1-Distill-Qwen-7B", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.4038, + "BBH": 0.3443, + "MATH Level 5": 0.1956, + "GPQA": 0.2794, + "MUSR": 0.3663, + "MMLU-PRO": 0.2321 + } + }, + { + "model_id": "deepseek-ai/deepseek-llm-67b-chat", + "name": "DeepSeek LLM Chat 67B", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.5587, + "BBH": 0.5243, + "MATH Level 5": 0.0929, + "GPQA": 0.3163, + "MUSR": 0.5059, + "MMLU-PRO": 0.3944 + } + }, + { + "model_id": "deepseek-ai/deepseek-llm-7b-base", + "name": "deepseek-llm-7b-base", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.2179, + "BBH": 0.3503, + "MATH Level 5": 0.0196, + "GPQA": 0.2735, + "MUSR": 0.3738, + "MMLU-PRO": 0.1806 + } + }, + { + "model_id": "deepseek-ai/deepseek-llm-7b-chat", + "name": "deepseek-llm-7b-chat", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.4171, + "BBH": 0.3632, + "MATH Level 5": 0.0204, + "GPQA": 0.2659, + "MUSR": 0.4668, + "MMLU-PRO": 0.2133 + } + }, + { + "model_id": "deepseek-ai/deepseek-moe-16b-base", + "name": "deepseek-moe-16b-base", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.245, + "BBH": 0.3409, + "MATH Level 5": 0.0242, + "GPQA": 0.2542, + "MUSR": 0.3658, + "MMLU-PRO": 0.1505 + } + }, + { + "model_id": "deepseek-ai/deepseek-moe-16b-chat", + "name": "deepseek-moe-16b-chat", + "developer": "deepseek-ai", + "scores": { + "IFEval": 0.3663, + "BBH": 0.3275, + "MATH Level 5": 0.0257, + "GPQA": 0.2248, + "MUSR": 0.3808, + "MMLU-PRO": 0.1964 + } + }, + { + "model_id": "dfurman/CalmeRys-78B-Orpo-v0.1", + "name": "CalmeRys-78B-Orpo-v0.1", + "developer": "dfurman", + "scores": { + "IFEval": 0.8163, + "BBH": 0.7262, + "MATH Level 5": 0.4063, + "GPQA": 0.4002, + "MUSR": 0.5902, + "MMLU-PRO": 0.7012 + } + }, + { + "model_id": "dfurman/Llama-3-70B-Orpo-v0.1", + "name": "Llama-3-70B-Orpo-v0.1", + "developer": "dfurman", + "scores": { + "IFEval": 0.2049, + "BBH": 0.4655, + "MATH Level 5": 0.1579, + "GPQA": 0.2576, + "MUSR": 0.4534, + "MMLU-PRO": 0.3893 + } + }, + { + "model_id": "dfurman/Llama-3-8B-Orpo-v0.1", + "name": "Llama-3-8B-Orpo-v0.1", + "developer": "dfurman", + "scores": { + "IFEval": 0.3, + "BBH": 0.3853, + "MATH Level 5": 0.0415, + "GPQA": 0.2617, + "MUSR": 0.3579, + "MMLU-PRO": 0.2281 + } + }, + { + "model_id": "dfurman/Qwen2-72B-Orpo-v0.1", + "name": "Qwen2-72B-Orpo-v0.1", + "developer": "dfurman", + "scores": { + "IFEval": 0.788, + "BBH": 0.6969, + "MATH Level 5": 0.4056, + "GPQA": 0.3842, + "MUSR": 0.4784, + "MMLU-PRO": 0.5455 + } + }, + { + "model_id": "dicta-il/dictalm2.0", + "name": "dictalm2.0", + "developer": "dicta-il", + "scores": { + "IFEval": 0.2413, + "BBH": 0.4018, + "MATH Level 5": 0.0181, + "GPQA": 0.2919, + "MUSR": 0.382, + "MMLU-PRO": 0.2605 + } + }, + { + "model_id": "dicta-il/dictalm2.0-instruct", + "name": "dictalm2.0-instruct", + "developer": "dicta-il", + "scores": { + "IFEval": 0.4412, + "BBH": 0.4256, + "MATH Level 5": 0.0227, + "GPQA": 0.3029, + "MUSR": 0.3946, + "MMLU-PRO": 0.2605 + } + }, + { + "model_id": "distilbert/distilgpt2", + "name": "distilgpt2", + "developer": "distilbert", + "scores": { + "IFEval": 0.0611, + "BBH": 0.3038, + "MATH Level 5": 0.006, + "GPQA": 0.2592, + "MUSR": 0.4207, + "MMLU-PRO": 0.1187 + } + }, + { + "model_id": "divyanshukunwar/SASTRI_1_9B", + "name": "SASTRI_1_9B", + "developer": "divyanshukunwar", + "scores": { + "IFEval": 0.4207, + "BBH": 0.468, + "MATH Level 5": 0.1156, + "GPQA": 0.3213, + "MUSR": 0.3831, + "MMLU-PRO": 0.3187 + } + }, + { + "model_id": "djuna-test-lab/TEST-L3.2-ReWish-3B", + "name": "TEST-L3.2-ReWish-3B", + "developer": "djuna-test-lab", + "scores": { + "IFEval": 0.6368, + "BBH": 0.4495, + "MATH Level 5": 0.1367, + "GPQA": 0.2836, + "MUSR": 0.3777, + "MMLU-PRO": 0.3126 + } + }, + { + "model_id": "djuna-test-lab/TEST-L3.2-ReWish-3B-ties-w-base", + "name": "TEST-L3.2-ReWish-3B-ties-w-base", + "developer": "djuna-test-lab", + "scores": { + "IFEval": 0.6353, + "BBH": 0.4495, + "MATH Level 5": 0.1367, + "GPQA": 0.2836, + "MUSR": 0.3777, + "MMLU-PRO": 0.3126 + } + }, + { + "model_id": "djuna/G2-BigGSHT-27B-2", + "name": "G2-BigGSHT-27B-2", + "developer": "djuna", + "scores": { + "IFEval": 0.7974, + "BBH": 0.6415, + "MATH Level 5": 0.2349, + "GPQA": 0.3633, + "MUSR": 0.4072, + "MMLU-PRO": 0.4528 + } + }, + { + "model_id": "djuna/G2-GSHT", + "name": "G2-GSHT", + "developer": "djuna", + "scores": { + "IFEval": 0.563, + "BBH": 0.527, + "MATH Level 5": 0.1926, + "GPQA": 0.3255, + "MUSR": 0.4006, + "MMLU-PRO": 0.307 + } + }, + { + "model_id": "djuna/Gemma-2-gemmama-9b", + "name": "Gemma-2-gemmama-9b", + "developer": "djuna", + "scores": { + "IFEval": 0.7703, + "BBH": 0.542, + "MATH Level 5": 0.1926, + "GPQA": 0.3356, + "MUSR": 0.4031, + "MMLU-PRO": 0.3109 + } + }, + { + "model_id": "djuna/L3.1-ForStHS", + "name": "L3.1-ForStHS", + "developer": "djuna", + "scores": { + "IFEval": 0.7813, + "BBH": 0.5203, + "MATH Level 5": 0.1503, + "GPQA": 0.2911, + "MUSR": 0.4026, + "MMLU-PRO": 0.3735 + } + }, + { + "model_id": "djuna/L3.1-Promissum_Mane-8B-Della-1.5-calc", + "name": "L3.1-Promissum_Mane-8B-Della-1.5-calc", + "developer": "djuna", + "scores": { + "IFEval": 0.7235, + "BBH": 0.5433, + "MATH Level 5": 0.1639, + "GPQA": 0.3146, + "MUSR": 0.4253, + "MMLU-PRO": 0.3904 + } + }, + { + "model_id": "djuna/L3.1-Promissum_Mane-8B-Della-calc", + "name": "L3.1-Promissum_Mane-8B-Della-calc", + "developer": "djuna", + "scores": { + "IFEval": 0.5442, + "BBH": 0.5486, + "MATH Level 5": 0.1843, + "GPQA": 0.2995, + "MUSR": 0.423, + "MMLU-PRO": 0.3802 + } + }, + { + "model_id": "djuna/L3.1-Purosani-2-8B", + "name": "L3.1-Purosani-2-8B", + "developer": "djuna", + "scores": { + "IFEval": 0.4988, + "BBH": 0.5182, + "MATH Level 5": 0.1171, + "GPQA": 0.3012, + "MUSR": 0.3816, + "MMLU-PRO": 0.3752 + } + }, + { + "model_id": "djuna/L3.1-Suze-Vume-calc", + "name": "L3.1-Suze-Vume-calc", + "developer": "djuna", + "scores": { + "IFEval": 0.7297, + "BBH": 0.5164, + "MATH Level 5": 0.114, + "GPQA": 0.2819, + "MUSR": 0.3843, + "MMLU-PRO": 0.3515 + } + }, + { + "model_id": "djuna/MN-Chinofun", + "name": "MN-Chinofun", + "developer": "djuna", + "scores": { + "IFEval": 0.611, + "BBH": 0.4953, + "MATH Level 5": 0.1307, + "GPQA": 0.2961, + "MUSR": 0.4084, + "MMLU-PRO": 0.3603 + } + }, + { + "model_id": "djuna/MN-Chinofun-12B-2", + "name": "MN-Chinofun-12B-2", + "developer": "djuna", + "scores": { + "IFEval": 0.6171, + "BBH": 0.5037, + "MATH Level 5": 0.1307, + "GPQA": 0.3054, + "MUSR": 0.4268, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "djuna/MN-Chinofun-12B-3", + "name": "MN-Chinofun-12B-3", + "developer": "djuna", + "scores": { + "IFEval": 0.3053, + "BBH": 0.5348, + "MATH Level 5": 0.1005, + "GPQA": 0.2659, + "MUSR": 0.4198, + "MMLU-PRO": 0.3026 + } + }, + { + "model_id": "djuna/MN-Chinofun-12B-4", + "name": "MN-Chinofun-12B-4", + "developer": "djuna", + "scores": { + "IFEval": 0.5404, + "BBH": 0.5348, + "MATH Level 5": 0.1118, + "GPQA": 0.2953, + "MUSR": 0.4307, + "MMLU-PRO": 0.3497 + } + }, + { + "model_id": "djuna/Q2.5-Partron-7B", + "name": "Q2.5-Partron-7B", + "developer": "djuna", + "scores": { + "IFEval": 0.7321, + "BBH": 0.5418, + "MATH Level 5": 0.4826, + "GPQA": 0.2978, + "MUSR": 0.4165, + "MMLU-PRO": 0.4283 + } + }, + { + "model_id": "djuna/Q2.5-Veltha-14B", + "name": "Q2.5-Veltha-14B", + "developer": "djuna", + "scores": { + "IFEval": 0.8292, + "BBH": 0.6484, + "MATH Level 5": 0.4789, + "GPQA": 0.3591, + "MUSR": 0.4194, + "MMLU-PRO": 0.5298 + } + }, + { + "model_id": "djuna/Q2.5-Veltha-14B-0.5", + "name": "Q2.5-Veltha-14B-0.5", + "developer": "djuna", + "scores": { + "IFEval": 0.7796, + "BBH": 0.6523, + "MATH Level 5": 0.4373, + "GPQA": 0.3683, + "MUSR": 0.4339, + "MMLU-PRO": 0.5295 + } + }, + { + "model_id": "dnhkng/RYS-Llama-3-8B-Instruct", + "name": "RYS-Llama-3-8B-Instruct", + "developer": "dnhkng", + "scores": { + "IFEval": 0.6958, + "BBH": 0.4809, + "MATH Level 5": 0.0687, + "GPQA": 0.2576, + "MUSR": 0.3383, + "MMLU-PRO": 0.3557 + } + }, + { + "model_id": "dnhkng/RYS-Llama-3-Huge-Instruct", + "name": "RYS-Llama-3-Huge-Instruct", + "developer": "dnhkng", + "scores": { + "IFEval": 0.7686, + "BBH": 0.6481, + "MATH Level 5": 0.2289, + "GPQA": 0.2609, + "MUSR": 0.4208, + "MMLU-PRO": 0.511 + } + }, + { + "model_id": "dnhkng/RYS-Llama-3-Large-Instruct", + "name": "RYS-Llama-3-Large-Instruct", + "developer": "dnhkng", + "scores": { + "IFEval": 0.8051, + "BBH": 0.6525, + "MATH Level 5": 0.2304, + "GPQA": 0.2894, + "MUSR": 0.418, + "MMLU-PRO": 0.5137 + } + }, + { + "model_id": "dnhkng/RYS-Llama-3.1-8B-Instruct", + "name": "RYS-Llama-3.1-8B-Instruct", + "developer": "dnhkng", + "scores": { + "IFEval": 0.7685, + "BBH": 0.5164, + "MATH Level 5": 0.1329, + "GPQA": 0.2676, + "MUSR": 0.3681, + "MMLU-PRO": 0.3639 + } + }, + { + "model_id": "dnhkng/RYS-Llama3.1-Large", + "name": "RYS-Llama3.1-Large", + "developer": "dnhkng", + "scores": { + "IFEval": 0.8492, + "BBH": 0.6899, + "MATH Level 5": 0.3505, + "GPQA": 0.3742, + "MUSR": 0.4554, + "MMLU-PRO": 0.5249 + } + }, + { + "model_id": "dnhkng/RYS-Medium", + "name": "RYS-Medium", + "developer": "dnhkng", + "scores": { + "IFEval": 0.4406, + "BBH": 0.6285, + "MATH Level 5": 0.108, + "GPQA": 0.328, + "MUSR": 0.4069, + "MMLU-PRO": 0.4326 + } + }, + { + "model_id": "dnhkng/RYS-Phi-3-medium-4k-instruct", + "name": "RYS-Phi-3-medium-4k-instruct", + "developer": "dnhkng", + "scores": { + "IFEval": 0.4391, + "BBH": 0.6226, + "MATH Level 5": 0.1609, + "GPQA": 0.3549, + "MUSR": 0.4253, + "MMLU-PRO": 0.4846 + } + }, + { + "model_id": "dnhkng/RYS-XLarge", + "name": "RYS-XLarge", + "developer": "dnhkng", + "scores": { + "IFEval": 0.7996, + "BBH": 0.705, + "MATH Level 5": 0.4252, + "GPQA": 0.3842, + "MUSR": 0.497, + "MMLU-PRO": 0.5428 + } + }, + { + "model_id": "dnhkng/RYS-XLarge-base", + "name": "RYS-XLarge-base", + "developer": "dnhkng", + "scores": { + "IFEval": 0.791, + "BBH": 0.7047, + "MATH Level 5": 0.3792, + "GPQA": 0.3792, + "MUSR": 0.4903, + "MMLU-PRO": 0.5431 + } + }, + { + "model_id": "dnhkng/RYS-XLarge2", + "name": "RYS-XLarge2", + "developer": "dnhkng", + "scores": { + "IFEval": 0.4902, + "BBH": 0.6574, + "MATH Level 5": 0.2749, + "GPQA": 0.3742, + "MUSR": 0.4508, + "MMLU-PRO": 0.5378 + } + }, + { + "model_id": "dreamgen/WizardLM-2-7B", + "name": "WizardLM-2-7B", + "developer": "dreamgen", + "scores": { + "IFEval": 0.4583, + "BBH": 0.3487, + "MATH Level 5": 0.0332, + "GPQA": 0.2869, + "MUSR": 0.3941, + "MMLU-PRO": 0.266 + } + }, + { + "model_id": "dustinwloring1988/Reflexis-8b-chat-v1", + "name": "Reflexis-8b-chat-v1", + "developer": "dustinwloring1988", + "scores": { + "IFEval": 0.3658, + "BBH": 0.4664, + "MATH Level 5": 0.1156, + "GPQA": 0.2542, + "MUSR": 0.3754, + "MMLU-PRO": 0.3384 + } + }, + { + "model_id": "dustinwloring1988/Reflexis-8b-chat-v2", + "name": "Reflexis-8b-chat-v2", + "developer": "dustinwloring1988", + "scores": { + "IFEval": 0.3912, + "BBH": 0.4724, + "MATH Level 5": 0.1163, + "GPQA": 0.2701, + "MUSR": 0.3526, + "MMLU-PRO": 0.3378 + } + }, + { + "model_id": "dustinwloring1988/Reflexis-8b-chat-v3", + "name": "Reflexis-8b-chat-v3", + "developer": "dustinwloring1988", + "scores": { + "IFEval": 0.5367, + "BBH": 0.4658, + "MATH Level 5": 0.1224, + "GPQA": 0.2424, + "MUSR": 0.3512, + "MMLU-PRO": 0.3548 + } + }, + { + "model_id": "dustinwloring1988/Reflexis-8b-chat-v4", + "name": "Reflexis-8b-chat-v4", + "developer": "dustinwloring1988", + "scores": { + "IFEval": 0.4698, + "BBH": 0.4686, + "MATH Level 5": 0.1027, + "GPQA": 0.2341, + "MUSR": 0.3393, + "MMLU-PRO": 0.339 + } + }, + { + "model_id": "dustinwloring1988/Reflexis-8b-chat-v5", + "name": "Reflexis-8b-chat-v5", + "developer": "dustinwloring1988", + "scores": { + "IFEval": 0.4238, + "BBH": 0.4782, + "MATH Level 5": 0.1216, + "GPQA": 0.271, + "MUSR": 0.3354, + "MMLU-PRO": 0.3217 + } + }, + { + "model_id": "dustinwloring1988/Reflexis-8b-chat-v6", + "name": "Reflexis-8b-chat-v6", + "developer": "dustinwloring1988", + "scores": { + "IFEval": 0.4939, + "BBH": 0.481, + "MATH Level 5": 0.1299, + "GPQA": 0.2626, + "MUSR": 0.3753, + "MMLU-PRO": 0.3479 + } + }, + { + "model_id": "dustinwloring1988/Reflexis-8b-chat-v7", + "name": "Reflexis-8b-chat-v7", + "developer": "dustinwloring1988", + "scores": { + "IFEval": 0.398, + "BBH": 0.481, + "MATH Level 5": 0.1631, + "GPQA": 0.2617, + "MUSR": 0.3222, + "MMLU-PRO": 0.3643 + } + }, + { + "model_id": "duyhv1411/Llama-3.2-1B-en-vi", + "name": "Llama-3.2-1B-en-vi", + "developer": "duyhv1411", + "scores": { + "IFEval": 0.4788, + "BBH": 0.3291, + "MATH Level 5": 0.0287, + "GPQA": 0.2768, + "MUSR": 0.3197, + "MMLU-PRO": 0.1341 + } + }, + { + "model_id": "duyhv1411/Llama-3.2-3B-en-vi", + "name": "Llama-3.2-3B-en-vi", + "developer": "duyhv1411", + "scores": { + "IFEval": 0.4852, + "BBH": 0.3272, + "MATH Level 5": 0.0227, + "GPQA": 0.2752, + "MUSR": 0.321, + "MMLU-PRO": 0.1359 + } + }, + { + "model_id": "dwikitheduck/gemma-2-2b-id", + "name": "gemma-2-2b-id", + "developer": "dwikitheduck", + "scores": { + "IFEval": 0.3879, + "BBH": 0.3962, + "MATH Level 5": 0.0453, + "GPQA": 0.2995, + "MUSR": 0.4154, + "MMLU-PRO": 0.2173 + } + }, + { + "model_id": "dwikitheduck/gemma-2-2b-id-inst", + "name": "gemma-2-2b-id-inst", + "developer": "dwikitheduck", + "scores": { + "IFEval": 0.3879, + "BBH": 0.3962, + "MATH Level 5": 0.0453, + "GPQA": 0.2995, + "MUSR": 0.4154, + "MMLU-PRO": 0.2173 + } + }, + { + "model_id": "dwikitheduck/gemma-2-2b-id-instruct", + "name": "gemma-2-2b-id-instruct", + "developer": "dwikitheduck", + "scores": { + "IFEval": 0.3879, + "BBH": 0.3962, + "MATH Level 5": 0.0453, + "GPQA": 0.2995, + "MUSR": 0.4154, + "MMLU-PRO": 0.2173 + } + }, + { + "model_id": "dwikitheduck/gen-inst-1", + "name": "gen-inst-1", + "developer": "dwikitheduck", + "scores": { + "IFEval": 0.775, + "BBH": 0.642, + "MATH Level 5": 0.4554, + "GPQA": 0.3716, + "MUSR": 0.4205, + "MMLU-PRO": 0.5089 + } + }, + { + "model_id": "dwikitheduck/gen-try1", + "name": "gen-try1", + "developer": "dwikitheduck", + "scores": { + "IFEval": 0.7522, + "BBH": 0.6359, + "MATH Level 5": 0.4101, + "GPQA": 0.3414, + "MUSR": 0.4416, + "MMLU-PRO": 0.5111 + } + }, + { + "model_id": "dwikitheduck/gen-try1-notemp", + "name": "gen-try1-notemp", + "developer": "dwikitheduck", + "scores": { + "IFEval": 0.2627, + "BBH": 0.6263, + "MATH Level 5": 0.318, + "GPQA": 0.354, + "MUSR": 0.4714, + "MMLU-PRO": 0.521 + } + }, + { + "model_id": "dzakwan/dzakwan-MoE-4x7b-Beta", + "name": "dzakwan-MoE-4x7b-Beta", + "developer": "dzakwan", + "scores": { + "IFEval": 0.4443, + "BBH": 0.514, + "MATH Level 5": 0.0778, + "GPQA": 0.2861, + "MUSR": 0.4267, + "MMLU-PRO": 0.3108 + } + }, + { + "model_id": "ehristoforu/Falcon3-8B-Franken-Basestruct", + "name": "Falcon3-8B-Franken-Basestruct", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.1715, + "BBH": 0.5463, + "MATH Level 5": 0.0, + "GPQA": 0.3406, + "MUSR": 0.3555, + "MMLU-PRO": 0.3947 + } + }, + { + "model_id": "ehristoforu/Falcon3-MoE-2x7B-Insruct", + "name": "Falcon3-MoE-2x7B-Insruct", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7643, + "BBH": 0.5648, + "MATH Level 5": 0.4124, + "GPQA": 0.3121, + "MUSR": 0.484, + "MMLU-PRO": 0.4095 + } + }, + { + "model_id": "ehristoforu/Gemma2-9B-it-psy10k-mental_health", + "name": "Gemma2-9B-it-psy10k-mental_health", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.5887, + "BBH": 0.5539, + "MATH Level 5": 0.1631, + "GPQA": 0.3372, + "MUSR": 0.4086, + "MMLU-PRO": 0.3829 + } + }, + { + "model_id": "ehristoforu/Gemma2-9b-it-train6", + "name": "Gemma2-9b-it-train6", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7025, + "BBH": 0.5898, + "MATH Level 5": 0.1911, + "GPQA": 0.3289, + "MUSR": 0.4084, + "MMLU-PRO": 0.3942 + } + }, + { + "model_id": "ehristoforu/HappyLlama1", + "name": "HappyLlama1", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7363, + "BBH": 0.4996, + "MATH Level 5": 0.1427, + "GPQA": 0.2836, + "MUSR": 0.4287, + "MMLU-PRO": 0.3546 + } + }, + { + "model_id": "ehristoforu/QwenQwen2.5-7B-IT", + "name": "QwenQwen2.5-7B-IT", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7518, + "BBH": 0.5398, + "MATH Level 5": 0.5091, + "GPQA": 0.3037, + "MUSR": 0.4034, + "MMLU-PRO": 0.4289 + } + }, + { + "model_id": "ehristoforu/QwenQwen2.5-7B-IT-Dare", + "name": "QwenQwen2.5-7B-IT-Dare", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7509, + "BBH": 0.5398, + "MATH Level 5": 0.5091, + "GPQA": 0.3037, + "MUSR": 0.4034, + "MMLU-PRO": 0.4289 + } + }, + { + "model_id": "ehristoforu/RQwen-v0.1", + "name": "RQwen-v0.1", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7625, + "BBH": 0.6446, + "MATH Level 5": 0.4645, + "GPQA": 0.3255, + "MUSR": 0.4139, + "MMLU-PRO": 0.5202 + } + }, + { + "model_id": "ehristoforu/RQwen-v0.2", + "name": "RQwen-v0.2", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7504, + "BBH": 0.6427, + "MATH Level 5": 0.327, + "GPQA": 0.3372, + "MUSR": 0.4207, + "MMLU-PRO": 0.5159 + } + }, + { + "model_id": "ehristoforu/SoRu-0009", + "name": "SoRu-0009", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.2582, + "BBH": 0.315, + "MATH Level 5": 0.0211, + "GPQA": 0.2609, + "MUSR": 0.3369, + "MMLU-PRO": 0.1239 + } + }, + { + "model_id": "ehristoforu/coolqwen-3b-it", + "name": "coolqwen-3b-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.6473, + "BBH": 0.4851, + "MATH Level 5": 0.3671, + "GPQA": 0.2827, + "MUSR": 0.4125, + "MMLU-PRO": 0.3601 + } + }, + { + "model_id": "ehristoforu/della-70b-test-v1", + "name": "della-70b-test-v1", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.4979, + "BBH": 0.3029, + "MATH Level 5": 0.0098, + "GPQA": 0.2525, + "MUSR": 0.4555, + "MMLU-PRO": 0.1575 + } + }, + { + "model_id": "ehristoforu/falcon3-ultraset", + "name": "falcon3-ultraset", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7135, + "BBH": 0.5584, + "MATH Level 5": 0.2122, + "GPQA": 0.3322, + "MUSR": 0.4853, + "MMLU-PRO": 0.3982 + } + }, + { + "model_id": "ehristoforu/fd-lora-merged-16x32", + "name": "fd-lora-merged-16x32", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.3481, + "BBH": 0.3308, + "MATH Level 5": 0.1707, + "GPQA": 0.2534, + "MUSR": 0.3514, + "MMLU-PRO": 0.1205 + } + }, + { + "model_id": "ehristoforu/fd-lora-merged-64x128", + "name": "fd-lora-merged-64x128", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.3281, + "BBH": 0.3345, + "MATH Level 5": 0.1873, + "GPQA": 0.255, + "MUSR": 0.3368, + "MMLU-PRO": 0.1537 + } + }, + { + "model_id": "ehristoforu/fp4-14b-it-v1", + "name": "fp4-14b-it-v1", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.2535, + "BBH": 0.574, + "MATH Level 5": 0.0408, + "GPQA": 0.2953, + "MUSR": 0.3595, + "MMLU-PRO": 0.4205 + } + }, + { + "model_id": "ehristoforu/fp4-14b-v1-fix", + "name": "fp4-14b-v1-fix", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.6742, + "BBH": 0.6817, + "MATH Level 5": 0.4207, + "GPQA": 0.354, + "MUSR": 0.4532, + "MMLU-PRO": 0.5353 + } + }, + { + "model_id": "ehristoforu/fq2.5-7b-it-normalize_false", + "name": "fq2.5-7b-it-normalize_false", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7399, + "BBH": 0.552, + "MATH Level 5": 0.4622, + "GPQA": 0.302, + "MUSR": 0.4612, + "MMLU-PRO": 0.4413 + } + }, + { + "model_id": "ehristoforu/fq2.5-7b-it-normalize_true", + "name": "fq2.5-7b-it-normalize_true", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7399, + "BBH": 0.552, + "MATH Level 5": 0.4622, + "GPQA": 0.302, + "MUSR": 0.4612, + "MMLU-PRO": 0.4413 + } + }, + { + "model_id": "ehristoforu/frqwen2.5-from7b-duable4layers-it", + "name": "frqwen2.5-from7b-duable4layers-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7729, + "BBH": 0.5264, + "MATH Level 5": 0.4509, + "GPQA": 0.2953, + "MUSR": 0.4166, + "MMLU-PRO": 0.4126 + } + }, + { + "model_id": "ehristoforu/frqwen2.5-from7b-it", + "name": "frqwen2.5-from7b-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.6532, + "BBH": 0.5143, + "MATH Level 5": 0.2923, + "GPQA": 0.2903, + "MUSR": 0.4086, + "MMLU-PRO": 0.3977 + } + }, + { + "model_id": "ehristoforu/mllama-3.1-8b-instruct", + "name": "mllama-3.1-8b-instruct", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.3458, + "BBH": 0.4718, + "MATH Level 5": 0.3776, + "GPQA": 0.2701, + "MUSR": 0.338, + "MMLU-PRO": 0.2533 + } + }, + { + "model_id": "ehristoforu/mllama-3.1-8b-it", + "name": "mllama-3.1-8b-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.3879, + "BBH": 0.4868, + "MATH Level 5": 0.3799, + "GPQA": 0.2768, + "MUSR": 0.3349, + "MMLU-PRO": 0.2622 + } + }, + { + "model_id": "ehristoforu/moremerge", + "name": "moremerge", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.2019, + "BBH": 0.2868, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3566, + "MMLU-PRO": 0.1065 + } + }, + { + "model_id": "ehristoforu/moremerge-upscaled", + "name": "moremerge-upscaled", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.1979, + "BBH": 0.2698, + "MATH Level 5": 0.0, + "GPQA": 0.2466, + "MUSR": 0.3593, + "MMLU-PRO": 0.1041 + } + }, + { + "model_id": "ehristoforu/phi-4-25b", + "name": "phi-4-25b", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.6484, + "BBH": 0.6908, + "MATH Level 5": 0.4524, + "GPQA": 0.3188, + "MUSR": 0.4208, + "MMLU-PRO": 0.5351 + } + }, + { + "model_id": "ehristoforu/qwen2.5-test-32b-it", + "name": "qwen2.5-test-32b-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.7889, + "BBH": 0.7081, + "MATH Level 5": 0.5974, + "GPQA": 0.3641, + "MUSR": 0.4578, + "MMLU-PRO": 0.5765 + } + }, + { + "model_id": "ehristoforu/qwen2.5-with-lora-think-3b-it", + "name": "qwen2.5-with-lora-think-3b-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.5319, + "BBH": 0.4687, + "MATH Level 5": 0.2364, + "GPQA": 0.2802, + "MUSR": 0.431, + "MMLU-PRO": 0.3403 + } + }, + { + "model_id": "ehristoforu/rmoe-v1", + "name": "rmoe-v1", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.265, + "BBH": 0.2929, + "MATH Level 5": 0.0015, + "GPQA": 0.2584, + "MUSR": 0.3663, + "MMLU-PRO": 0.1125 + } + }, + { + "model_id": "ehristoforu/rufalcon3-3b-it", + "name": "rufalcon3-3b-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.5942, + "BBH": 0.4155, + "MATH Level 5": 0.1782, + "GPQA": 0.2727, + "MUSR": 0.3895, + "MMLU-PRO": 0.2348 + } + }, + { + "model_id": "ehristoforu/ruphi-4b", + "name": "ruphi-4b", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.1752, + "BBH": 0.2906, + "MATH Level 5": 0.0, + "GPQA": 0.2399, + "MUSR": 0.3512, + "MMLU-PRO": 0.1126 + } + }, + { + "model_id": "ehristoforu/testq-32b", + "name": "testq-32b", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.1876, + "BBH": 0.2877, + "MATH Level 5": 0.003, + "GPQA": 0.2542, + "MUSR": 0.3715, + "MMLU-PRO": 0.1166 + } + }, + { + "model_id": "ehristoforu/tmoe", + "name": "tmoe", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.1193, + "BBH": 0.3073, + "MATH Level 5": 0.0076, + "GPQA": 0.2232, + "MUSR": 0.3699, + "MMLU-PRO": 0.1191 + } + }, + { + "model_id": "ehristoforu/tmoe-v2", + "name": "tmoe-v2", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.1903, + "BBH": 0.2897, + "MATH Level 5": 0.0023, + "GPQA": 0.2634, + "MUSR": 0.4151, + "MMLU-PRO": 0.11 + } + }, + { + "model_id": "ehristoforu/trd-7b-it", + "name": "trd-7b-it", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.2185, + "BBH": 0.299, + "MATH Level 5": 0.0317, + "GPQA": 0.2701, + "MUSR": 0.3794, + "MMLU-PRO": 0.1179 + } + }, + { + "model_id": "ehristoforu/ud-14b", + "name": "ud-14b", + "developer": "ehristoforu", + "scores": { + "IFEval": 0.4235, + "BBH": 0.3324, + "MATH Level 5": 0.1903, + "GPQA": 0.2374, + "MUSR": 0.4394, + "MMLU-PRO": 0.2415 + } + }, + { + "model_id": "elinas/Chronos-Gold-12B-1.0", + "name": "Chronos-Gold-12B-1.0", + "developer": "elinas", + "scores": { + "IFEval": 0.3166, + "BBH": 0.5515, + "MATH Level 5": 0.0695, + "GPQA": 0.318, + "MUSR": 0.474, + "MMLU-PRO": 0.3518 + } + }, + { + "model_id": "ell44ot/gemma-2b-def", + "name": "gemma-2b-def", + "developer": "ell44ot", + "scores": { + "IFEval": 0.2693, + "BBH": 0.3159, + "MATH Level 5": 0.0242, + "GPQA": 0.2735, + "MUSR": 0.367, + "MMLU-PRO": 0.1572 + } + }, + { + "model_id": "euclaise/ReMask-3B", + "name": "ReMask-3B", + "developer": "euclaise", + "scores": { + "IFEval": 0.2419, + "BBH": 0.3517, + "MATH Level 5": 0.0196, + "GPQA": 0.2668, + "MUSR": 0.3341, + "MMLU-PRO": 0.1357 + } + }, + { + "model_id": "eworojoshua/vas-01", + "name": "vas-01", + "developer": "eworojoshua", + "scores": { + "IFEval": 0.7612, + "BBH": 0.5418, + "MATH Level 5": 0.4736, + "GPQA": 0.3096, + "MUSR": 0.4432, + "MMLU-PRO": 0.4348 + } + }, + { + "model_id": "ewre324/Thinker-Llama-3.2-3B-Instruct-Reasoning", + "name": "Thinker-Llama-3.2-3B-Instruct-Reasoning", + "developer": "ewre324", + "scores": { + "IFEval": 0.4439, + "BBH": 0.4273, + "MATH Level 5": 0.0846, + "GPQA": 0.2768, + "MUSR": 0.3655, + "MMLU-PRO": 0.2886 + } + }, + { + "model_id": "ewre324/Thinker-Qwen2.5-0.5B-Instruct-Reasoning", + "name": "Thinker-Qwen2.5-0.5B-Instruct-Reasoning", + "developer": "ewre324", + "scores": { + "IFEval": 0.2476, + "BBH": 0.3292, + "MATH Level 5": 0.0287, + "GPQA": 0.2852, + "MUSR": 0.3382, + "MMLU-PRO": 0.1647 + } + }, + { + "model_id": "ewre324/Thinker-SmolLM2-135M-Instruct-Reasoning", + "name": "Thinker-SmolLM2-135M-Instruct-Reasoning", + "developer": "ewre324", + "scores": { + "IFEval": 0.2584, + "BBH": 0.3071, + "MATH Level 5": 0.0091, + "GPQA": 0.2525, + "MUSR": 0.3661, + "MMLU-PRO": 0.1094 + } + }, + { + "model_id": "ewre324/ewre324-R1-SmolLM2-135M-Distill", + "name": "ewre324-R1-SmolLM2-135M-Distill", + "developer": "ewre324", + "scores": { + "IFEval": 0.1649, + "BBH": 0.3042, + "MATH Level 5": 0.0128, + "GPQA": 0.2617, + "MUSR": 0.3409, + "MMLU-PRO": 0.1134 + } + }, + { + "model_id": "experiment-llm/exp-3-q-r", + "name": "exp-3-q-r", + "developer": "experiment-llm", + "scores": { + "IFEval": 0.6036, + "BBH": 0.5397, + "MATH Level 5": 0.2787, + "GPQA": 0.2936, + "MUSR": 0.4315, + "MMLU-PRO": 0.4316 + } + }, + { + "model_id": "facebook/opt-1.3b", + "name": "opt-1.3b", + "developer": "facebook", + "scores": { + "IFEval": 0.2383, + "BBH": 0.3094, + "MATH Level 5": 0.0091, + "GPQA": 0.2424, + "MUSR": 0.342, + "MMLU-PRO": 0.1107 + } + }, + { + "model_id": "facebook/opt-30b", + "name": "opt-30b", + "developer": "facebook", + "scores": { + "IFEval": 0.2453, + "BBH": 0.307, + "MATH Level 5": 0.0106, + "GPQA": 0.2693, + "MUSR": 0.3604, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "failspy/Llama-3-8B-Instruct-MopeyMule", + "name": "Llama-3-8B-Instruct-MopeyMule", + "developer": "failspy", + "scores": { + "IFEval": 0.675, + "BBH": 0.3839, + "MATH Level 5": 0.0196, + "GPQA": 0.2391, + "MUSR": 0.3513, + "MMLU-PRO": 0.1764 + } + }, + { + "model_id": "failspy/Llama-3-8B-Instruct-abliterated", + "name": "Llama-3-8B-Instruct-abliterated", + "developer": "failspy", + "scores": { + "IFEval": 0.5909, + "BBH": 0.4354, + "MATH Level 5": 0.0385, + "GPQA": 0.276, + "MUSR": 0.4116, + "MMLU-PRO": 0.2742 + } + }, + { + "model_id": "failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5", + "name": "Meta-Llama-3-70B-Instruct-abliterated-v3.5", + "developer": "failspy", + "scores": { + "IFEval": 0.7747, + "BBH": 0.5747, + "MATH Level 5": 0.1284, + "GPQA": 0.297, + "MUSR": 0.3982, + "MMLU-PRO": 0.4452 + } + }, + { + "model_id": "failspy/Meta-Llama-3-8B-Instruct-abliterated-v3", + "name": "Meta-Llama-3-8B-Instruct-abliterated-v3", + "developer": "failspy", + "scores": { + "IFEval": 0.7245, + "BBH": 0.4925, + "MATH Level 5": 0.0959, + "GPQA": 0.2643, + "MUSR": 0.3622, + "MMLU-PRO": 0.3654 + } + }, + { + "model_id": "failspy/Phi-3-medium-4k-instruct-abliterated-v3", + "name": "Phi-3-medium-4k-instruct-abliterated-v3", + "developer": "failspy", + "scores": { + "IFEval": 0.6319, + "BBH": 0.6305, + "MATH Level 5": 0.1594, + "GPQA": 0.3171, + "MUSR": 0.4604, + "MMLU-PRO": 0.44 + } + }, + { + "model_id": "failspy/llama-3-70B-Instruct-abliterated", + "name": "llama-3-70B-Instruct-abliterated", + "developer": "failspy", + "scores": { + "IFEval": 0.8023, + "BBH": 0.6465, + "MATH Level 5": 0.2432, + "GPQA": 0.2894, + "MUSR": 0.4128, + "MMLU-PRO": 0.5145 + } + }, + { + "model_id": "fblgit/TheBeagle-v2beta-32B-MGS", + "name": "TheBeagle-v2beta-32B-MGS", + "developer": "fblgit", + "scores": { + "IFEval": 0.5181, + "BBH": 0.7033, + "MATH Level 5": 0.4947, + "GPQA": 0.3826, + "MUSR": 0.5008, + "MMLU-PRO": 0.5915 + } + }, + { + "model_id": "fblgit/UNA-SimpleSmaug-34b-v1beta", + "name": "UNA-SimpleSmaug-34b-v1beta", + "developer": "fblgit", + "scores": { + "IFEval": 0.4556, + "BBH": 0.5287, + "MATH Level 5": 0.0718, + "GPQA": 0.3171, + "MUSR": 0.4256, + "MMLU-PRO": 0.454 + } + }, + { + "model_id": "fblgit/UNA-TheBeagle-7b-v1", + "name": "UNA-TheBeagle-7b-v1", + "developer": "fblgit", + "scores": { + "IFEval": 0.3689, + "BBH": 0.5029, + "MATH Level 5": 0.077, + "GPQA": 0.2844, + "MUSR": 0.4564, + "MMLU-PRO": 0.3019 + } + }, + { + "model_id": "fblgit/UNA-ThePitbull-21.4B-v2", + "name": "UNA-ThePitbull-21.4B-v2", + "developer": "fblgit", + "scores": { + "IFEval": 0.379, + "BBH": 0.635, + "MATH Level 5": 0.1216, + "GPQA": 0.302, + "MUSR": 0.3922, + "MMLU-PRO": 0.3516 + } + }, + { + "model_id": "fblgit/cybertron-v4-qw7B-MGS", + "name": "cybertron-v4-qw7B-MGS", + "developer": "fblgit", + "scores": { + "IFEval": 0.6264, + "BBH": 0.5592, + "MATH Level 5": 0.3489, + "GPQA": 0.3104, + "MUSR": 0.4371, + "MMLU-PRO": 0.4473 + } + }, + { + "model_id": "fblgit/cybertron-v4-qw7B-UNAMGS", + "name": "cybertron-v4-qw7B-UNAMGS", + "developer": "fblgit", + "scores": { + "IFEval": 0.609, + "BBH": 0.5643, + "MATH Level 5": 0.3731, + "GPQA": 0.3314, + "MUSR": 0.4343, + "MMLU-PRO": 0.45 + } + }, + { + "model_id": "fblgit/juanako-7b-UNA", + "name": "juanako-7b-UNA", + "developer": "fblgit", + "scores": { + "IFEval": 0.4837, + "BBH": 0.507, + "MATH Level 5": 0.034, + "GPQA": 0.2961, + "MUSR": 0.4645, + "MMLU-PRO": 0.2771 + } + }, + { + "model_id": "fblgit/miniclaus-qw1.5B-UNAMGS", + "name": "miniclaus-qw1.5B-UNAMGS", + "developer": "fblgit", + "scores": { + "IFEval": 0.3348, + "BBH": 0.4239, + "MATH Level 5": 0.1088, + "GPQA": 0.2919, + "MUSR": 0.4293, + "MMLU-PRO": 0.2937 + } + }, + { + "model_id": "fblgit/miniclaus-qw1.5B-UNAMGS-GRPO", + "name": "miniclaus-qw1.5B-UNAMGS-GRPO", + "developer": "fblgit", + "scores": { + "IFEval": 0.3518, + "BBH": 0.4234, + "MATH Level 5": 0.1103, + "GPQA": 0.2978, + "MUSR": 0.4254, + "MMLU-PRO": 0.2945 + } + }, + { + "model_id": "fblgit/pancho-v1-qw25-3B-UNAMGS", + "name": "pancho-v1-qw25-3B-UNAMGS", + "developer": "fblgit", + "scores": { + "IFEval": 0.5361, + "BBH": 0.4926, + "MATH Level 5": 0.1571, + "GPQA": 0.297, + "MUSR": 0.4027, + "MMLU-PRO": 0.3766 + } + }, + { + "model_id": "fblgit/una-cybertron-7b-v2-bf16", + "name": "una-cybertron-7b-v2-bf16", + "developer": "fblgit", + "scores": { + "IFEval": 0.4737, + "BBH": 0.3973, + "MATH Level 5": 0.0408, + "GPQA": 0.2978, + "MUSR": 0.4473, + "MMLU-PRO": 0.2443 + } + }, + { + "model_id": "fhai50032/RolePlayLake-7B", + "name": "RolePlayLake-7B", + "developer": "fhai50032", + "scores": { + "IFEval": 0.5057, + "BBH": 0.5252, + "MATH Level 5": 0.0725, + "GPQA": 0.3037, + "MUSR": 0.4459, + "MMLU-PRO": 0.316 + } + }, + { + "model_id": "fhai50032/Unaligned-Thinker-PHI-4", + "name": "Unaligned-Thinker-PHI-4", + "developer": "fhai50032", + "scores": { + "IFEval": 0.0563, + "BBH": 0.6643, + "MATH Level 5": 0.3353, + "GPQA": 0.3809, + "MUSR": 0.4679, + "MMLU-PRO": 0.5147 + } + }, + { + "model_id": "flammenai/Llama3.1-Flammades-70B", + "name": "Llama3.1-Flammades-70B", + "developer": "flammenai", + "scores": { + "IFEval": 0.7058, + "BBH": 0.666, + "MATH Level 5": 0.2092, + "GPQA": 0.354, + "MUSR": 0.4871, + "MMLU-PRO": 0.4752 + } + }, + { + "model_id": "flammenai/Mahou-1.2a-llama3-8B", + "name": "Mahou-1.2a-llama3-8B", + "developer": "flammenai", + "scores": { + "IFEval": 0.5093, + "BBH": 0.5094, + "MATH Level 5": 0.0838, + "GPQA": 0.2886, + "MUSR": 0.3847, + "MMLU-PRO": 0.3817 + } + }, + { + "model_id": "flammenai/Mahou-1.2a-mistral-7B", + "name": "Mahou-1.2a-mistral-7B", + "developer": "flammenai", + "scores": { + "IFEval": 0.4552, + "BBH": 0.5118, + "MATH Level 5": 0.0687, + "GPQA": 0.2718, + "MUSR": 0.3896, + "MMLU-PRO": 0.3163 + } + }, + { + "model_id": "flammenai/Mahou-1.5-llama3.1-70B", + "name": "Mahou-1.5-llama3.1-70B", + "developer": "flammenai", + "scores": { + "IFEval": 0.7147, + "BBH": 0.6651, + "MATH Level 5": 0.21, + "GPQA": 0.354, + "MUSR": 0.495, + "MMLU-PRO": 0.4749 + } + }, + { + "model_id": "flammenai/Mahou-1.5-mistral-nemo-12B", + "name": "Mahou-1.5-mistral-nemo-12B", + "developer": "flammenai", + "scores": { + "IFEval": 0.6751, + "BBH": 0.5522, + "MATH Level 5": 0.0869, + "GPQA": 0.276, + "MUSR": 0.452, + "MMLU-PRO": 0.3602 + } + }, + { + "model_id": "flammenai/flammen15-gutenberg-DPO-v1-7B", + "name": "flammen15-gutenberg-DPO-v1-7B", + "developer": "flammenai", + "scores": { + "IFEval": 0.4798, + "BBH": 0.5203, + "MATH Level 5": 0.0763, + "GPQA": 0.2844, + "MUSR": 0.4293, + "MMLU-PRO": 0.3186 + } + }, + { + "model_id": "fluently-lm/FluentlyLM-Prinum", + "name": "FluentlyLM-Prinum", + "developer": "fluently-lm", + "scores": { + "IFEval": 0.809, + "BBH": 0.7144, + "MATH Level 5": 0.54, + "GPQA": 0.3867, + "MUSR": 0.4471, + "MMLU-PRO": 0.5808 + } + }, + { + "model_id": "fluently-lm/Llama-TI-8B", + "name": "Llama-TI-8B", + "developer": "fluently-lm", + "scores": { + "IFEval": 0.288, + "BBH": 0.5201, + "MATH Level 5": 0.1964, + "GPQA": 0.2961, + "MUSR": 0.4103, + "MMLU-PRO": 0.344 + } + }, + { + "model_id": "fluently-lm/Llama-TI-8B-Instruct", + "name": "Llama-TI-8B-Instruct", + "developer": "fluently-lm", + "scores": { + "IFEval": 0.7716, + "BBH": 0.5252, + "MATH Level 5": 0.2304, + "GPQA": 0.2953, + "MUSR": 0.3813, + "MMLU-PRO": 0.3726 + } + }, + { + "model_id": "fluently-sets/FalconThink3-10B-IT", + "name": "FalconThink3-10B-IT", + "developer": "fluently-sets", + "scores": { + "IFEval": 0.7326, + "BBH": 0.62, + "MATH Level 5": 0.2447, + "GPQA": 0.3347, + "MUSR": 0.4479, + "MMLU-PRO": 0.4435 + } + }, + { + "model_id": "fluently-sets/reasoning-1-1k-demo", + "name": "reasoning-1-1k-demo", + "developer": "fluently-sets", + "scores": { + "IFEval": 0.7525, + "BBH": 0.6397, + "MATH Level 5": 0.4282, + "GPQA": 0.3356, + "MUSR": 0.4061, + "MMLU-PRO": 0.4774 + } + }, + { + "model_id": "formulae/mita-elite-sce-gen1.1-v1-7b-2-26-2025-exp", + "name": "mita-elite-sce-gen1.1-v1-7b-2-26-2025-exp", + "developer": "formulae", + "scores": { + "IFEval": 0.1614, + "BBH": 0.2976, + "MATH Level 5": 0.0015, + "GPQA": 0.2534, + "MUSR": 0.4219, + "MMLU-PRO": 0.1174 + } + }, + { + "model_id": "formulae/mita-elite-v1.1-7b-2-25-2025", + "name": "mita-elite-v1.1-7b-2-25-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.125, + "BBH": 0.2867, + "MATH Level 5": 0.0, + "GPQA": 0.2483, + "MUSR": 0.3487, + "MMLU-PRO": 0.1098 + } + }, + { + "model_id": "formulae/mita-elite-v1.1-gen2-7b-2-25-2025", + "name": "mita-elite-v1.1-gen2-7b-2-25-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.1411, + "BBH": 0.2924, + "MATH Level 5": 0.0, + "GPQA": 0.2525, + "MUSR": 0.3541, + "MMLU-PRO": 0.1101 + } + }, + { + "model_id": "formulae/mita-elite-v1.2-7b-2-26-2025", + "name": "mita-elite-v1.2-7b-2-26-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.148, + "BBH": 0.293, + "MATH Level 5": 0.0023, + "GPQA": 0.2743, + "MUSR": 0.4287, + "MMLU-PRO": 0.1186 + } + }, + { + "model_id": "formulae/mita-gen3-7b-2-26-2025", + "name": "mita-gen3-7b-2-26-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.1964, + "BBH": 0.2916, + "MATH Level 5": 0.0023, + "GPQA": 0.2651, + "MUSR": 0.3912, + "MMLU-PRO": 0.1124 + } + }, + { + "model_id": "formulae/mita-gen3-v1.2-7b-2-26-2025", + "name": "mita-gen3-v1.2-7b-2-26-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.2044, + "BBH": 0.3058, + "MATH Level 5": 0.0023, + "GPQA": 0.2592, + "MUSR": 0.39, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "formulae/mita-math-v2.3-2-25-2025", + "name": "mita-math-v2.3-2-25-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.1373, + "BBH": 0.2949, + "MATH Level 5": 0.0, + "GPQA": 0.2508, + "MUSR": 0.3698, + "MMLU-PRO": 0.1118 + } + }, + { + "model_id": "formulae/mita-v1-7b", + "name": "mita-v1-7b", + "developer": "formulae", + "scores": { + "IFEval": 0.1972, + "BBH": 0.3003, + "MATH Level 5": 0.0023, + "GPQA": 0.25, + "MUSR": 0.4152, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "formulae/mita-v1.1-7b-2-24-2025", + "name": "mita-v1.1-7b-2-24-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.3412, + "BBH": 0.5442, + "MATH Level 5": 0.435, + "GPQA": 0.3146, + "MUSR": 0.4557, + "MMLU-PRO": 0.4524 + } + }, + { + "model_id": "formulae/mita-v1.2-7b-2-24-2025", + "name": "mita-v1.2-7b-2-24-2025", + "developer": "formulae", + "scores": { + "IFEval": 0.2564, + "BBH": 0.4919, + "MATH Level 5": 0.4879, + "GPQA": 0.3062, + "MUSR": 0.4344, + "MMLU-PRO": 0.3359 + } + }, + { + "model_id": "frameai/Loxa-4B", + "name": "Loxa-4B", + "developer": "frameai", + "scores": { + "IFEval": 0.4765, + "BBH": 0.4217, + "MATH Level 5": 0.1095, + "GPQA": 0.2836, + "MUSR": 0.3377, + "MMLU-PRO": 0.2802 + } + }, + { + "model_id": "freewheelin/free-evo-qwen72b-v0.8-re", + "name": "free-evo-qwen72b-v0.8-re", + "developer": "freewheelin", + "scores": { + "IFEval": 0.5331, + "BBH": 0.6127, + "MATH Level 5": 0.1805, + "GPQA": 0.3565, + "MUSR": 0.4872, + "MMLU-PRO": 0.487 + } + }, + { + "model_id": "freewheelin/free-solar-evo-v0.1", + "name": "free-solar-evo-v0.1", + "developer": "freewheelin", + "scores": { + "IFEval": 0.205, + "BBH": 0.4502, + "MATH Level 5": 0.0083, + "GPQA": 0.2911, + "MUSR": 0.4946, + "MMLU-PRO": 0.3414 + } + }, + { + "model_id": "freewheelin/free-solar-evo-v0.11", + "name": "free-solar-evo-v0.11", + "developer": "freewheelin", + "scores": { + "IFEval": 0.2027, + "BBH": 0.4545, + "MATH Level 5": 0.0083, + "GPQA": 0.2852, + "MUSR": 0.5052, + "MMLU-PRO": 0.3467 + } + }, + { + "model_id": "freewheelin/free-solar-evo-v0.13", + "name": "free-solar-evo-v0.13", + "developer": "freewheelin", + "scores": { + "IFEval": 0.2321, + "BBH": 0.4555, + "MATH Level 5": 0.0121, + "GPQA": 0.2886, + "MUSR": 0.5052, + "MMLU-PRO": 0.347 + } + }, + { + "model_id": "fulim/FineLlama-3.1-8B", + "name": "FineLlama-3.1-8B", + "developer": "fulim", + "scores": { + "IFEval": 0.1439, + "BBH": 0.4569, + "MATH Level 5": 0.0476, + "GPQA": 0.2928, + "MUSR": 0.3867, + "MMLU-PRO": 0.3167 + } + }, + { + "model_id": "gabrielmbmb/SmolLM-1.7B-Instruct-IFEval", + "name": "SmolLM-1.7B-Instruct-IFEval", + "developer": "gabrielmbmb", + "scores": { + "IFEval": 0.2306, + "BBH": 0.3138, + "MATH Level 5": 0.0106, + "GPQA": 0.2534, + "MUSR": 0.3328, + "MMLU-PRO": 0.1156 + } + }, + { + "model_id": "gaverfraxz/Meta-Llama-3.1-8B-Instruct-HalfAbliterated-DELLA", + "name": "Meta-Llama-3.1-8B-Instruct-HalfAbliterated-DELLA", + "developer": "gaverfraxz", + "scores": { + "IFEval": 0.4009, + "BBH": 0.3985, + "MATH Level 5": 0.0196, + "GPQA": 0.2844, + "MUSR": 0.365, + "MMLU-PRO": 0.1654 + } + }, + { + "model_id": "gaverfraxz/Meta-Llama-3.1-8B-Instruct-HalfAbliterated-TIES", + "name": "Meta-Llama-3.1-8B-Instruct-HalfAbliterated-TIES", + "developer": "gaverfraxz", + "scores": { + "IFEval": 0.4551, + "BBH": 0.5044, + "MATH Level 5": 0.1299, + "GPQA": 0.2668, + "MUSR": 0.3738, + "MMLU-PRO": 0.3679 + } + }, + { + "model_id": "gbueno86/Brinebreath-Llama-3.1-70B", + "name": "Brinebreath-Llama-3.1-70B", + "developer": "gbueno86", + "scores": { + "IFEval": 0.5533, + "BBH": 0.6881, + "MATH Level 5": 0.2976, + "GPQA": 0.3465, + "MUSR": 0.4541, + "MMLU-PRO": 0.5196 + } + }, + { + "model_id": "gbueno86/Meta-LLama-3-Cat-Smaug-LLama-70b", + "name": "Meta-LLama-3-Cat-Smaug-LLama-70b", + "developer": "gbueno86", + "scores": { + "IFEval": 0.8072, + "BBH": 0.6674, + "MATH Level 5": 0.2938, + "GPQA": 0.3272, + "MUSR": 0.4368, + "MMLU-PRO": 0.5075 + } + }, + { + "model_id": "ghost-x/ghost-8b-beta-1608", + "name": "ghost-8b-beta-1608", + "developer": "ghost-x", + "scores": { + "IFEval": 0.4273, + "BBH": 0.4517, + "MATH Level 5": 0.0695, + "GPQA": 0.2584, + "MUSR": 0.3516, + "MMLU-PRO": 0.284 + } + }, + { + "model_id": "glaiveai/Reflection-Llama-3.1-70B", + "name": "Reflection-Llama-3.1-70B", + "developer": "glaiveai", + "scores": { + "IFEval": 0.5991, + "BBH": 0.5681, + "MATH Level 5": 0.2757, + "GPQA": 0.3146, + "MUSR": 0.438, + "MMLU-PRO": 0.6341 + } + }, + { + "model_id": "gmonsoon/SahabatAI-Llama-11B-Test", + "name": "SahabatAI-Llama-11B-Test", + "developer": "gmonsoon", + "scores": { + "IFEval": 0.3376, + "BBH": 0.4728, + "MATH Level 5": 0.031, + "GPQA": 0.2819, + "MUSR": 0.4001, + "MMLU-PRO": 0.3182 + } + }, + { + "model_id": "gmonsoon/SahabatAI-MediChatIndo-8B-v1", + "name": "SahabatAI-MediChatIndo-8B-v1", + "developer": "gmonsoon", + "scores": { + "IFEval": 0.4163, + "BBH": 0.4509, + "MATH Level 5": 0.0619, + "GPQA": 0.2827, + "MUSR": 0.3754, + "MMLU-PRO": 0.3108 + } + }, + { + "model_id": "gmonsoon/SahabatAI-Rebase-8B-Test", + "name": "SahabatAI-Rebase-8B-Test", + "developer": "gmonsoon", + "scores": { + "IFEval": 0.5156, + "BBH": 0.523, + "MATH Level 5": 0.1148, + "GPQA": 0.2878, + "MUSR": 0.4133, + "MMLU-PRO": 0.3664 + } + }, + { + "model_id": "gmonsoon/StockSeaLLMs-7B-v1", + "name": "StockSeaLLMs-7B-v1", + "developer": "gmonsoon", + "scores": { + "IFEval": 0.4599, + "BBH": 0.5271, + "MATH Level 5": 0.1964, + "GPQA": 0.3029, + "MUSR": 0.4214, + "MMLU-PRO": 0.3952 + } + }, + { + "model_id": "gmonsoon/gemma2-9b-sahabatai-v1-instruct-BaseTIES", + "name": "gemma2-9b-sahabatai-v1-instruct-BaseTIES", + "developer": "gmonsoon", + "scores": { + "IFEval": 0.7378, + "BBH": 0.6077, + "MATH Level 5": 0.1994, + "GPQA": 0.3205, + "MUSR": 0.4778, + "MMLU-PRO": 0.4347 + } + }, + { + "model_id": "godlikehhd/alpaca_data_full_2", + "name": "alpaca_data_full_2", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3178, + "BBH": 0.4217, + "MATH Level 5": 0.0929, + "GPQA": 0.2978, + "MUSR": 0.4052, + "MMLU-PRO": 0.2854 + } + }, + { + "model_id": "godlikehhd/alpaca_data_full_3B", + "name": "alpaca_data_full_3B", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3696, + "BBH": 0.4684, + "MATH Level 5": 0.1337, + "GPQA": 0.2777, + "MUSR": 0.4955, + "MMLU-PRO": 0.3357 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ifd_max_2600", + "name": "alpaca_data_ifd_max_2600", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3043, + "BBH": 0.4029, + "MATH Level 5": 0.0989, + "GPQA": 0.3029, + "MUSR": 0.3509, + "MMLU-PRO": 0.2916 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ifd_max_2600_3B", + "name": "alpaca_data_ifd_max_2600_3B", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.2982, + "BBH": 0.4626, + "MATH Level 5": 0.1594, + "GPQA": 0.2727, + "MUSR": 0.4346, + "MMLU-PRO": 0.3288 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ifd_me_max_5200", + "name": "alpaca_data_ifd_me_max_5200", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3683, + "BBH": 0.4153, + "MATH Level 5": 0.0974, + "GPQA": 0.2911, + "MUSR": 0.3483, + "MMLU-PRO": 0.2982 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ifd_min_2600", + "name": "alpaca_data_ifd_min_2600", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.375, + "BBH": 0.4219, + "MATH Level 5": 0.0967, + "GPQA": 0.2919, + "MUSR": 0.3656, + "MMLU-PRO": 0.2893 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ins_ans_max_5200", + "name": "alpaca_data_ins_ans_max_5200", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3479, + "BBH": 0.4098, + "MATH Level 5": 0.1027, + "GPQA": 0.2911, + "MUSR": 0.3602, + "MMLU-PRO": 0.2901 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ins_max_5200", + "name": "alpaca_data_ins_max_5200", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3275, + "BBH": 0.4155, + "MATH Level 5": 0.0997, + "GPQA": 0.2961, + "MUSR": 0.3614, + "MMLU-PRO": 0.2916 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ins_min_2600", + "name": "alpaca_data_ins_min_2600", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.333, + "BBH": 0.4187, + "MATH Level 5": 0.111, + "GPQA": 0.2978, + "MUSR": 0.3853, + "MMLU-PRO": 0.288 + } + }, + { + "model_id": "godlikehhd/alpaca_data_ins_min_5200", + "name": "alpaca_data_ins_min_5200", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.336, + "BBH": 0.4289, + "MATH Level 5": 0.1035, + "GPQA": 0.2869, + "MUSR": 0.3906, + "MMLU-PRO": 0.2949 + } + }, + { + "model_id": "godlikehhd/alpaca_data_sampled_ifd_5200", + "name": "alpaca_data_sampled_ifd_5200", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.2924, + "BBH": 0.4033, + "MATH Level 5": 0.1254, + "GPQA": 0.3087, + "MUSR": 0.3521, + "MMLU-PRO": 0.2896 + } + }, + { + "model_id": "godlikehhd/alpaca_data_sampled_ifd_new_5200", + "name": "alpaca_data_sampled_ifd_new_5200", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3663, + "BBH": 0.4178, + "MATH Level 5": 0.0944, + "GPQA": 0.2936, + "MUSR": 0.3613, + "MMLU-PRO": 0.2925 + } + }, + { + "model_id": "godlikehhd/alpaca_data_score_max_0.1_2600", + "name": "alpaca_data_score_max_0.1_2600", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3288, + "BBH": 0.4252, + "MATH Level 5": 0.0989, + "GPQA": 0.2911, + "MUSR": 0.3706, + "MMLU-PRO": 0.2923 + } + }, + { + "model_id": "godlikehhd/alpaca_data_score_max_0.3_2600", + "name": "alpaca_data_score_max_0.3_2600", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3375, + "BBH": 0.4151, + "MATH Level 5": 0.1035, + "GPQA": 0.2894, + "MUSR": 0.3759, + "MMLU-PRO": 0.2913 + } + }, + { + "model_id": "godlikehhd/alpaca_data_score_max_0.7_2600", + "name": "alpaca_data_score_max_0.7_2600", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.364, + "BBH": 0.4185, + "MATH Level 5": 0.1073, + "GPQA": 0.3037, + "MUSR": 0.3469, + "MMLU-PRO": 0.2983 + } + }, + { + "model_id": "godlikehhd/alpaca_data_score_max_2500", + "name": "alpaca_data_score_max_2500", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3564, + "BBH": 0.418, + "MATH Level 5": 0.0952, + "GPQA": 0.2953, + "MUSR": 0.3627, + "MMLU-PRO": 0.294 + } + }, + { + "model_id": "godlikehhd/alpaca_data_score_max_2600_3B", + "name": "alpaca_data_score_max_2600_3B", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3358, + "BBH": 0.4716, + "MATH Level 5": 0.1548, + "GPQA": 0.2651, + "MUSR": 0.4474, + "MMLU-PRO": 0.3342 + } + }, + { + "model_id": "godlikehhd/alpaca_data_score_max_5200", + "name": "alpaca_data_score_max_5200", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3445, + "BBH": 0.4242, + "MATH Level 5": 0.0974, + "GPQA": 0.2978, + "MUSR": 0.3878, + "MMLU-PRO": 0.2945 + } + }, + { + "model_id": "godlikehhd/ifd_2500_qwen", + "name": "ifd_2500_qwen", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3365, + "BBH": 0.4298, + "MATH Level 5": 0.0982, + "GPQA": 0.2953, + "MUSR": 0.3615, + "MMLU-PRO": 0.2921 + } + }, + { + "model_id": "godlikehhd/ifd_new_correct_all_sample_2500_qwen", + "name": "ifd_new_correct_all_sample_2500_qwen", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3376, + "BBH": 0.402, + "MATH Level 5": 0.0959, + "GPQA": 0.2903, + "MUSR": 0.3562, + "MMLU-PRO": 0.2889 + } + }, + { + "model_id": "godlikehhd/ifd_new_correct_sample_2500_qwen", + "name": "ifd_new_correct_sample_2500_qwen", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3397, + "BBH": 0.411, + "MATH Level 5": 0.1042, + "GPQA": 0.3079, + "MUSR": 0.3627, + "MMLU-PRO": 0.2932 + } + }, + { + "model_id": "godlikehhd/ifd_new_qwen_2500", + "name": "ifd_new_qwen_2500", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.324, + "BBH": 0.416, + "MATH Level 5": 0.1118, + "GPQA": 0.3003, + "MUSR": 0.359, + "MMLU-PRO": 0.2911 + } + }, + { + "model_id": "godlikehhd/qwen-2.5-1.5b-cherry", + "name": "qwen-2.5-1.5b-cherry", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.2893, + "BBH": 0.4036, + "MATH Level 5": 0.102, + "GPQA": 0.3003, + "MUSR": 0.3456, + "MMLU-PRO": 0.2923 + } + }, + { + "model_id": "godlikehhd/qwen_2.5-1.5b-cherry_new", + "name": "qwen_2.5-1.5b-cherry_new", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.312, + "BBH": 0.415, + "MATH Level 5": 0.0967, + "GPQA": 0.2978, + "MUSR": 0.3496, + "MMLU-PRO": 0.2894 + } + }, + { + "model_id": "godlikehhd/qwen_full_data_alpaca", + "name": "qwen_full_data_alpaca", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.3136, + "BBH": 0.4229, + "MATH Level 5": 0.0921, + "GPQA": 0.2928, + "MUSR": 0.4052, + "MMLU-PRO": 0.2851 + } + }, + { + "model_id": "godlikehhd/qwen_ins_ans_2500", + "name": "qwen_ins_ans_2500", + "developer": "godlikehhd", + "scores": { + "IFEval": 0.2698, + "BBH": 0.4074, + "MATH Level 5": 0.114, + "GPQA": 0.2919, + "MUSR": 0.3589, + "MMLU-PRO": 0.2809 + } + }, + { + "model_id": "google/codegemma-1.1-2b", + "name": "codegemma-1.1-2b", + "developer": "google", + "scores": { + "IFEval": 0.2294, + "BBH": 0.3353, + "MATH Level 5": 0.0128, + "GPQA": 0.2651, + "MUSR": 0.3871, + "MMLU-PRO": 0.1278 + } + }, + { + "model_id": "google/flan-t5-base", + "name": "flan-t5-base", + "developer": "google", + "scores": { + "IFEval": 0.1891, + "BBH": 0.3526, + "MATH Level 5": 0.0106, + "GPQA": 0.2383, + "MUSR": 0.3671, + "MMLU-PRO": 0.1357 + } + }, + { + "model_id": "google/flan-t5-large", + "name": "flan-t5-large", + "developer": "google", + "scores": { + "IFEval": 0.2201, + "BBH": 0.4153, + "MATH Level 5": 0.0144, + "GPQA": 0.2508, + "MUSR": 0.4083, + "MMLU-PRO": 0.1709 + } + }, + { + "model_id": "google/flan-t5-small", + "name": "flan-t5-small", + "developer": "google", + "scores": { + "IFEval": 0.1524, + "BBH": 0.3283, + "MATH Level 5": 0.0076, + "GPQA": 0.2609, + "MUSR": 0.4123, + "MMLU-PRO": 0.1233 + } + }, + { + "model_id": "google/flan-t5-xl", + "name": "flan-t5-xl", + "developer": "google", + "scores": { + "IFEval": 0.2237, + "BBH": 0.4531, + "MATH Level 5": 0.0076, + "GPQA": 0.2525, + "MUSR": 0.4181, + "MMLU-PRO": 0.2147 + } + }, + { + "model_id": "google/flan-t5-xxl", + "name": "flan-t5-xxl", + "developer": "google", + "scores": { + "IFEval": 0.22, + "BBH": 0.5066, + "MATH Level 5": 0.0106, + "GPQA": 0.2701, + "MUSR": 0.4218, + "MMLU-PRO": 0.2343 + } + }, + { + "model_id": "google/flan-ul2", + "name": "flan-ul2", + "developer": "google", + "scores": { + "IFEval": 0.2393, + "BBH": 0.5054, + "MATH Level 5": 0.0091, + "GPQA": 0.2878, + "MUSR": 0.3844, + "MMLU-PRO": 0.2493 + } + }, + { + "model_id": "google/gemma-1.1-2b-it", + "name": "gemma-1.1-2b-it", + "developer": "google", + "scores": { + "IFEval": 0.3067, + "BBH": 0.3185, + "MATH Level 5": 0.0181, + "GPQA": 0.2693, + "MUSR": 0.3394, + "MMLU-PRO": 0.1484 + } + }, + { + "model_id": "google/gemma-1.1-7b-it", + "name": "gemma-1.1-7b-it", + "developer": "google", + "scores": { + "IFEval": 0.5039, + "BBH": 0.3935, + "MATH Level 5": 0.0491, + "GPQA": 0.2936, + "MUSR": 0.423, + "MMLU-PRO": 0.2584 + } + }, + { + "model_id": "google/gemma-2-27b", + "name": "Gemma 2 27B", + "developer": "google", + "scores": { + "IFEval": 0.2475, + "BBH": 0.5643, + "MATH Level 5": 0.1662, + "GPQA": 0.3507, + "MUSR": 0.4396, + "MMLU-PRO": 0.4371 + } + }, + { + "model_id": "google/gemma-2-27b-it", + "name": "Gemma 2 Instruct 27B", + "developer": "google", + "scores": { + "IFEval": 0.7978, + "BBH": 0.6451, + "MATH Level 5": 0.2387, + "GPQA": 0.375, + "MUSR": 0.4033, + "MMLU-PRO": 0.4451 + } + }, + { + "model_id": "google/gemma-2-2b", + "name": "gemma-2-2b", + "developer": "google", + "scores": { + "IFEval": 0.2018, + "BBH": 0.3709, + "MATH Level 5": 0.0302, + "GPQA": 0.2626, + "MUSR": 0.4219, + "MMLU-PRO": 0.2217 + } + }, + { + "model_id": "google/gemma-2-2b-it", + "name": "gemma-2-2b-it", + "developer": "google", + "scores": { + "IFEval": 0.5668, + "BBH": 0.4199, + "MATH Level 5": 0.0008, + "GPQA": 0.2743, + "MUSR": 0.3929, + "MMLU-PRO": 0.255 + } + }, + { + "model_id": "google/gemma-2-2b-jpn-it", + "name": "gemma-2-2b-jpn-it", + "developer": "google", + "scores": { + "IFEval": 0.5078, + "BBH": 0.4226, + "MATH Level 5": 0.0347, + "GPQA": 0.2852, + "MUSR": 0.3964, + "MMLU-PRO": 0.2578 + } + }, + { + "model_id": "google/gemma-2-9b", + "name": "Gemma 2 9B", + "developer": "google", + "scores": { + "IFEval": 0.204, + "BBH": 0.5377, + "MATH Level 5": 0.1344, + "GPQA": 0.3289, + "MUSR": 0.4461, + "MMLU-PRO": 0.4103 + } + }, + { + "model_id": "google/gemma-2-9b-it", + "name": "Gemma 2 Instruct 9B", + "developer": "google", + "scores": { + "IFEval": 0.7436, + "BBH": 0.599, + "MATH Level 5": 0.1949, + "GPQA": 0.3607, + "MUSR": 0.4073, + "MMLU-PRO": 0.3875 + } + }, + { + "model_id": "google/gemma-2b", + "name": "gemma-2b", + "developer": "google", + "scores": { + "IFEval": 0.2038, + "BBH": 0.3366, + "MATH Level 5": 0.0302, + "GPQA": 0.255, + "MUSR": 0.3978, + "MMLU-PRO": 0.1366 + } + }, + { + "model_id": "google/gemma-2b-it", + "name": "gemma-2b-it", + "developer": "google", + "scores": { + "IFEval": 0.269, + "BBH": 0.3151, + "MATH Level 5": 0.0204, + "GPQA": 0.2785, + "MUSR": 0.3341, + "MMLU-PRO": 0.1353 + } + }, + { + "model_id": "google/gemma-7b", + "name": "Gemma 7B", + "developer": "google", + "scores": { + "IFEval": 0.2659, + "BBH": 0.4362, + "MATH Level 5": 0.074, + "GPQA": 0.2869, + "MUSR": 0.4062, + "MMLU-PRO": 0.2948 + } + }, + { + "model_id": "google/gemma-7b-it", + "name": "gemma-7b-it", + "developer": "google", + "scores": { + "IFEval": 0.3868, + "BBH": 0.3646, + "MATH Level 5": 0.0295, + "GPQA": 0.2844, + "MUSR": 0.4274, + "MMLU-PRO": 0.1695 + } + }, + { + "model_id": "google/mt5-base", + "name": "mt5-base", + "developer": "google", + "scores": { + "IFEval": 0.1645, + "BBH": 0.2883, + "MATH Level 5": 0.0091, + "GPQA": 0.2391, + "MUSR": 0.3672, + "MMLU-PRO": 0.107 + } + }, + { + "model_id": "google/mt5-small", + "name": "mt5-small", + "developer": "google", + "scores": { + "IFEval": 0.1718, + "BBH": 0.2766, + "MATH Level 5": 0.0, + "GPQA": 0.2424, + "MUSR": 0.3857, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "google/mt5-xl", + "name": "mt5-xl", + "developer": "google", + "scores": { + "IFEval": 0.196, + "BBH": 0.3047, + "MATH Level 5": 0.0, + "GPQA": 0.2643, + "MUSR": 0.3795, + "MMLU-PRO": 0.112 + } + }, + { + "model_id": "google/mt5-xxl", + "name": "mt5-xxl", + "developer": "google", + "scores": { + "IFEval": 0.2358, + "BBH": 0.2959, + "MATH Level 5": 0.0, + "GPQA": 0.2416, + "MUSR": 0.3689, + "MMLU-PRO": 0.1089 + } + }, + { + "model_id": "google/recurrentgemma-2b", + "name": "recurrentgemma-2b", + "developer": "google", + "scores": { + "IFEval": 0.3017, + "BBH": 0.3197, + "MATH Level 5": 0.0204, + "GPQA": 0.2458, + "MUSR": 0.3446, + "MMLU-PRO": 0.1176 + } + }, + { + "model_id": "google/recurrentgemma-2b-it", + "name": "recurrentgemma-2b-it", + "developer": "google", + "scores": { + "IFEval": 0.2949, + "BBH": 0.333, + "MATH Level 5": 0.0196, + "GPQA": 0.2534, + "MUSR": 0.3341, + "MMLU-PRO": 0.1402 + } + }, + { + "model_id": "google/recurrentgemma-9b", + "name": "recurrentgemma-9b", + "developer": "google", + "scores": { + "IFEval": 0.3116, + "BBH": 0.3956, + "MATH Level 5": 0.0665, + "GPQA": 0.2852, + "MUSR": 0.3803, + "MMLU-PRO": 0.2605 + } + }, + { + "model_id": "google/recurrentgemma-9b-it", + "name": "recurrentgemma-9b-it", + "developer": "google", + "scores": { + "IFEval": 0.501, + "BBH": 0.4367, + "MATH Level 5": 0.0665, + "GPQA": 0.2701, + "MUSR": 0.4379, + "MMLU-PRO": 0.2843 + } + }, + { + "model_id": "google/switch-base-8", + "name": "switch-base-8", + "developer": "google", + "scores": { + "IFEval": 0.1585, + "BBH": 0.2876, + "MATH Level 5": 0.0, + "GPQA": 0.25, + "MUSR": 0.3517, + "MMLU-PRO": 0.1098 + } + }, + { + "model_id": "google/umt5-base", + "name": "umt5-base", + "developer": "google", + "scores": { + "IFEval": 0.1746, + "BBH": 0.2788, + "MATH Level 5": 0.0045, + "GPQA": 0.2542, + "MUSR": 0.3382, + "MMLU-PRO": 0.1078 + } + }, + { + "model_id": "goulue5/merging_LLM", + "name": "merging_LLM", + "developer": "goulue5", + "scores": { + "IFEval": 0.3233, + "BBH": 0.4216, + "MATH Level 5": 0.0967, + "GPQA": 0.2911, + "MUSR": 0.4333, + "MMLU-PRO": 0.2958 + } + }, + { + "model_id": "gradientai/Llama-3-8B-Instruct-Gradient-1048k", + "name": "Llama-3-8B-Instruct-Gradient-1048k", + "developer": "gradientai", + "scores": { + "IFEval": 0.4456, + "BBH": 0.4346, + "MATH Level 5": 0.0536, + "GPQA": 0.2777, + "MUSR": 0.4298, + "MMLU-PRO": 0.294 + } + }, + { + "model_id": "grimjim/DeepSauerHuatuoSkywork-R1-o1-Llama-3.1-8B", + "name": "DeepSauerHuatuoSkywork-R1-o1-Llama-3.1-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.4797, + "BBH": 0.5269, + "MATH Level 5": 0.2221, + "GPQA": 0.3381, + "MUSR": 0.4408, + "MMLU-PRO": 0.3957 + } + }, + { + "model_id": "grimjim/Gigantes-v1-gemma2-9b-it", + "name": "Gigantes-v1-gemma2-9b-it", + "developer": "grimjim", + "scores": { + "IFEval": 0.6925, + "BBH": 0.5978, + "MATH Level 5": 0.2145, + "GPQA": 0.3532, + "MUSR": 0.4555, + "MMLU-PRO": 0.4225 + } + }, + { + "model_id": "grimjim/Gigantes-v2-gemma2-9b-it", + "name": "Gigantes-v2-gemma2-9b-it", + "developer": "grimjim", + "scores": { + "IFEval": 0.7351, + "BBH": 0.5987, + "MATH Level 5": 0.2017, + "GPQA": 0.3515, + "MUSR": 0.4595, + "MMLU-PRO": 0.4259 + } + }, + { + "model_id": "grimjim/Gigantes-v3-gemma2-9b-it", + "name": "Gigantes-v3-gemma2-9b-it", + "developer": "grimjim", + "scores": { + "IFEval": 0.6976, + "BBH": 0.5984, + "MATH Level 5": 0.21, + "GPQA": 0.3565, + "MUSR": 0.4608, + "MMLU-PRO": 0.4226 + } + }, + { + "model_id": "grimjim/HuatuoSkywork-o1-Llama-3.1-8B", + "name": "HuatuoSkywork-o1-Llama-3.1-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.3961, + "BBH": 0.4886, + "MATH Level 5": 0.3882, + "GPQA": 0.2928, + "MUSR": 0.3839, + "MMLU-PRO": 0.3095 + } + }, + { + "model_id": "grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge", + "name": "Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge", + "developer": "grimjim", + "scores": { + "IFEval": 0.4271, + "BBH": 0.4962, + "MATH Level 5": 0.0997, + "GPQA": 0.2903, + "MUSR": 0.4043, + "MMLU-PRO": 0.3625 + } + }, + { + "model_id": "grimjim/Llama-3-Instruct-8B-SimPO-SPPO-Iter3-merge", + "name": "Llama-3-Instruct-8B-SimPO-SPPO-Iter3-merge", + "developer": "grimjim", + "scores": { + "IFEval": 0.6806, + "BBH": 0.5022, + "MATH Level 5": 0.0891, + "GPQA": 0.2626, + "MUSR": 0.3885, + "MMLU-PRO": 0.3684 + } + }, + { + "model_id": "grimjim/Llama-3.1-8B-Instruct-abliterated_via_adapter", + "name": "Llama-3.1-8B-Instruct-abliterated_via_adapter", + "developer": "grimjim", + "scores": { + "IFEval": 0.487, + "BBH": 0.5105, + "MATH Level 5": 0.1397, + "GPQA": 0.3138, + "MUSR": 0.401, + "MMLU-PRO": 0.3651 + } + }, + { + "model_id": "grimjim/Llama-3.1-Bonsaikraft-8B-Instruct", + "name": "Llama-3.1-Bonsaikraft-8B-Instruct", + "developer": "grimjim", + "scores": { + "IFEval": 0.425, + "BBH": 0.5287, + "MATH Level 5": 0.1314, + "GPQA": 0.3037, + "MUSR": 0.4235, + "MMLU-PRO": 0.3764 + } + }, + { + "model_id": "grimjim/Llama-Nephilim-Metamorphosis-v2-8B", + "name": "Llama-Nephilim-Metamorphosis-v2-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.4545, + "BBH": 0.5013, + "MATH Level 5": 0.1397, + "GPQA": 0.323, + "MUSR": 0.4091, + "MMLU-PRO": 0.3809 + } + }, + { + "model_id": "grimjim/Llama3.1-SuperNovaLite-HuatuoSkywork-o1-8B", + "name": "Llama3.1-SuperNovaLite-HuatuoSkywork-o1-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.4366, + "BBH": 0.5287, + "MATH Level 5": 0.3006, + "GPQA": 0.3112, + "MUSR": 0.3999, + "MMLU-PRO": 0.3684 + } + }, + { + "model_id": "grimjim/Magnolia-v1-Gemma2-8k-9B", + "name": "Magnolia-v1-Gemma2-8k-9B", + "developer": "grimjim", + "scores": { + "IFEval": 0.3531, + "BBH": 0.5589, + "MATH Level 5": 0.1684, + "GPQA": 0.3364, + "MUSR": 0.4645, + "MMLU-PRO": 0.4242 + } + }, + { + "model_id": "grimjim/Magnolia-v2-12B", + "name": "Magnolia-v2-12B", + "developer": "grimjim", + "scores": { + "IFEval": 0.3506, + "BBH": 0.529, + "MATH Level 5": 0.1292, + "GPQA": 0.3188, + "MUSR": 0.4171, + "MMLU-PRO": 0.3601 + } + }, + { + "model_id": "grimjim/Magnolia-v2-Gemma2-8k-9B", + "name": "Magnolia-v2-Gemma2-8k-9B", + "developer": "grimjim", + "scores": { + "IFEval": 0.7384, + "BBH": 0.6016, + "MATH Level 5": 0.2281, + "GPQA": 0.3574, + "MUSR": 0.4488, + "MMLU-PRO": 0.4332 + } + }, + { + "model_id": "grimjim/Magnolia-v3-12B", + "name": "Magnolia-v3-12B", + "developer": "grimjim", + "scores": { + "IFEval": 0.3965, + "BBH": 0.5327, + "MATH Level 5": 0.1352, + "GPQA": 0.3255, + "MUSR": 0.4184, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "grimjim/Magnolia-v3-Gemma2-8k-9B", + "name": "Magnolia-v3-Gemma2-8k-9B", + "developer": "grimjim", + "scores": { + "IFEval": 0.7378, + "BBH": 0.6015, + "MATH Level 5": 0.2319, + "GPQA": 0.3565, + "MUSR": 0.4488, + "MMLU-PRO": 0.4337 + } + }, + { + "model_id": "grimjim/Magnolia-v4-12B", + "name": "Magnolia-v4-12B", + "developer": "grimjim", + "scores": { + "IFEval": 0.3418, + "BBH": 0.5431, + "MATH Level 5": 0.1314, + "GPQA": 0.328, + "MUSR": 0.4211, + "MMLU-PRO": 0.3672 + } + }, + { + "model_id": "grimjim/Magnolia-v5a-12B", + "name": "Magnolia-v5a-12B", + "developer": "grimjim", + "scores": { + "IFEval": 0.4114, + "BBH": 0.5312, + "MATH Level 5": 0.1375, + "GPQA": 0.3221, + "MUSR": 0.4145, + "MMLU-PRO": 0.3601 + } + }, + { + "model_id": "grimjim/Magot-v1-Gemma2-8k-9B", + "name": "Magot-v1-Gemma2-8k-9B", + "developer": "grimjim", + "scores": { + "IFEval": 0.2997, + "BBH": 0.6019, + "MATH Level 5": 0.0989, + "GPQA": 0.3465, + "MUSR": 0.4488, + "MMLU-PRO": 0.4337 + } + }, + { + "model_id": "grimjim/Magot-v2-Gemma2-8k-9B", + "name": "Magot-v2-Gemma2-8k-9B", + "developer": "grimjim", + "scores": { + "IFEval": 0.7347, + "BBH": 0.5897, + "MATH Level 5": 0.2017, + "GPQA": 0.354, + "MUSR": 0.4344, + "MMLU-PRO": 0.4223 + } + }, + { + "model_id": "grimjim/SauerHuatuoSkywork-o1-Llama-3.1-8B", + "name": "SauerHuatuoSkywork-o1-Llama-3.1-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.5219, + "BBH": 0.5222, + "MATH Level 5": 0.173, + "GPQA": 0.3213, + "MUSR": 0.4527, + "MMLU-PRO": 0.3991 + } + }, + { + "model_id": "grimjim/llama-3-Nephilim-v1-8B", + "name": "llama-3-Nephilim-v1-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.4277, + "BBH": 0.5132, + "MATH Level 5": 0.0906, + "GPQA": 0.302, + "MUSR": 0.4136, + "MMLU-PRO": 0.3796 + } + }, + { + "model_id": "grimjim/llama-3-Nephilim-v2-8B", + "name": "llama-3-Nephilim-v2-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.3922, + "BBH": 0.5048, + "MATH Level 5": 0.1065, + "GPQA": 0.2995, + "MUSR": 0.3895, + "MMLU-PRO": 0.3641 + } + }, + { + "model_id": "grimjim/llama-3-Nephilim-v2.1-8B", + "name": "llama-3-Nephilim-v2.1-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.3895, + "BBH": 0.5095, + "MATH Level 5": 0.0997, + "GPQA": 0.2995, + "MUSR": 0.3935, + "MMLU-PRO": 0.3644 + } + }, + { + "model_id": "grimjim/llama-3-Nephilim-v3-8B", + "name": "llama-3-Nephilim-v3-8B", + "developer": "grimjim", + "scores": { + "IFEval": 0.4174, + "BBH": 0.5013, + "MATH Level 5": 0.0952, + "GPQA": 0.2953, + "MUSR": 0.3989, + "MMLU-PRO": 0.3612 + } + }, + { + "model_id": "gupta-tanish/llama-7b-dpo-baseline", + "name": "llama-7b-dpo-baseline", + "developer": "gupta-tanish", + "scores": { + "IFEval": 0.2693, + "BBH": 0.3897, + "MATH Level 5": 0.0196, + "GPQA": 0.2626, + "MUSR": 0.4456, + "MMLU-PRO": 0.2028 + } + }, + { + "model_id": "gz987/qwen2.5-7b-cabs-v0.1", + "name": "qwen2.5-7b-cabs-v0.1", + "developer": "gz987", + "scores": { + "IFEval": 0.7506, + "BBH": 0.5482, + "MATH Level 5": 0.4796, + "GPQA": 0.3138, + "MUSR": 0.4376, + "MMLU-PRO": 0.4406 + } + }, + { + "model_id": "gz987/qwen2.5-7b-cabs-v0.2", + "name": "qwen2.5-7b-cabs-v0.2", + "developer": "gz987", + "scores": { + "IFEval": 0.7418, + "BBH": 0.5516, + "MATH Level 5": 0.4902, + "GPQA": 0.307, + "MUSR": 0.4429, + "MMLU-PRO": 0.4397 + } + }, + { + "model_id": "gz987/qwen2.5-7b-cabs-v0.3", + "name": "qwen2.5-7b-cabs-v0.3", + "developer": "gz987", + "scores": { + "IFEval": 0.757, + "BBH": 0.5494, + "MATH Level 5": 0.4932, + "GPQA": 0.307, + "MUSR": 0.443, + "MMLU-PRO": 0.4402 + } + }, + { + "model_id": "gz987/qwen2.5-7b-cabs-v0.4", + "name": "qwen2.5-7b-cabs-v0.4", + "developer": "gz987", + "scores": { + "IFEval": 0.7583, + "BBH": 0.5524, + "MATH Level 5": 0.4849, + "GPQA": 0.3079, + "MUSR": 0.443, + "MMLU-PRO": 0.4396 + } + }, + { + "model_id": "h2oai/h2o-danube-1.8b-chat", + "name": "h2o-danube-1.8b-chat", + "developer": "h2oai", + "scores": { + "IFEval": 0.2199, + "BBH": 0.322, + "MATH Level 5": 0.0136, + "GPQA": 0.2542, + "MUSR": 0.3989, + "MMLU-PRO": 0.1314 + } + }, + { + "model_id": "h2oai/h2o-danube3-4b-base", + "name": "h2o-danube3-4b-base", + "developer": "h2oai", + "scores": { + "IFEval": 0.2338, + "BBH": 0.3599, + "MATH Level 5": 0.0227, + "GPQA": 0.2911, + "MUSR": 0.3778, + "MMLU-PRO": 0.2109 + } + }, + { + "model_id": "h2oai/h2o-danube3-4b-chat", + "name": "h2o-danube3-4b-chat", + "developer": "h2oai", + "scores": { + "IFEval": 0.3629, + "BBH": 0.3466, + "MATH Level 5": 0.0408, + "GPQA": 0.2601, + "MUSR": 0.3781, + "MMLU-PRO": 0.2228 + } + }, + { + "model_id": "h2oai/h2o-danube3-500m-chat", + "name": "h2o-danube3-500m-chat", + "developer": "h2oai", + "scores": { + "IFEval": 0.2208, + "BBH": 0.3035, + "MATH Level 5": 0.0166, + "GPQA": 0.2307, + "MUSR": 0.3434, + "MMLU-PRO": 0.1144 + } + }, + { + "model_id": "h2oai/h2o-danube3.1-4b-chat", + "name": "h2o-danube3.1-4b-chat", + "developer": "h2oai", + "scores": { + "IFEval": 0.5021, + "BBH": 0.3608, + "MATH Level 5": 0.0332, + "GPQA": 0.2852, + "MUSR": 0.4102, + "MMLU-PRO": 0.2719 + } + }, + { + "model_id": "haoranxu/ALMA-13B-R", + "name": "ALMA-13B-R", + "developer": "haoranxu", + "scores": { + "IFEval": 0.0039, + "BBH": 0.3457, + "MATH Level 5": 0.0174, + "GPQA": 0.2576, + "MUSR": 0.3528, + "MMLU-PRO": 0.1817 + } + }, + { + "model_id": "haoranxu/Llama-3-Instruct-8B-CPO-SimPO", + "name": "Llama-3-Instruct-8B-CPO-SimPO", + "developer": "haoranxu", + "scores": { + "IFEval": 0.7046, + "BBH": 0.5048, + "MATH Level 5": 0.1027, + "GPQA": 0.2928, + "MUSR": 0.3567, + "MMLU-PRO": 0.3686 + } + }, + { + "model_id": "haoranxu/Llama-3-Instruct-8B-SimPO", + "name": "Llama-3-Instruct-8B-SimPO", + "developer": "haoranxu", + "scores": { + "IFEval": 0.7347, + "BBH": 0.4979, + "MATH Level 5": 0.0876, + "GPQA": 0.2903, + "MUSR": 0.3566, + "MMLU-PRO": 0.3733 + } + }, + { + "model_id": "hatemmahmoud/qwen2.5-1.5b-sft-raft-grpo-hra-doc", + "name": "qwen2.5-1.5b-sft-raft-grpo-hra-doc", + "developer": "hatemmahmoud", + "scores": { + "IFEval": 0.4196, + "BBH": 0.427, + "MATH Level 5": 0.2175, + "GPQA": 0.2676, + "MUSR": 0.361, + "MMLU-PRO": 0.2776 + } + }, + { + "model_id": "hon9kon9ize/CantoneseLLMChat-v0.5", + "name": "CantoneseLLMChat-v0.5", + "developer": "hon9kon9ize", + "scores": { + "IFEval": 0.3231, + "BBH": 0.4345, + "MATH Level 5": 0.0415, + "GPQA": 0.2777, + "MUSR": 0.4706, + "MMLU-PRO": 0.2504 + } + }, + { + "model_id": "hon9kon9ize/CantoneseLLMChat-v1.0-7B", + "name": "CantoneseLLMChat-v1.0-7B", + "developer": "hon9kon9ize", + "scores": { + "IFEval": 0.4455, + "BBH": 0.4866, + "MATH Level 5": 0.2107, + "GPQA": 0.3221, + "MUSR": 0.3883, + "MMLU-PRO": 0.3785 + } + }, + { + "model_id": "hongbai12/li-0.4-pre", + "name": "li-0.4-pre", + "developer": "hongbai12", + "scores": { + "IFEval": 0.52, + "BBH": 0.6298, + "MATH Level 5": 0.4924, + "GPQA": 0.323, + "MUSR": 0.4513, + "MMLU-PRO": 0.5015 + } + }, + { + "model_id": "hotmailuser/Deepseek-qwen-modelstock-2B", + "name": "Deepseek-qwen-modelstock-2B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.2149, + "BBH": 0.3549, + "MATH Level 5": 0.3399, + "GPQA": 0.2802, + "MUSR": 0.3475, + "MMLU-PRO": 0.1911 + } + }, + { + "model_id": "hotmailuser/Falcon3Slerp1-10B", + "name": "Falcon3Slerp1-10B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.5694, + "BBH": 0.617, + "MATH Level 5": 0.2598, + "GPQA": 0.344, + "MUSR": 0.4318, + "MMLU-PRO": 0.4402 + } + }, + { + "model_id": "hotmailuser/Falcon3Slerp2-10B", + "name": "Falcon3Slerp2-10B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6118, + "BBH": 0.6164, + "MATH Level 5": 0.2319, + "GPQA": 0.3381, + "MUSR": 0.4096, + "MMLU-PRO": 0.4369 + } + }, + { + "model_id": "hotmailuser/Falcon3Slerp4-10B", + "name": "Falcon3Slerp4-10B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6072, + "BBH": 0.6114, + "MATH Level 5": 0.2289, + "GPQA": 0.3289, + "MUSR": 0.4017, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "hotmailuser/FalconSlerp-3B", + "name": "FalconSlerp-3B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.5695, + "BBH": 0.4624, + "MATH Level 5": 0.176, + "GPQA": 0.2878, + "MUSR": 0.3989, + "MMLU-PRO": 0.2968 + } + }, + { + "model_id": "hotmailuser/FalconSlerp1-7B", + "name": "FalconSlerp1-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.5395, + "BBH": 0.5355, + "MATH Level 5": 0.2379, + "GPQA": 0.3196, + "MUSR": 0.4452, + "MMLU-PRO": 0.4129 + } + }, + { + "model_id": "hotmailuser/FalconSlerp2-7B", + "name": "FalconSlerp2-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.616, + "BBH": 0.5538, + "MATH Level 5": 0.2983, + "GPQA": 0.3196, + "MUSR": 0.4479, + "MMLU-PRO": 0.4141 + } + }, + { + "model_id": "hotmailuser/FalconSlerp3-10B", + "name": "FalconSlerp3-10B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6002, + "BBH": 0.606, + "MATH Level 5": 0.2273, + "GPQA": 0.3356, + "MUSR": 0.4031, + "MMLU-PRO": 0.4323 + } + }, + { + "model_id": "hotmailuser/FalconSlerp3-7B", + "name": "FalconSlerp3-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6096, + "BBH": 0.5533, + "MATH Level 5": 0.3157, + "GPQA": 0.3188, + "MUSR": 0.4507, + "MMLU-PRO": 0.4127 + } + }, + { + "model_id": "hotmailuser/FalconSlerp4-7B", + "name": "FalconSlerp4-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6285, + "BBH": 0.5524, + "MATH Level 5": 0.2213, + "GPQA": 0.3322, + "MUSR": 0.4585, + "MMLU-PRO": 0.4032 + } + }, + { + "model_id": "hotmailuser/FalconSlerp6-7B", + "name": "FalconSlerp6-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6027, + "BBH": 0.5384, + "MATH Level 5": 0.2047, + "GPQA": 0.318, + "MUSR": 0.4492, + "MMLU-PRO": 0.3995 + } + }, + { + "model_id": "hotmailuser/Gemma2Crono-27B", + "name": "Gemma2Crono-27B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.7086, + "BBH": 0.6505, + "MATH Level 5": 0.2424, + "GPQA": 0.3708, + "MUSR": 0.4567, + "MMLU-PRO": 0.4633 + } + }, + { + "model_id": "hotmailuser/Gemma2SimPO-27B", + "name": "Gemma2SimPO-27B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.7222, + "BBH": 0.6413, + "MATH Level 5": 0.2817, + "GPQA": 0.3582, + "MUSR": 0.4447, + "MMLU-PRO": 0.4642 + } + }, + { + "model_id": "hotmailuser/Gemma2atlas-27B", + "name": "Gemma2atlas-27B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.7214, + "BBH": 0.6545, + "MATH Level 5": 0.2145, + "GPQA": 0.3557, + "MUSR": 0.4445, + "MMLU-PRO": 0.475 + } + }, + { + "model_id": "hotmailuser/Gemma2magnum-27b", + "name": "Gemma2magnum-27b", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.5051, + "BBH": 0.62, + "MATH Level 5": 0.2205, + "GPQA": 0.3851, + "MUSR": 0.4723, + "MMLU-PRO": 0.4596 + } + }, + { + "model_id": "hotmailuser/Llama-Hermes-slerp-8B", + "name": "Llama-Hermes-slerp-8B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.339, + "BBH": 0.531, + "MATH Level 5": 0.0801, + "GPQA": 0.2936, + "MUSR": 0.4078, + "MMLU-PRO": 0.3331 + } + }, + { + "model_id": "hotmailuser/Llama-Hermes-slerp2-8B", + "name": "Llama-Hermes-slerp2-8B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.3728, + "BBH": 0.5265, + "MATH Level 5": 0.0974, + "GPQA": 0.2961, + "MUSR": 0.4248, + "MMLU-PRO": 0.3379 + } + }, + { + "model_id": "hotmailuser/LlamaStock-8B", + "name": "LlamaStock-8B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.425, + "BBH": 0.5329, + "MATH Level 5": 0.1699, + "GPQA": 0.3272, + "MUSR": 0.4129, + "MMLU-PRO": 0.3807 + } + }, + { + "model_id": "hotmailuser/Mistral-modelstock-24B", + "name": "Mistral-modelstock-24B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.3424, + "BBH": 0.6452, + "MATH Level 5": 0.1307, + "GPQA": 0.4102, + "MUSR": 0.459, + "MMLU-PRO": 0.507 + } + }, + { + "model_id": "hotmailuser/Mistral-modelstock2-24B", + "name": "Mistral-modelstock2-24B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.4318, + "BBH": 0.6689, + "MATH Level 5": 0.2402, + "GPQA": 0.3926, + "MUSR": 0.4616, + "MMLU-PRO": 0.5318 + } + }, + { + "model_id": "hotmailuser/Phi4-Slerp4-14B", + "name": "Phi4-Slerp4-14B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.0629, + "BBH": 0.6731, + "MATH Level 5": 0.3474, + "GPQA": 0.3968, + "MUSR": 0.5097, + "MMLU-PRO": 0.5278 + } + }, + { + "model_id": "hotmailuser/Qwen2.5-HomerSlerp-7B", + "name": "Qwen2.5-HomerSlerp-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.4488, + "BBH": 0.5633, + "MATH Level 5": 0.3316, + "GPQA": 0.3138, + "MUSR": 0.4383, + "MMLU-PRO": 0.4549 + } + }, + { + "model_id": "hotmailuser/QwenModelStock-1.8B", + "name": "QwenModelStock-1.8B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.3263, + "BBH": 0.4188, + "MATH Level 5": 0.0989, + "GPQA": 0.2869, + "MUSR": 0.4359, + "MMLU-PRO": 0.2959 + } + }, + { + "model_id": "hotmailuser/QwenSlerp-14B", + "name": "QwenSlerp-14B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.7025, + "BBH": 0.6491, + "MATH Level 5": 0.3837, + "GPQA": 0.3876, + "MUSR": 0.4634, + "MMLU-PRO": 0.54 + } + }, + { + "model_id": "hotmailuser/QwenSlerp-3B", + "name": "QwenSlerp-3B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.4334, + "BBH": 0.4892, + "MATH Level 5": 0.2749, + "GPQA": 0.2945, + "MUSR": 0.4317, + "MMLU-PRO": 0.3693 + } + }, + { + "model_id": "hotmailuser/QwenSlerp-7B", + "name": "QwenSlerp-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.4673, + "BBH": 0.5636, + "MATH Level 5": 0.3444, + "GPQA": 0.318, + "MUSR": 0.4409, + "MMLU-PRO": 0.4509 + } + }, + { + "model_id": "hotmailuser/QwenSlerp2-14B", + "name": "QwenSlerp2-14B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.7037, + "BBH": 0.6493, + "MATH Level 5": 0.3965, + "GPQA": 0.3809, + "MUSR": 0.4807, + "MMLU-PRO": 0.5379 + } + }, + { + "model_id": "hotmailuser/QwenSlerp2-3B", + "name": "QwenSlerp2-3B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.428, + "BBH": 0.4802, + "MATH Level 5": 0.2606, + "GPQA": 0.297, + "MUSR": 0.4252, + "MMLU-PRO": 0.3742 + } + }, + { + "model_id": "hotmailuser/QwenSlerp3-14B", + "name": "QwenSlerp3-14B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6632, + "BBH": 0.6267, + "MATH Level 5": 0.4305, + "GPQA": 0.3666, + "MUSR": 0.4808, + "MMLU-PRO": 0.5263 + } + }, + { + "model_id": "hotmailuser/QwenSparse-7B", + "name": "QwenSparse-7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.1086, + "BBH": 0.2896, + "MATH Level 5": 0.0106, + "GPQA": 0.2601, + "MUSR": 0.3562, + "MMLU-PRO": 0.1122 + } + }, + { + "model_id": "hotmailuser/QwenStock-0.5B", + "name": "QwenStock-0.5B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.2049, + "BBH": 0.2912, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3575, + "MMLU-PRO": 0.1167 + } + }, + { + "model_id": "hotmailuser/QwenStock-1.7B", + "name": "QwenStock-1.7B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.3214, + "BBH": 0.4188, + "MATH Level 5": 0.0997, + "GPQA": 0.2878, + "MUSR": 0.4412, + "MMLU-PRO": 0.2955 + } + }, + { + "model_id": "hotmailuser/QwenStock1-14B", + "name": "QwenStock1-14B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.6693, + "BBH": 0.6502, + "MATH Level 5": 0.3701, + "GPQA": 0.3859, + "MUSR": 0.4781, + "MMLU-PRO": 0.5416 + } + }, + { + "model_id": "hotmailuser/RombosBeagle-v2beta-MGS-32B", + "name": "RombosBeagle-v2beta-MGS-32B", + "developer": "hotmailuser", + "scores": { + "IFEval": 0.5157, + "BBH": 0.7037, + "MATH Level 5": 0.4992, + "GPQA": 0.38, + "MUSR": 0.5021, + "MMLU-PRO": 0.5908 + } + }, + { + "model_id": "huggyllama/llama-13b", + "name": "llama-13b", + "developer": "huggyllama", + "scores": { + "IFEval": 0.2411, + "BBH": 0.3988, + "MATH Level 5": 0.0204, + "GPQA": 0.255, + "MUSR": 0.3462, + "MMLU-PRO": 0.1952 + } + }, + { + "model_id": "huggyllama/llama-65b", + "name": "llama-65b", + "developer": "huggyllama", + "scores": { + "IFEval": 0.2526, + "BBH": 0.4703, + "MATH Level 5": 0.031, + "GPQA": 0.276, + "MUSR": 0.3595, + "MMLU-PRO": 0.3078 + } + }, + { + "model_id": "huggyllama/llama-7b", + "name": "llama-7b", + "developer": "huggyllama", + "scores": { + "IFEval": 0.2501, + "BBH": 0.3277, + "MATH Level 5": 0.0083, + "GPQA": 0.2525, + "MUSR": 0.3354, + "MMLU-PRO": 0.1313 + } + }, + { + "model_id": "huihui-ai/DeepSeek-R1-Distill-Qwen-14B-abliterated-v2", + "name": "DeepSeek-R1-Distill-Qwen-14B-abliterated-v2", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.4211, + "BBH": 0.3487, + "MATH Level 5": 0.2205, + "GPQA": 0.276, + "MUSR": 0.4701, + "MMLU-PRO": 0.1915 + } + }, + { + "model_id": "huihui-ai/QwQ-32B-Coder-Fusion-7030", + "name": "QwQ-32B-Coder-Fusion-7030", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.3865, + "BBH": 0.6178, + "MATH Level 5": 0.2795, + "GPQA": 0.2844, + "MUSR": 0.3922, + "MMLU-PRO": 0.4368 + } + }, + { + "model_id": "huihui-ai/QwQ-32B-Coder-Fusion-8020", + "name": "QwQ-32B-Coder-Fusion-8020", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.6021, + "BBH": 0.6665, + "MATH Level 5": 0.4592, + "GPQA": 0.3549, + "MUSR": 0.4293, + "MMLU-PRO": 0.5367 + } + }, + { + "model_id": "huihui-ai/QwQ-32B-Coder-Fusion-9010", + "name": "QwQ-32B-Coder-Fusion-9010", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.5778, + "BBH": 0.6727, + "MATH Level 5": 0.5317, + "GPQA": 0.3616, + "MUSR": 0.4682, + "MMLU-PRO": 0.56 + } + }, + { + "model_id": "huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2", + "name": "Qwen2.5-14B-Instruct-abliterated-v2", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.8328, + "BBH": 0.6324, + "MATH Level 5": 0.5302, + "GPQA": 0.3339, + "MUSR": 0.422, + "MMLU-PRO": 0.4962 + } + }, + { + "model_id": "huihui-ai/Qwen2.5-72B-Instruct-abliterated", + "name": "Qwen2.5-72B-Instruct-abliterated", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.8593, + "BBH": 0.719, + "MATH Level 5": 0.6012, + "GPQA": 0.3951, + "MUSR": 0.4233, + "MMLU-PRO": 0.5537 + } + }, + { + "model_id": "huihui-ai/Qwen2.5-7B-Instruct-abliterated", + "name": "Qwen2.5-7B-Instruct-abliterated", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.7546, + "BBH": 0.5262, + "MATH Level 5": 0.4577, + "GPQA": 0.3154, + "MUSR": 0.3967, + "MMLU-PRO": 0.418 + } + }, + { + "model_id": "huihui-ai/Qwen2.5-7B-Instruct-abliterated-v2", + "name": "Qwen2.5-7B-Instruct-abliterated-v2", + "developer": "huihui-ai", + "scores": { + "IFEval": 0.7606, + "BBH": 0.5377, + "MATH Level 5": 0.4637, + "GPQA": 0.3087, + "MUSR": 0.3981, + "MMLU-PRO": 0.4208 + } + }, + { + "model_id": "huu-ontocord/wide_3b_orpo_stage1.1-ss1-orpo3", + "name": "wide_3b_orpo_stage1.1-ss1-orpo3", + "developer": "huu-ontocord", + "scores": { + "IFEval": 0.1505, + "BBH": 0.2937, + "MATH Level 5": 0.0098, + "GPQA": 0.2584, + "MUSR": 0.3618, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "iFaz/llama31_8B_en_emo_v4", + "name": "llama31_8B_en_emo_v4", + "developer": "iFaz", + "scores": { + "IFEval": 0.3043, + "BBH": 0.4916, + "MATH Level 5": 0.0884, + "GPQA": 0.297, + "MUSR": 0.3643, + "MMLU-PRO": 0.3049 + } + }, + { + "model_id": "iFaz/llama32_1B_en_emo_v1", + "name": "llama32_1B_en_emo_v1", + "developer": "iFaz", + "scores": { + "IFEval": 0.4408, + "BBH": 0.338, + "MATH Level 5": 0.0378, + "GPQA": 0.25, + "MUSR": 0.3489, + "MMLU-PRO": 0.1761 + } + }, + { + "model_id": "iFaz/llama32_3B_en_emo_1000_stp", + "name": "llama32_3B_en_emo_1000_stp", + "developer": "iFaz", + "scores": { + "IFEval": 0.7295, + "BBH": 0.4522, + "MATH Level 5": 0.1465, + "GPQA": 0.2777, + "MUSR": 0.3621, + "MMLU-PRO": 0.3123 + } + }, + { + "model_id": "iFaz/llama32_3B_en_emo_2000_stp", + "name": "llama32_3B_en_emo_2000_stp", + "developer": "iFaz", + "scores": { + "IFEval": 0.7369, + "BBH": 0.4535, + "MATH Level 5": 0.1533, + "GPQA": 0.2836, + "MUSR": 0.3527, + "MMLU-PRO": 0.3098 + } + }, + { + "model_id": "iFaz/llama32_3B_en_emo_300_stp", + "name": "llama32_3B_en_emo_300_stp", + "developer": "iFaz", + "scores": { + "IFEval": 0.7256, + "BBH": 0.4505, + "MATH Level 5": 0.1601, + "GPQA": 0.2743, + "MUSR": 0.3621, + "MMLU-PRO": 0.3148 + } + }, + { + "model_id": "iFaz/llama32_3B_en_emo_5000_stp", + "name": "llama32_3B_en_emo_5000_stp", + "developer": "iFaz", + "scores": { + "IFEval": 0.71, + "BBH": 0.4568, + "MATH Level 5": 0.1292, + "GPQA": 0.2794, + "MUSR": 0.3446, + "MMLU-PRO": 0.3067 + } + }, + { + "model_id": "iFaz/llama32_3B_en_emo_v2", + "name": "llama32_3B_en_emo_v2", + "developer": "iFaz", + "scores": { + "IFEval": 0.5454, + "BBH": 0.4284, + "MATH Level 5": 0.1088, + "GPQA": 0.2676, + "MUSR": 0.3482, + "MMLU-PRO": 0.3004 + } + }, + { + "model_id": "iFaz/llama32_3B_en_emo_v3", + "name": "llama32_3B_en_emo_v3", + "developer": "iFaz", + "scores": { + "IFEval": 0.5759, + "BBH": 0.4301, + "MATH Level 5": 0.068, + "GPQA": 0.2676, + "MUSR": 0.3553, + "MMLU-PRO": 0.271 + } + }, + { + "model_id": "iRyanBell/ARC1", + "name": "ARC1", + "developer": "iRyanBell", + "scores": { + "IFEval": 0.4411, + "BBH": 0.4903, + "MATH Level 5": 0.0687, + "GPQA": 0.2945, + "MUSR": 0.3991, + "MMLU-PRO": 0.3371 + } + }, + { + "model_id": "iRyanBell/ARC1-II", + "name": "ARC1-II", + "developer": "iRyanBell", + "scores": { + "IFEval": 0.1708, + "BBH": 0.3382, + "MATH Level 5": 0.0219, + "GPQA": 0.2718, + "MUSR": 0.4913, + "MMLU-PRO": 0.1686 + } + }, + { + "model_id": "ibivibiv/colossus_120b", + "name": "colossus_120b", + "developer": "ibivibiv", + "scores": { + "IFEval": 0.4276, + "BBH": 0.6061, + "MATH Level 5": 0.0566, + "GPQA": 0.3087, + "MUSR": 0.4733, + "MMLU-PRO": 0.3961 + } + }, + { + "model_id": "ibivibiv/multimaster-7b-v6", + "name": "multimaster-7b-v6", + "developer": "ibivibiv", + "scores": { + "IFEval": 0.4473, + "BBH": 0.5194, + "MATH Level 5": 0.0559, + "GPQA": 0.3037, + "MUSR": 0.4396, + "MMLU-PRO": 0.3095 + } + }, + { + "model_id": "ibm-granite/granite-3.0-1b-a400m-base", + "name": "granite-3.0-1b-a400m-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.2404, + "BBH": 0.3221, + "MATH Level 5": 0.0264, + "GPQA": 0.2475, + "MUSR": 0.3367, + "MMLU-PRO": 0.1152 + } + }, + { + "model_id": "ibm-granite/granite-3.0-1b-a400m-instruct", + "name": "granite-3.0-1b-a400m-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.3332, + "BBH": 0.3224, + "MATH Level 5": 0.0279, + "GPQA": 0.2609, + "MUSR": 0.3623, + "MMLU-PRO": 0.1244 + } + }, + { + "model_id": "ibm-granite/granite-3.0-2b-base", + "name": "granite-3.0-2b-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.3874, + "BBH": 0.4047, + "MATH Level 5": 0.0544, + "GPQA": 0.2802, + "MUSR": 0.3434, + "MMLU-PRO": 0.2381 + } + }, + { + "model_id": "ibm-granite/granite-3.0-2b-instruct", + "name": "granite-3.0-2b-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.514, + "BBH": 0.4412, + "MATH Level 5": 0.0921, + "GPQA": 0.2995, + "MUSR": 0.3515, + "MMLU-PRO": 0.2814 + } + }, + { + "model_id": "ibm-granite/granite-3.0-3b-a800m-base", + "name": "granite-3.0-3b-a800m-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.2732, + "BBH": 0.3667, + "MATH Level 5": 0.0483, + "GPQA": 0.2517, + "MUSR": 0.342, + "MMLU-PRO": 0.1891 + } + }, + { + "model_id": "ibm-granite/granite-3.0-3b-a800m-instruct", + "name": "granite-3.0-3b-a800m-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.4298, + "BBH": 0.3753, + "MATH Level 5": 0.0702, + "GPQA": 0.281, + "MUSR": 0.3487, + "MMLU-PRO": 0.2152 + } + }, + { + "model_id": "ibm-granite/granite-3.0-8b-base", + "name": "granite-3.0-8b-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.4583, + "BBH": 0.4944, + "MATH Level 5": 0.1012, + "GPQA": 0.3255, + "MUSR": 0.4081, + "MMLU-PRO": 0.3313 + } + }, + { + "model_id": "ibm-granite/granite-3.0-8b-instruct", + "name": "granite-3.0-8b-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.531, + "BBH": 0.5192, + "MATH Level 5": 0.142, + "GPQA": 0.3322, + "MUSR": 0.3901, + "MMLU-PRO": 0.3457 + } + }, + { + "model_id": "ibm-granite/granite-3.1-1b-a400m-base", + "name": "granite-3.1-1b-a400m-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.2519, + "BBH": 0.3299, + "MATH Level 5": 0.0272, + "GPQA": 0.2517, + "MUSR": 0.3501, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "ibm-granite/granite-3.1-1b-a400m-instruct", + "name": "granite-3.1-1b-a400m-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.4686, + "BBH": 0.328, + "MATH Level 5": 0.0453, + "GPQA": 0.2399, + "MUSR": 0.3302, + "MMLU-PRO": 0.1217 + } + }, + { + "model_id": "ibm-granite/granite-3.1-2b-base", + "name": "granite-3.1-2b-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.3522, + "BBH": 0.4047, + "MATH Level 5": 0.0566, + "GPQA": 0.2777, + "MUSR": 0.3486, + "MMLU-PRO": 0.2251 + } + }, + { + "model_id": "ibm-granite/granite-3.1-2b-instruct", + "name": "granite-3.1-2b-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.6286, + "BBH": 0.4409, + "MATH Level 5": 0.1526, + "GPQA": 0.2894, + "MUSR": 0.3605, + "MMLU-PRO": 0.2819 + } + }, + { + "model_id": "ibm-granite/granite-3.1-3b-a800m-base", + "name": "granite-3.1-3b-a800m-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.2996, + "BBH": 0.3628, + "MATH Level 5": 0.0453, + "GPQA": 0.2777, + "MUSR": 0.3275, + "MMLU-PRO": 0.1793 + } + }, + { + "model_id": "ibm-granite/granite-3.1-3b-a800m-instruct", + "name": "granite-3.1-3b-a800m-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.5516, + "BBH": 0.4009, + "MATH Level 5": 0.114, + "GPQA": 0.2886, + "MUSR": 0.3486, + "MMLU-PRO": 0.2148 + } + }, + { + "model_id": "ibm-granite/granite-3.1-8b-base", + "name": "granite-3.1-8b-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.4221, + "BBH": 0.4777, + "MATH Level 5": 0.0944, + "GPQA": 0.3213, + "MUSR": 0.3922, + "MMLU-PRO": 0.3232 + } + }, + { + "model_id": "ibm-granite/granite-3.1-8b-instruct", + "name": "granite-3.1-8b-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.7208, + "BBH": 0.5364, + "MATH Level 5": 0.2198, + "GPQA": 0.3121, + "MUSR": 0.4707, + "MMLU-PRO": 0.3537 + } + }, + { + "model_id": "ibm-granite/granite-3.2-2b-instruct", + "name": "granite-3.2-2b-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.6152, + "BBH": 0.4387, + "MATH Level 5": 0.1443, + "GPQA": 0.2903, + "MUSR": 0.3646, + "MMLU-PRO": 0.2783 + } + }, + { + "model_id": "ibm-granite/granite-3.2-8b-instruct", + "name": "granite-3.2-8b-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.7275, + "BBH": 0.5402, + "MATH Level 5": 0.2379, + "GPQA": 0.3154, + "MUSR": 0.4562, + "MMLU-PRO": 0.3512 + } + }, + { + "model_id": "ibm-granite/granite-7b-base", + "name": "granite-7b-base", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.2414, + "BBH": 0.348, + "MATH Level 5": 0.0159, + "GPQA": 0.2458, + "MUSR": 0.3555, + "MMLU-PRO": 0.1834 + } + }, + { + "model_id": "ibm-granite/granite-7b-instruct", + "name": "granite-7b-instruct", + "developer": "ibm-granite", + "scores": { + "IFEval": 0.2972, + "BBH": 0.3723, + "MATH Level 5": 0.0204, + "GPQA": 0.2852, + "MUSR": 0.402, + "MMLU-PRO": 0.2286 + } + }, + { + "model_id": "ibm/PowerLM-3b", + "name": "PowerLM-3b", + "developer": "ibm", + "scores": { + "IFEval": 0.3321, + "BBH": 0.3679, + "MATH Level 5": 0.0363, + "GPQA": 0.2752, + "MUSR": 0.3563, + "MMLU-PRO": 0.2016 + } + }, + { + "model_id": "ibm/merlinite-7b", + "name": "merlinite-7b", + "developer": "ibm", + "scores": { + "IFEval": 0.2499, + "BBH": 0.5007, + "MATH Level 5": 0.0242, + "GPQA": 0.297, + "MUSR": 0.4412, + "MMLU-PRO": 0.3068 + } + }, + { + "model_id": "icefog72/Ice0.15-02.10-RP", + "name": "Ice0.15-02.10-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5343, + "BBH": 0.4976, + "MATH Level 5": 0.0574, + "GPQA": 0.2777, + "MUSR": 0.432, + "MMLU-PRO": 0.3066 + } + }, + { + "model_id": "icefog72/Ice0.16-02.10-RP", + "name": "Ice0.16-02.10-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5069, + "BBH": 0.4946, + "MATH Level 5": 0.0589, + "GPQA": 0.2794, + "MUSR": 0.4334, + "MMLU-PRO": 0.3068 + } + }, + { + "model_id": "icefog72/Ice0.17-03.10-RP", + "name": "Ice0.17-03.10-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5124, + "BBH": 0.5007, + "MATH Level 5": 0.0612, + "GPQA": 0.2819, + "MUSR": 0.4334, + "MMLU-PRO": 0.3085 + } + }, + { + "model_id": "icefog72/Ice0.27-06.11-RP", + "name": "Ice0.27-06.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4918, + "BBH": 0.5112, + "MATH Level 5": 0.0566, + "GPQA": 0.3121, + "MUSR": 0.4328, + "MMLU-PRO": 0.3154 + } + }, + { + "model_id": "icefog72/Ice0.29-06.11-RP", + "name": "Ice0.29-06.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4861, + "BBH": 0.5088, + "MATH Level 5": 0.0566, + "GPQA": 0.3029, + "MUSR": 0.4459, + "MMLU-PRO": 0.3093 + } + }, + { + "model_id": "icefog72/Ice0.31-08.11-RP", + "name": "Ice0.31-08.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5146, + "BBH": 0.5032, + "MATH Level 5": 0.0612, + "GPQA": 0.3079, + "MUSR": 0.4277, + "MMLU-PRO": 0.3131 + } + }, + { + "model_id": "icefog72/Ice0.32-10.11-RP", + "name": "Ice0.32-10.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4915, + "BBH": 0.5048, + "MATH Level 5": 0.0514, + "GPQA": 0.3121, + "MUSR": 0.4382, + "MMLU-PRO": 0.31 + } + }, + { + "model_id": "icefog72/Ice0.34b-14.11-RP", + "name": "Ice0.34b-14.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4762, + "BBH": 0.5067, + "MATH Level 5": 0.065, + "GPQA": 0.3096, + "MUSR": 0.442, + "MMLU-PRO": 0.3125 + } + }, + { + "model_id": "icefog72/Ice0.34n-14.11-RP", + "name": "Ice0.34n-14.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4787, + "BBH": 0.5091, + "MATH Level 5": 0.0725, + "GPQA": 0.3138, + "MUSR": 0.438, + "MMLU-PRO": 0.3124 + } + }, + { + "model_id": "icefog72/Ice0.37-18.11-RP", + "name": "Ice0.37-18.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4972, + "BBH": 0.5084, + "MATH Level 5": 0.0642, + "GPQA": 0.3121, + "MUSR": 0.4339, + "MMLU-PRO": 0.3143 + } + }, + { + "model_id": "icefog72/Ice0.38-19.11-RP", + "name": "Ice0.38-19.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4403, + "BBH": 0.5101, + "MATH Level 5": 0.0551, + "GPQA": 0.3045, + "MUSR": 0.4367, + "MMLU-PRO": 0.314 + } + }, + { + "model_id": "icefog72/Ice0.39-19.11-RP", + "name": "Ice0.39-19.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4757, + "BBH": 0.5093, + "MATH Level 5": 0.0498, + "GPQA": 0.3104, + "MUSR": 0.4341, + "MMLU-PRO": 0.3127 + } + }, + { + "model_id": "icefog72/Ice0.40-20.11-RP", + "name": "Ice0.40-20.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4763, + "BBH": 0.5093, + "MATH Level 5": 0.0642, + "GPQA": 0.307, + "MUSR": 0.4446, + "MMLU-PRO": 0.3099 + } + }, + { + "model_id": "icefog72/Ice0.41-22.11-RP", + "name": "Ice0.41-22.11-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.462, + "BBH": 0.4723, + "MATH Level 5": 0.031, + "GPQA": 0.2869, + "MUSR": 0.456, + "MMLU-PRO": 0.2618 + } + }, + { + "model_id": "icefog72/Ice0.50-16.01-RP", + "name": "Ice0.50-16.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4385, + "BBH": 0.498, + "MATH Level 5": 0.0468, + "GPQA": 0.2995, + "MUSR": 0.4381, + "MMLU-PRO": 0.3069 + } + }, + { + "model_id": "icefog72/Ice0.50.1-16.01-RP", + "name": "Ice0.50.1-16.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4829, + "BBH": 0.5107, + "MATH Level 5": 0.0612, + "GPQA": 0.3096, + "MUSR": 0.4327, + "MMLU-PRO": 0.3132 + } + }, + { + "model_id": "icefog72/Ice0.51-16.01-RP", + "name": "Ice0.51-16.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4431, + "BBH": 0.5044, + "MATH Level 5": 0.0514, + "GPQA": 0.3045, + "MUSR": 0.4437, + "MMLU-PRO": 0.306 + } + }, + { + "model_id": "icefog72/Ice0.51.1-16.01-RP", + "name": "Ice0.51.1-16.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4573, + "BBH": 0.5121, + "MATH Level 5": 0.0642, + "GPQA": 0.3062, + "MUSR": 0.4394, + "MMLU-PRO": 0.3104 + } + }, + { + "model_id": "icefog72/Ice0.52-16.01-RP", + "name": "Ice0.52-16.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4503, + "BBH": 0.5047, + "MATH Level 5": 0.0506, + "GPQA": 0.3087, + "MUSR": 0.4396, + "MMLU-PRO": 0.308 + } + }, + { + "model_id": "icefog72/Ice0.52.1-16.01-RP", + "name": "Ice0.52.1-16.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4549, + "BBH": 0.5106, + "MATH Level 5": 0.0627, + "GPQA": 0.3037, + "MUSR": 0.4394, + "MMLU-PRO": 0.3105 + } + }, + { + "model_id": "icefog72/Ice0.53-16.01-RP", + "name": "Ice0.53-16.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4741, + "BBH": 0.5102, + "MATH Level 5": 0.0634, + "GPQA": 0.3087, + "MUSR": 0.4327, + "MMLU-PRO": 0.313 + } + }, + { + "model_id": "icefog72/Ice0.54-17.01-RP", + "name": "Ice0.54-17.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4379, + "BBH": 0.4853, + "MATH Level 5": 0.0408, + "GPQA": 0.3096, + "MUSR": 0.4874, + "MMLU-PRO": 0.2326 + } + }, + { + "model_id": "icefog72/Ice0.55-17.01-RP", + "name": "Ice0.55-17.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4961, + "BBH": 0.5077, + "MATH Level 5": 0.0604, + "GPQA": 0.2869, + "MUSR": 0.4725, + "MMLU-PRO": 0.2658 + } + }, + { + "model_id": "icefog72/Ice0.57-17.01-RP", + "name": "Ice0.57-17.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5152, + "BBH": 0.5064, + "MATH Level 5": 0.0514, + "GPQA": 0.297, + "MUSR": 0.4686, + "MMLU-PRO": 0.2651 + } + }, + { + "model_id": "icefog72/Ice0.60-18.01-RP", + "name": "Ice0.60-18.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5374, + "BBH": 0.5094, + "MATH Level 5": 0.0536, + "GPQA": 0.3045, + "MUSR": 0.467, + "MMLU-PRO": 0.2837 + } + }, + { + "model_id": "icefog72/Ice0.60.1-18.01-RP", + "name": "Ice0.60.1-18.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5188, + "BBH": 0.512, + "MATH Level 5": 0.0461, + "GPQA": 0.302, + "MUSR": 0.4498, + "MMLU-PRO": 0.2914 + } + }, + { + "model_id": "icefog72/Ice0.61-18.01-RP", + "name": "Ice0.61-18.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5441, + "BBH": 0.5105, + "MATH Level 5": 0.0468, + "GPQA": 0.2987, + "MUSR": 0.4697, + "MMLU-PRO": 0.2709 + } + }, + { + "model_id": "icefog72/Ice0.62-18.01-RP", + "name": "Ice0.62-18.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5367, + "BBH": 0.5103, + "MATH Level 5": 0.0574, + "GPQA": 0.2978, + "MUSR": 0.4538, + "MMLU-PRO": 0.2877 + } + }, + { + "model_id": "icefog72/Ice0.62.1-24.01-RP", + "name": "Ice0.62.1-24.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5182, + "BBH": 0.5109, + "MATH Level 5": 0.0559, + "GPQA": 0.3003, + "MUSR": 0.4551, + "MMLU-PRO": 0.2871 + } + }, + { + "model_id": "icefog72/Ice0.64-24.01-RP", + "name": "Ice0.64-24.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5441, + "BBH": 0.506, + "MATH Level 5": 0.0627, + "GPQA": 0.3037, + "MUSR": 0.462, + "MMLU-PRO": 0.2933 + } + }, + { + "model_id": "icefog72/Ice0.64.1-24.01-RP", + "name": "Ice0.64.1-24.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5447, + "BBH": 0.506, + "MATH Level 5": 0.0627, + "GPQA": 0.3037, + "MUSR": 0.462, + "MMLU-PRO": 0.2933 + } + }, + { + "model_id": "icefog72/Ice0.65-25.01-RP", + "name": "Ice0.65-25.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5029, + "BBH": 0.5096, + "MATH Level 5": 0.065, + "GPQA": 0.3045, + "MUSR": 0.434, + "MMLU-PRO": 0.2997 + } + }, + { + "model_id": "icefog72/Ice0.66-25.01-RP", + "name": "Ice0.66-25.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5325, + "BBH": 0.5129, + "MATH Level 5": 0.0604, + "GPQA": 0.307, + "MUSR": 0.4434, + "MMLU-PRO": 0.3039 + } + }, + { + "model_id": "icefog72/Ice0.67-25.01-RP", + "name": "Ice0.67-25.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5361, + "BBH": 0.5113, + "MATH Level 5": 0.0748, + "GPQA": 0.2852, + "MUSR": 0.4279, + "MMLU-PRO": 0.3097 + } + }, + { + "model_id": "icefog72/Ice0.68-25.01-RP", + "name": "Ice0.68-25.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5514, + "BBH": 0.513, + "MATH Level 5": 0.0725, + "GPQA": 0.3104, + "MUSR": 0.4446, + "MMLU-PRO": 0.3012 + } + }, + { + "model_id": "icefog72/Ice0.69-25.01-RP", + "name": "Ice0.69-25.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5438, + "BBH": 0.5098, + "MATH Level 5": 0.0566, + "GPQA": 0.3129, + "MUSR": 0.4486, + "MMLU-PRO": 0.2965 + } + }, + { + "model_id": "icefog72/Ice0.7-29.09-RP", + "name": "Ice0.7-29.09-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5176, + "BBH": 0.5048, + "MATH Level 5": 0.0665, + "GPQA": 0.2878, + "MUSR": 0.4238, + "MMLU-PRO": 0.3127 + } + }, + { + "model_id": "icefog72/Ice0.70-25.01-RP", + "name": "Ice0.70-25.01-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5498, + "BBH": 0.5136, + "MATH Level 5": 0.0597, + "GPQA": 0.3079, + "MUSR": 0.4512, + "MMLU-PRO": 0.2996 + } + }, + { + "model_id": "icefog72/Ice0.70.1-01.02-RP", + "name": "Ice0.70.1-01.02-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.507, + "BBH": 0.506, + "MATH Level 5": 0.034, + "GPQA": 0.2978, + "MUSR": 0.4599, + "MMLU-PRO": 0.2749 + } + }, + { + "model_id": "icefog72/Ice0.73-01.02-RP", + "name": "Ice0.73-01.02-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5292, + "BBH": 0.5103, + "MATH Level 5": 0.0385, + "GPQA": 0.2911, + "MUSR": 0.4664, + "MMLU-PRO": 0.2702 + } + }, + { + "model_id": "icefog72/Ice0.74-02.02-RP", + "name": "Ice0.74-02.02-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.2935, + "BBH": 0.4646, + "MATH Level 5": 0.0015, + "GPQA": 0.2961, + "MUSR": 0.428, + "MMLU-PRO": 0.2143 + } + }, + { + "model_id": "icefog72/Ice0.76-02.02-RP", + "name": "Ice0.76-02.02-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4529, + "BBH": 0.5086, + "MATH Level 5": 0.0144, + "GPQA": 0.2869, + "MUSR": 0.4362, + "MMLU-PRO": 0.2652 + } + }, + { + "model_id": "icefog72/Ice0.77-02.02-RP", + "name": "Ice0.77-02.02-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.531, + "BBH": 0.5109, + "MATH Level 5": 0.0393, + "GPQA": 0.2852, + "MUSR": 0.4765, + "MMLU-PRO": 0.2999 + } + }, + { + "model_id": "icefog72/Ice0.78-02.02-RP", + "name": "Ice0.78-02.02-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4053, + "BBH": 0.5002, + "MATH Level 5": 0.0438, + "GPQA": 0.2936, + "MUSR": 0.4686, + "MMLU-PRO": 0.2955 + } + }, + { + "model_id": "icefog72/Ice0.80-03.02-RP", + "name": "Ice0.80-03.02-RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.5516, + "BBH": 0.5098, + "MATH Level 5": 0.0559, + "GPQA": 0.2785, + "MUSR": 0.4923, + "MMLU-PRO": 0.2912 + } + }, + { + "model_id": "icefog72/IceCocoaRP-7b", + "name": "IceCocoaRP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.4962, + "BBH": 0.4938, + "MATH Level 5": 0.0574, + "GPQA": 0.2953, + "MUSR": 0.4198, + "MMLU-PRO": 0.3098 + } + }, + { + "model_id": "icefog72/IceCoffeeRP-7b", + "name": "IceCoffeeRP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.4959, + "BBH": 0.4889, + "MATH Level 5": 0.0544, + "GPQA": 0.2852, + "MUSR": 0.416, + "MMLU-PRO": 0.2975 + } + }, + { + "model_id": "icefog72/IceDrinkByFrankensteinV3RP", + "name": "IceDrinkByFrankensteinV3RP", + "developer": "icefog72", + "scores": { + "IFEval": 0.4975, + "BBH": 0.4833, + "MATH Level 5": 0.0506, + "GPQA": 0.2617, + "MUSR": 0.4253, + "MMLU-PRO": 0.2927 + } + }, + { + "model_id": "icefog72/IceDrinkNameGoesHereRP-7b-Model_Stock", + "name": "IceDrinkNameGoesHereRP-7b-Model_Stock", + "developer": "icefog72", + "scores": { + "IFEval": 0.4968, + "BBH": 0.4658, + "MATH Level 5": 0.0408, + "GPQA": 0.2685, + "MUSR": 0.4067, + "MMLU-PRO": 0.2817 + } + }, + { + "model_id": "icefog72/IceDrinkNameNotFoundRP-7b-Model_Stock", + "name": "IceDrinkNameNotFoundRP-7b-Model_Stock", + "developer": "icefog72", + "scores": { + "IFEval": 0.513, + "BBH": 0.5026, + "MATH Level 5": 0.0604, + "GPQA": 0.2777, + "MUSR": 0.4372, + "MMLU-PRO": 0.3064 + } + }, + { + "model_id": "icefog72/IceDrunkCherryRP-7b", + "name": "IceDrunkCherryRP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.4898, + "BBH": 0.4847, + "MATH Level 5": 0.0612, + "GPQA": 0.2768, + "MUSR": 0.4292, + "MMLU-PRO": 0.3009 + } + }, + { + "model_id": "icefog72/IceDrunkenCherryRP-7b", + "name": "IceDrunkenCherryRP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.4763, + "BBH": 0.5093, + "MATH Level 5": 0.0642, + "GPQA": 0.307, + "MUSR": 0.4446, + "MMLU-PRO": 0.3099 + } + }, + { + "model_id": "icefog72/IceEspressoRPv2-7b", + "name": "IceEspressoRPv2-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.4977, + "BBH": 0.5055, + "MATH Level 5": 0.0619, + "GPQA": 0.2894, + "MUSR": 0.4331, + "MMLU-PRO": 0.3061 + } + }, + { + "model_id": "icefog72/IceLemonTeaRP-32k-7b", + "name": "IceLemonTeaRP-32k-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.5212, + "BBH": 0.4997, + "MATH Level 5": 0.0544, + "GPQA": 0.2903, + "MUSR": 0.429, + "MMLU-PRO": 0.3068 + } + }, + { + "model_id": "icefog72/IceMartiniRP-7b", + "name": "IceMartiniRP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.5045, + "BBH": 0.4972, + "MATH Level 5": 0.0665, + "GPQA": 0.2794, + "MUSR": 0.4345, + "MMLU-PRO": 0.3073 + } + }, + { + "model_id": "icefog72/IceNalyvkaRP-7b", + "name": "IceNalyvkaRP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.5498, + "BBH": 0.5136, + "MATH Level 5": 0.0597, + "GPQA": 0.3079, + "MUSR": 0.4512, + "MMLU-PRO": 0.2996 + } + }, + { + "model_id": "icefog72/IceSakeRP-7b", + "name": "IceSakeRP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.5228, + "BBH": 0.5119, + "MATH Level 5": 0.0634, + "GPQA": 0.2852, + "MUSR": 0.413, + "MMLU-PRO": 0.3177 + } + }, + { + "model_id": "icefog72/IceSakeV4RP-7b", + "name": "IceSakeV4RP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.4634, + "BBH": 0.493, + "MATH Level 5": 0.0559, + "GPQA": 0.2945, + "MUSR": 0.4082, + "MMLU-PRO": 0.3103 + } + }, + { + "model_id": "icefog72/IceSakeV6RP-7b", + "name": "IceSakeV6RP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.5033, + "BBH": 0.4976, + "MATH Level 5": 0.0619, + "GPQA": 0.2911, + "MUSR": 0.42, + "MMLU-PRO": 0.3093 + } + }, + { + "model_id": "icefog72/IceSakeV8RP-7b", + "name": "IceSakeV8RP-7b", + "developer": "icefog72", + "scores": { + "IFEval": 0.6086, + "BBH": 0.4885, + "MATH Level 5": 0.0597, + "GPQA": 0.276, + "MUSR": 0.3993, + "MMLU-PRO": 0.301 + } + }, + { + "model_id": "icefog72/IceTea21EnergyDrinkRPV13-DPOv3", + "name": "IceTea21EnergyDrinkRPV13-DPOv3", + "developer": "icefog72", + "scores": { + "IFEval": 0.5263, + "BBH": 0.502, + "MATH Level 5": 0.0582, + "GPQA": 0.2836, + "MUSR": 0.4372, + "MMLU-PRO": 0.3056 + } + }, + { + "model_id": "icefog72/IceTea21EnergyDrinkRPV13-DPOv3.5", + "name": "IceTea21EnergyDrinkRPV13-DPOv3.5", + "developer": "icefog72", + "scores": { + "IFEval": 0.4871, + "BBH": 0.44, + "MATH Level 5": 0.0363, + "GPQA": 0.2844, + "MUSR": 0.3964, + "MMLU-PRO": 0.2498 + } + }, + { + "model_id": "ifable/gemma-2-Ifable-9B", + "name": "gemma-2-Ifable-9B", + "developer": "ifable", + "scores": { + "IFEval": 0.2984, + "BBH": 0.5866, + "MATH Level 5": 0.1397, + "GPQA": 0.3414, + "MUSR": 0.4053, + "MMLU-PRO": 0.4226 + } + }, + { + "model_id": "ilsp/Llama-Krikri-8B-Instruct", + "name": "Llama-Krikri-8B-Instruct", + "developer": "ilsp", + "scores": { + "IFEval": 0.6079, + "BBH": 0.5047, + "MATH Level 5": 0.1178, + "GPQA": 0.3029, + "MUSR": 0.408, + "MMLU-PRO": 0.3313 + } + }, + { + "model_id": "inflatebot/MN-12B-Mag-Mell-R1", + "name": "MN-12B-Mag-Mell-R1", + "developer": "inflatebot", + "scores": { + "IFEval": 0.4613, + "BBH": 0.5304, + "MATH Level 5": 0.1299, + "GPQA": 0.3163, + "MUSR": 0.4002, + "MMLU-PRO": 0.3438 + } + }, + { + "model_id": "informatiker/Qwen2-7B-Instruct-abliterated", + "name": "Qwen2-7B-Instruct-abliterated", + "developer": "informatiker", + "scores": { + "IFEval": 0.5822, + "BBH": 0.5534, + "MATH Level 5": 0.2636, + "GPQA": 0.3012, + "MUSR": 0.3888, + "MMLU-PRO": 0.3873 + } + }, + { + "model_id": "insightfactory/Llama-3.2-3B-Instruct-unsloth-bnb-4bitlora_model", + "name": "Llama-3.2-3B-Instruct-unsloth-bnb-4bitlora_model", + "developer": "insightfactory", + "scores": { + "IFEval": 0.4588, + "BBH": 0.4146, + "MATH Level 5": 0.105, + "GPQA": 0.2718, + "MUSR": 0.3499, + "MMLU-PRO": 0.296 + } + }, + { + "model_id": "instruction-pretrain/InstructLM-500M", + "name": "InstructLM-500M", + "developer": "instruction-pretrain", + "scores": { + "IFEval": 0.1028, + "BBH": 0.2941, + "MATH Level 5": 0.0, + "GPQA": 0.2567, + "MUSR": 0.3528, + "MMLU-PRO": 0.1141 + } + }, + { + "model_id": "internlm/internlm2-1_8b", + "name": "internlm2-1_8b", + "developer": "internlm", + "scores": { + "IFEval": 0.2198, + "BBH": 0.388, + "MATH Level 5": 0.0211, + "GPQA": 0.2483, + "MUSR": 0.3813, + "MMLU-PRO": 0.1588 + } + }, + { + "model_id": "internlm/internlm2-7b", + "name": "internlm2-7b", + "developer": "internlm", + "scores": { + "IFEval": 0.228, + "BBH": 0.5825, + "MATH Level 5": 0.0857, + "GPQA": 0.3367, + "MUSR": 0.44, + "MMLU-PRO": 0.19 + } + }, + { + "model_id": "internlm/internlm2-chat-1_8b", + "name": "internlm2-chat-1_8b", + "developer": "internlm", + "scores": { + "IFEval": 0.2387, + "BBH": 0.4452, + "MATH Level 5": 0.0325, + "GPQA": 0.2659, + "MUSR": 0.3631, + "MMLU-PRO": 0.1839 + } + }, + { + "model_id": "internlm/internlm2_5-1_8b-chat", + "name": "internlm2_5-1_8b-chat", + "developer": "internlm", + "scores": { + "IFEval": 0.3849, + "BBH": 0.4489, + "MATH Level 5": 0.1586, + "GPQA": 0.2903, + "MUSR": 0.3594, + "MMLU-PRO": 0.1299 + } + }, + { + "model_id": "internlm/internlm2_5-20b-chat", + "name": "internlm2_5-20b-chat", + "developer": "internlm", + "scores": { + "IFEval": 0.701, + "BBH": 0.7474, + "MATH Level 5": 0.4079, + "GPQA": 0.3213, + "MUSR": 0.4558, + "MMLU-PRO": 0.3998 + } + }, + { + "model_id": "internlm/internlm2_5-7b-chat", + "name": "internlm2_5-7b-chat", + "developer": "internlm", + "scores": { + "IFEval": 0.5539, + "BBH": 0.7073, + "MATH Level 5": 0.253, + "GPQA": 0.3473, + "MUSR": 0.4594, + "MMLU-PRO": 0.3777 + } + }, + { + "model_id": "intervitens/mini-magnum-12b-v1.1", + "name": "mini-magnum-12b-v1.1", + "developer": "intervitens", + "scores": { + "IFEval": 0.5156, + "BBH": 0.5062, + "MATH Level 5": 0.0619, + "GPQA": 0.2886, + "MUSR": 0.4004, + "MMLU-PRO": 0.3291 + } + }, + { + "model_id": "inumulaisk/eval_model", + "name": "eval_model", + "developer": "inumulaisk", + "scores": { + "IFEval": 0.1931, + "BBH": 0.3512, + "MATH Level 5": 0.2976, + "GPQA": 0.2794, + "MUSR": 0.358, + "MMLU-PRO": 0.1664 + } + }, + { + "model_id": "invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp", + "name": "Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp", + "developer": "invalid-coder", + "scores": { + "IFEval": 0.4555, + "BBH": 0.5158, + "MATH Level 5": 0.0491, + "GPQA": 0.3054, + "MUSR": 0.3992, + "MMLU-PRO": 0.3146 + } + }, + { + "model_id": "invisietch/EtherealRainbow-v0.2-8B", + "name": "EtherealRainbow-v0.2-8B", + "developer": "invisietch", + "scores": { + "IFEval": 0.3903, + "BBH": 0.5102, + "MATH Level 5": 0.0823, + "GPQA": 0.3029, + "MUSR": 0.3827, + "MMLU-PRO": 0.3653 + } + }, + { + "model_id": "invisietch/EtherealRainbow-v0.3-8B", + "name": "EtherealRainbow-v0.3-8B", + "developer": "invisietch", + "scores": { + "IFEval": 0.3682, + "BBH": 0.5097, + "MATH Level 5": 0.0763, + "GPQA": 0.3045, + "MUSR": 0.3904, + "MMLU-PRO": 0.3626 + } + }, + { + "model_id": "invisietch/MiS-Firefly-v0.2-22B", + "name": "MiS-Firefly-v0.2-22B", + "developer": "invisietch", + "scores": { + "IFEval": 0.5371, + "BBH": 0.5514, + "MATH Level 5": 0.1654, + "GPQA": 0.3045, + "MUSR": 0.4694, + "MMLU-PRO": 0.362 + } + }, + { + "model_id": "invisietch/Nimbus-Miqu-v0.1-70B", + "name": "Nimbus-Miqu-v0.1-70B", + "developer": "invisietch", + "scores": { + "IFEval": 0.4647, + "BBH": 0.601, + "MATH Level 5": 0.0604, + "GPQA": 0.3389, + "MUSR": 0.4133, + "MMLU-PRO": 0.3853 + } + }, + { + "model_id": "irahulpandey/mistralai-7B-slerp-v0.1", + "name": "mistralai-7B-slerp-v0.1", + "developer": "irahulpandey", + "scores": { + "IFEval": 0.4966, + "BBH": 0.5011, + "MATH Level 5": 0.0514, + "GPQA": 0.3037, + "MUSR": 0.455, + "MMLU-PRO": 0.2951 + } + }, + { + "model_id": "jaredjoss/pythia-410m-roberta-lr_8e7-kl_01-steps_12000-rlhf-model", + "name": "pythia-410m-roberta-lr_8e7-kl_01-steps_12000-rlhf-model", + "developer": "jaredjoss", + "scores": { + "IFEval": 0.1572, + "BBH": 0.2863, + "MATH Level 5": 0.0, + "GPQA": 0.2592, + "MUSR": 0.3607, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "jaspionjader/Auro-Kosmos-EVAA-v2-8B", + "name": "Auro-Kosmos-EVAA-v2-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4778, + "BBH": 0.5447, + "MATH Level 5": 0.1412, + "GPQA": 0.3154, + "MUSR": 0.425, + "MMLU-PRO": 0.3858 + } + }, + { + "model_id": "jaspionjader/Auro-Kosmos-EVAA-v2.1-8B", + "name": "Auro-Kosmos-EVAA-v2.1-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4666, + "BBH": 0.5444, + "MATH Level 5": 0.1458, + "GPQA": 0.3087, + "MUSR": 0.4317, + "MMLU-PRO": 0.3826 + } + }, + { + "model_id": "jaspionjader/Auro-Kosmos-EVAA-v2.2-8B", + "name": "Auro-Kosmos-EVAA-v2.2-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4268, + "BBH": 0.5431, + "MATH Level 5": 0.1412, + "GPQA": 0.3104, + "MUSR": 0.4251, + "MMLU-PRO": 0.3798 + } + }, + { + "model_id": "jaspionjader/Auro-Kosmos-EVAA-v2.3-8B", + "name": "Auro-Kosmos-EVAA-v2.3-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4271, + "BBH": 0.5441, + "MATH Level 5": 0.1344, + "GPQA": 0.3121, + "MUSR": 0.4278, + "MMLU-PRO": 0.3784 + } + }, + { + "model_id": "jaspionjader/Kosmos-Aurora_faustus-8B", + "name": "Kosmos-Aurora_faustus-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4432, + "BBH": 0.526, + "MATH Level 5": 0.1125, + "GPQA": 0.2953, + "MUSR": 0.4117, + "MMLU-PRO": 0.3813 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-8B", + "name": "Kosmos-EVAA-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4405, + "BBH": 0.5312, + "MATH Level 5": 0.1178, + "GPQA": 0.2995, + "MUSR": 0.4237, + "MMLU-PRO": 0.3818 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-Franken-Immersive-v39-8B", + "name": "Kosmos-EVAA-Franken-Immersive-v39-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4378, + "BBH": 0.519, + "MATH Level 5": 0.1292, + "GPQA": 0.3154, + "MUSR": 0.4236, + "MMLU-PRO": 0.39 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-Franken-v38-8B", + "name": "Kosmos-EVAA-Franken-v38-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4356, + "BBH": 0.523, + "MATH Level 5": 0.1292, + "GPQA": 0.3087, + "MUSR": 0.4212, + "MMLU-PRO": 0.389 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-Fusion-8B", + "name": "Kosmos-EVAA-Fusion-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4418, + "BBH": 0.5406, + "MATH Level 5": 0.1352, + "GPQA": 0.3062, + "MUSR": 0.4277, + "MMLU-PRO": 0.386 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-8B", + "name": "Kosmos-EVAA-PRP-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.3405, + "BBH": 0.5196, + "MATH Level 5": 0.0884, + "GPQA": 0.3129, + "MUSR": 0.4301, + "MMLU-PRO": 0.3647 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-light-8B", + "name": "Kosmos-EVAA-PRP-light-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.3824, + "BBH": 0.5271, + "MATH Level 5": 0.1103, + "GPQA": 0.3121, + "MUSR": 0.4249, + "MMLU-PRO": 0.3782 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v23-8B", + "name": "Kosmos-EVAA-PRP-v23-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4041, + "BBH": 0.529, + "MATH Level 5": 0.1156, + "GPQA": 0.3087, + "MUSR": 0.4368, + "MMLU-PRO": 0.3706 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v24-8B", + "name": "Kosmos-EVAA-PRP-v24-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4259, + "BBH": 0.5276, + "MATH Level 5": 0.1103, + "GPQA": 0.3104, + "MUSR": 0.429, + "MMLU-PRO": 0.3779 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v25-8B", + "name": "Kosmos-EVAA-PRP-v25-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4421, + "BBH": 0.5291, + "MATH Level 5": 0.1186, + "GPQA": 0.318, + "MUSR": 0.4303, + "MMLU-PRO": 0.3716 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v26-8B", + "name": "Kosmos-EVAA-PRP-v26-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4414, + "BBH": 0.5271, + "MATH Level 5": 0.1133, + "GPQA": 0.3045, + "MUSR": 0.4264, + "MMLU-PRO": 0.3793 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v27-8B", + "name": "Kosmos-EVAA-PRP-v27-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4378, + "BBH": 0.529, + "MATH Level 5": 0.1193, + "GPQA": 0.3087, + "MUSR": 0.4343, + "MMLU-PRO": 0.3755 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v28-8B", + "name": "Kosmos-EVAA-PRP-v28-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4366, + "BBH": 0.5295, + "MATH Level 5": 0.1171, + "GPQA": 0.307, + "MUSR": 0.433, + "MMLU-PRO": 0.375 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v29-8B", + "name": "Kosmos-EVAA-PRP-v29-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4487, + "BBH": 0.5275, + "MATH Level 5": 0.1201, + "GPQA": 0.3104, + "MUSR": 0.4237, + "MMLU-PRO": 0.3765 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v30-8B", + "name": "Kosmos-EVAA-PRP-v30-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4295, + "BBH": 0.5328, + "MATH Level 5": 0.1178, + "GPQA": 0.3045, + "MUSR": 0.4263, + "MMLU-PRO": 0.3938 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v31-8B", + "name": "Kosmos-EVAA-PRP-v31-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4399, + "BBH": 0.5315, + "MATH Level 5": 0.1133, + "GPQA": 0.3138, + "MUSR": 0.4251, + "MMLU-PRO": 0.3935 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v32-8B", + "name": "Kosmos-EVAA-PRP-v32-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4487, + "BBH": 0.5293, + "MATH Level 5": 0.1148, + "GPQA": 0.3163, + "MUSR": 0.4211, + "MMLU-PRO": 0.3777 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v33-8B", + "name": "Kosmos-EVAA-PRP-v33-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4302, + "BBH": 0.5321, + "MATH Level 5": 0.1178, + "GPQA": 0.3129, + "MUSR": 0.4184, + "MMLU-PRO": 0.3909 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-PRP-v34-8B", + "name": "Kosmos-EVAA-PRP-v34-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4563, + "BBH": 0.5333, + "MATH Level 5": 0.1125, + "GPQA": 0.3112, + "MUSR": 0.4237, + "MMLU-PRO": 0.3927 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-TSN-8B", + "name": "Kosmos-EVAA-TSN-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4721, + "BBH": 0.5177, + "MATH Level 5": 0.1344, + "GPQA": 0.3029, + "MUSR": 0.4329, + "MMLU-PRO": 0.3816 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-TSN-light-8B", + "name": "Kosmos-EVAA-TSN-light-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4685, + "BBH": 0.5235, + "MATH Level 5": 0.1216, + "GPQA": 0.3045, + "MUSR": 0.4289, + "MMLU-PRO": 0.3806 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-TSN-v19-8B", + "name": "Kosmos-EVAA-TSN-v19-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4564, + "BBH": 0.5316, + "MATH Level 5": 0.1156, + "GPQA": 0.3054, + "MUSR": 0.4277, + "MMLU-PRO": 0.379 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-TSN-v20-8B", + "name": "Kosmos-EVAA-TSN-v20-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4423, + "BBH": 0.525, + "MATH Level 5": 0.1246, + "GPQA": 0.3138, + "MUSR": 0.421, + "MMLU-PRO": 0.3936 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-TSN-v21-8B", + "name": "Kosmos-EVAA-TSN-v21-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.467, + "BBH": 0.5248, + "MATH Level 5": 0.1193, + "GPQA": 0.3121, + "MUSR": 0.4343, + "MMLU-PRO": 0.3816 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-TSN-v22-8B", + "name": "Kosmos-EVAA-TSN-v22-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4673, + "BBH": 0.5246, + "MATH Level 5": 0.1133, + "GPQA": 0.307, + "MUSR": 0.4303, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-8B", + "name": "Kosmos-EVAA-gamma-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4572, + "BBH": 0.5322, + "MATH Level 5": 0.105, + "GPQA": 0.3188, + "MUSR": 0.4306, + "MMLU-PRO": 0.3901 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-alt-8B", + "name": "Kosmos-EVAA-gamma-alt-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4542, + "BBH": 0.5298, + "MATH Level 5": 0.1095, + "GPQA": 0.3247, + "MUSR": 0.4292, + "MMLU-PRO": 0.3896 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-light-8B", + "name": "Kosmos-EVAA-gamma-light-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4581, + "BBH": 0.5376, + "MATH Level 5": 0.1103, + "GPQA": 0.3163, + "MUSR": 0.4291, + "MMLU-PRO": 0.3943 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-light-alt-8B", + "name": "Kosmos-EVAA-gamma-light-alt-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4454, + "BBH": 0.5327, + "MATH Level 5": 0.1133, + "GPQA": 0.3138, + "MUSR": 0.4305, + "MMLU-PRO": 0.3923 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-ultra-light-8B", + "name": "Kosmos-EVAA-gamma-ultra-light-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4563, + "BBH": 0.5316, + "MATH Level 5": 0.1178, + "GPQA": 0.3163, + "MUSR": 0.4197, + "MMLU-PRO": 0.3915 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-v13-8B", + "name": "Kosmos-EVAA-gamma-v13-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4429, + "BBH": 0.5359, + "MATH Level 5": 0.1118, + "GPQA": 0.3138, + "MUSR": 0.4278, + "MMLU-PRO": 0.393 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-v14-8B", + "name": "Kosmos-EVAA-gamma-v14-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.438, + "BBH": 0.5363, + "MATH Level 5": 0.1103, + "GPQA": 0.3129, + "MUSR": 0.4277, + "MMLU-PRO": 0.3931 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-v15-8B", + "name": "Kosmos-EVAA-gamma-v15-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4654, + "BBH": 0.5343, + "MATH Level 5": 0.111, + "GPQA": 0.3112, + "MUSR": 0.4277, + "MMLU-PRO": 0.3941 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-v16-8B", + "name": "Kosmos-EVAA-gamma-v16-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4557, + "BBH": 0.5344, + "MATH Level 5": 0.1171, + "GPQA": 0.3154, + "MUSR": 0.4264, + "MMLU-PRO": 0.3917 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-v17-8B", + "name": "Kosmos-EVAA-gamma-v17-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4462, + "BBH": 0.5347, + "MATH Level 5": 0.111, + "GPQA": 0.3112, + "MUSR": 0.4291, + "MMLU-PRO": 0.3923 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-gamma-v18-8B", + "name": "Kosmos-EVAA-gamma-v18-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4341, + "BBH": 0.5339, + "MATH Level 5": 0.111, + "GPQA": 0.3112, + "MUSR": 0.4317, + "MMLU-PRO": 0.3905 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-immersive-sof-v44-8B", + "name": "Kosmos-EVAA-immersive-sof-v44-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4408, + "BBH": 0.5215, + "MATH Level 5": 0.1186, + "GPQA": 0.3096, + "MUSR": 0.4144, + "MMLU-PRO": 0.3888 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v10-8B", + "name": "Kosmos-EVAA-v10-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4262, + "BBH": 0.5376, + "MATH Level 5": 0.1246, + "GPQA": 0.2995, + "MUSR": 0.4224, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v11-8B", + "name": "Kosmos-EVAA-v11-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4426, + "BBH": 0.5359, + "MATH Level 5": 0.1322, + "GPQA": 0.3154, + "MUSR": 0.4184, + "MMLU-PRO": 0.3836 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v12-8B", + "name": "Kosmos-EVAA-v12-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4378, + "BBH": 0.5349, + "MATH Level 5": 0.1367, + "GPQA": 0.3096, + "MUSR": 0.4211, + "MMLU-PRO": 0.3836 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v2-8B", + "name": "Kosmos-EVAA-v2-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4396, + "BBH": 0.5341, + "MATH Level 5": 0.1322, + "GPQA": 0.2978, + "MUSR": 0.4211, + "MMLU-PRO": 0.3826 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v3-8B", + "name": "Kosmos-EVAA-v3-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4411, + "BBH": 0.5331, + "MATH Level 5": 0.1329, + "GPQA": 0.3054, + "MUSR": 0.4224, + "MMLU-PRO": 0.3821 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v4-8B", + "name": "Kosmos-EVAA-v4-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4289, + "BBH": 0.5337, + "MATH Level 5": 0.1254, + "GPQA": 0.3003, + "MUSR": 0.4197, + "MMLU-PRO": 0.3817 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v5-8B", + "name": "Kosmos-EVAA-v5-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.446, + "BBH": 0.5345, + "MATH Level 5": 0.1261, + "GPQA": 0.3037, + "MUSR": 0.4224, + "MMLU-PRO": 0.3821 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v6-8B", + "name": "Kosmos-EVAA-v6-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4396, + "BBH": 0.538, + "MATH Level 5": 0.1292, + "GPQA": 0.302, + "MUSR": 0.4184, + "MMLU-PRO": 0.3821 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v7-8B", + "name": "Kosmos-EVAA-v7-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4277, + "BBH": 0.5335, + "MATH Level 5": 0.1337, + "GPQA": 0.3054, + "MUSR": 0.4171, + "MMLU-PRO": 0.3836 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v8-8B", + "name": "Kosmos-EVAA-v8-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4383, + "BBH": 0.5359, + "MATH Level 5": 0.1307, + "GPQA": 0.3037, + "MUSR": 0.421, + "MMLU-PRO": 0.3827 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v9-8B", + "name": "Kosmos-EVAA-v9-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4369, + "BBH": 0.5361, + "MATH Level 5": 0.1276, + "GPQA": 0.3062, + "MUSR": 0.4184, + "MMLU-PRO": 0.382 + } + }, + { + "model_id": "jaspionjader/Kosmos-EVAA-v9-TitanFusion-Mix-8B", + "name": "Kosmos-EVAA-v9-TitanFusion-Mix-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4284, + "BBH": 0.554, + "MATH Level 5": 0.1148, + "GPQA": 0.2878, + "MUSR": 0.4354, + "MMLU-PRO": 0.3836 + } + }, + { + "model_id": "jaspionjader/Kosmos-Elusive-8b", + "name": "Kosmos-Elusive-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4169, + "BBH": 0.5339, + "MATH Level 5": 0.1261, + "GPQA": 0.3079, + "MUSR": 0.4078, + "MMLU-PRO": 0.376 + } + }, + { + "model_id": "jaspionjader/Kosmos-Elusive-VENN-8B", + "name": "Kosmos-Elusive-VENN-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4233, + "BBH": 0.5356, + "MATH Level 5": 0.1246, + "GPQA": 0.2995, + "MUSR": 0.4157, + "MMLU-PRO": 0.3797 + } + }, + { + "model_id": "jaspionjader/Kosmos-Elusive-VENN-Asymmetric-8B", + "name": "Kosmos-Elusive-VENN-Asymmetric-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4542, + "BBH": 0.5313, + "MATH Level 5": 0.1344, + "GPQA": 0.2945, + "MUSR": 0.4251, + "MMLU-PRO": 0.3842 + } + }, + { + "model_id": "jaspionjader/Kosmos-Elusive-VENN-Aurora_faustus-8B", + "name": "Kosmos-Elusive-VENN-Aurora_faustus-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4335, + "BBH": 0.5304, + "MATH Level 5": 0.1125, + "GPQA": 0.2953, + "MUSR": 0.417, + "MMLU-PRO": 0.3795 + } + }, + { + "model_id": "jaspionjader/Kosmos-VENN-8B", + "name": "Kosmos-VENN-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4332, + "BBH": 0.5318, + "MATH Level 5": 0.1412, + "GPQA": 0.2928, + "MUSR": 0.4211, + "MMLU-PRO": 0.3801 + } + }, + { + "model_id": "jaspionjader/PRP-Kosmos-EVAA-8B", + "name": "PRP-Kosmos-EVAA-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.3633, + "BBH": 0.5237, + "MATH Level 5": 0.0959, + "GPQA": 0.3096, + "MUSR": 0.425, + "MMLU-PRO": 0.3766 + } + }, + { + "model_id": "jaspionjader/PRP-Kosmos-EVAA-light-8B", + "name": "PRP-Kosmos-EVAA-light-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4321, + "BBH": 0.5275, + "MATH Level 5": 0.1103, + "GPQA": 0.3221, + "MUSR": 0.4235, + "MMLU-PRO": 0.3631 + } + }, + { + "model_id": "jaspionjader/TSN-Kosmos-EVAA-8B", + "name": "TSN-Kosmos-EVAA-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4903, + "BBH": 0.5347, + "MATH Level 5": 0.145, + "GPQA": 0.3205, + "MUSR": 0.4173, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "jaspionjader/TSN-Kosmos-EVAA-v2-8B", + "name": "TSN-Kosmos-EVAA-v2-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4667, + "BBH": 0.5343, + "MATH Level 5": 0.108, + "GPQA": 0.3221, + "MUSR": 0.4186, + "MMLU-PRO": 0.3762 + } + }, + { + "model_id": "jaspionjader/bbb-1", + "name": "bbb-1", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4864, + "BBH": 0.5376, + "MATH Level 5": 0.1367, + "GPQA": 0.3138, + "MUSR": 0.4171, + "MMLU-PRO": 0.3897 + } + }, + { + "model_id": "jaspionjader/bbb-2", + "name": "bbb-2", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4077, + "BBH": 0.5067, + "MATH Level 5": 0.1125, + "GPQA": 0.302, + "MUSR": 0.4145, + "MMLU-PRO": 0.3635 + } + }, + { + "model_id": "jaspionjader/bbb-3", + "name": "bbb-3", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4168, + "BBH": 0.5158, + "MATH Level 5": 0.1405, + "GPQA": 0.3112, + "MUSR": 0.4265, + "MMLU-PRO": 0.3856 + } + }, + { + "model_id": "jaspionjader/bbb-4", + "name": "bbb-4", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4768, + "BBH": 0.5212, + "MATH Level 5": 0.1276, + "GPQA": 0.2978, + "MUSR": 0.4092, + "MMLU-PRO": 0.3773 + } + }, + { + "model_id": "jaspionjader/bbb-5", + "name": "bbb-5", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4703, + "BBH": 0.5207, + "MATH Level 5": 0.1397, + "GPQA": 0.3045, + "MUSR": 0.3998, + "MMLU-PRO": 0.3834 + } + }, + { + "model_id": "jaspionjader/bbb-6", + "name": "bbb-6", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.488, + "BBH": 0.5211, + "MATH Level 5": 0.139, + "GPQA": 0.3104, + "MUSR": 0.4052, + "MMLU-PRO": 0.3871 + } + }, + { + "model_id": "jaspionjader/bbb-7", + "name": "bbb-7", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4828, + "BBH": 0.5211, + "MATH Level 5": 0.1367, + "GPQA": 0.3104, + "MUSR": 0.4038, + "MMLU-PRO": 0.386 + } + }, + { + "model_id": "jaspionjader/bh-1", + "name": "bh-1", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4284, + "BBH": 0.589, + "MATH Level 5": 0.0536, + "GPQA": 0.2945, + "MUSR": 0.4441, + "MMLU-PRO": 0.3449 + } + }, + { + "model_id": "jaspionjader/bh-10", + "name": "bh-10", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4618, + "BBH": 0.5856, + "MATH Level 5": 0.1103, + "GPQA": 0.3003, + "MUSR": 0.4199, + "MMLU-PRO": 0.3708 + } + }, + { + "model_id": "jaspionjader/bh-11", + "name": "bh-11", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4575, + "BBH": 0.5851, + "MATH Level 5": 0.1178, + "GPQA": 0.307, + "MUSR": 0.4146, + "MMLU-PRO": 0.3738 + } + }, + { + "model_id": "jaspionjader/bh-12", + "name": "bh-12", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4734, + "BBH": 0.5802, + "MATH Level 5": 0.1186, + "GPQA": 0.3003, + "MUSR": 0.4145, + "MMLU-PRO": 0.3737 + } + }, + { + "model_id": "jaspionjader/bh-13", + "name": "bh-13", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4698, + "BBH": 0.5778, + "MATH Level 5": 0.1125, + "GPQA": 0.307, + "MUSR": 0.4159, + "MMLU-PRO": 0.373 + } + }, + { + "model_id": "jaspionjader/bh-15", + "name": "bh-15", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4745, + "BBH": 0.5819, + "MATH Level 5": 0.1246, + "GPQA": 0.2987, + "MUSR": 0.4105, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "jaspionjader/bh-16", + "name": "bh-16", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4731, + "BBH": 0.5783, + "MATH Level 5": 0.1193, + "GPQA": 0.3029, + "MUSR": 0.4159, + "MMLU-PRO": 0.3776 + } + }, + { + "model_id": "jaspionjader/bh-17", + "name": "bh-17", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4722, + "BBH": 0.5776, + "MATH Level 5": 0.1133, + "GPQA": 0.2978, + "MUSR": 0.4158, + "MMLU-PRO": 0.3757 + } + }, + { + "model_id": "jaspionjader/bh-18", + "name": "bh-18", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4725, + "BBH": 0.5824, + "MATH Level 5": 0.1186, + "GPQA": 0.3003, + "MUSR": 0.4185, + "MMLU-PRO": 0.3757 + } + }, + { + "model_id": "jaspionjader/bh-19", + "name": "bh-19", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4584, + "BBH": 0.5766, + "MATH Level 5": 0.1193, + "GPQA": 0.297, + "MUSR": 0.4171, + "MMLU-PRO": 0.3775 + } + }, + { + "model_id": "jaspionjader/bh-2", + "name": "bh-2", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4579, + "BBH": 0.5937, + "MATH Level 5": 0.1027, + "GPQA": 0.3012, + "MUSR": 0.4186, + "MMLU-PRO": 0.3695 + } + }, + { + "model_id": "jaspionjader/bh-20", + "name": "bh-20", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4727, + "BBH": 0.575, + "MATH Level 5": 0.1201, + "GPQA": 0.2878, + "MUSR": 0.4105, + "MMLU-PRO": 0.3768 + } + }, + { + "model_id": "jaspionjader/bh-21", + "name": "bh-21", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.47, + "BBH": 0.5738, + "MATH Level 5": 0.1216, + "GPQA": 0.2978, + "MUSR": 0.4158, + "MMLU-PRO": 0.3776 + } + }, + { + "model_id": "jaspionjader/bh-22", + "name": "bh-22", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.46, + "BBH": 0.5793, + "MATH Level 5": 0.1186, + "GPQA": 0.2961, + "MUSR": 0.4172, + "MMLU-PRO": 0.3764 + } + }, + { + "model_id": "jaspionjader/bh-23", + "name": "bh-23", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4658, + "BBH": 0.57, + "MATH Level 5": 0.1201, + "GPQA": 0.2945, + "MUSR": 0.4197, + "MMLU-PRO": 0.3796 + } + }, + { + "model_id": "jaspionjader/bh-24", + "name": "bh-24", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4715, + "BBH": 0.5717, + "MATH Level 5": 0.1269, + "GPQA": 0.2961, + "MUSR": 0.4158, + "MMLU-PRO": 0.3809 + } + }, + { + "model_id": "jaspionjader/bh-25", + "name": "bh-25", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4752, + "BBH": 0.5706, + "MATH Level 5": 0.1133, + "GPQA": 0.2911, + "MUSR": 0.4118, + "MMLU-PRO": 0.3782 + } + }, + { + "model_id": "jaspionjader/bh-26", + "name": "bh-26", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4691, + "BBH": 0.5735, + "MATH Level 5": 0.1163, + "GPQA": 0.2995, + "MUSR": 0.4277, + "MMLU-PRO": 0.3772 + } + }, + { + "model_id": "jaspionjader/bh-27", + "name": "bh-27", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4819, + "BBH": 0.5714, + "MATH Level 5": 0.1276, + "GPQA": 0.2961, + "MUSR": 0.4091, + "MMLU-PRO": 0.3799 + } + }, + { + "model_id": "jaspionjader/bh-28", + "name": "bh-28", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4785, + "BBH": 0.5703, + "MATH Level 5": 0.1231, + "GPQA": 0.2987, + "MUSR": 0.4131, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "jaspionjader/bh-29", + "name": "bh-29", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4688, + "BBH": 0.567, + "MATH Level 5": 0.1208, + "GPQA": 0.2953, + "MUSR": 0.4237, + "MMLU-PRO": 0.3819 + } + }, + { + "model_id": "jaspionjader/bh-3", + "name": "bh-3", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4664, + "BBH": 0.5891, + "MATH Level 5": 0.1148, + "GPQA": 0.302, + "MUSR": 0.4173, + "MMLU-PRO": 0.3702 + } + }, + { + "model_id": "jaspionjader/bh-30", + "name": "bh-30", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4666, + "BBH": 0.5706, + "MATH Level 5": 0.1231, + "GPQA": 0.2928, + "MUSR": 0.4144, + "MMLU-PRO": 0.3782 + } + }, + { + "model_id": "jaspionjader/bh-31", + "name": "bh-31", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4727, + "BBH": 0.5665, + "MATH Level 5": 0.1284, + "GPQA": 0.2936, + "MUSR": 0.4104, + "MMLU-PRO": 0.382 + } + }, + { + "model_id": "jaspionjader/bh-32", + "name": "bh-32", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4636, + "BBH": 0.5662, + "MATH Level 5": 0.1246, + "GPQA": 0.297, + "MUSR": 0.4157, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "jaspionjader/bh-33", + "name": "bh-33", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4685, + "BBH": 0.5653, + "MATH Level 5": 0.1178, + "GPQA": 0.2961, + "MUSR": 0.4157, + "MMLU-PRO": 0.3808 + } + }, + { + "model_id": "jaspionjader/bh-34", + "name": "bh-34", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4624, + "BBH": 0.5681, + "MATH Level 5": 0.1208, + "GPQA": 0.2919, + "MUSR": 0.4185, + "MMLU-PRO": 0.3804 + } + }, + { + "model_id": "jaspionjader/bh-35", + "name": "bh-35", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4721, + "BBH": 0.564, + "MATH Level 5": 0.1246, + "GPQA": 0.2953, + "MUSR": 0.4183, + "MMLU-PRO": 0.383 + } + }, + { + "model_id": "jaspionjader/bh-36", + "name": "bh-36", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4666, + "BBH": 0.5664, + "MATH Level 5": 0.1239, + "GPQA": 0.302, + "MUSR": 0.4196, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "jaspionjader/bh-37", + "name": "bh-37", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.488, + "BBH": 0.5625, + "MATH Level 5": 0.1216, + "GPQA": 0.2945, + "MUSR": 0.4156, + "MMLU-PRO": 0.3828 + } + }, + { + "model_id": "jaspionjader/bh-38", + "name": "bh-38", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4618, + "BBH": 0.5658, + "MATH Level 5": 0.1239, + "GPQA": 0.2978, + "MUSR": 0.4117, + "MMLU-PRO": 0.3811 + } + }, + { + "model_id": "jaspionjader/bh-39", + "name": "bh-39", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4576, + "BBH": 0.5633, + "MATH Level 5": 0.1254, + "GPQA": 0.3003, + "MUSR": 0.4262, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "jaspionjader/bh-4", + "name": "bh-4", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4673, + "BBH": 0.5892, + "MATH Level 5": 0.1095, + "GPQA": 0.2961, + "MUSR": 0.4173, + "MMLU-PRO": 0.3705 + } + }, + { + "model_id": "jaspionjader/bh-40", + "name": "bh-40", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4536, + "BBH": 0.5634, + "MATH Level 5": 0.1246, + "GPQA": 0.2987, + "MUSR": 0.4236, + "MMLU-PRO": 0.3835 + } + }, + { + "model_id": "jaspionjader/bh-41", + "name": "bh-41", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.474, + "BBH": 0.5614, + "MATH Level 5": 0.1254, + "GPQA": 0.2928, + "MUSR": 0.4183, + "MMLU-PRO": 0.3825 + } + }, + { + "model_id": "jaspionjader/bh-42", + "name": "bh-42", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.466, + "BBH": 0.5646, + "MATH Level 5": 0.1269, + "GPQA": 0.2961, + "MUSR": 0.421, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "jaspionjader/bh-43", + "name": "bh-43", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.46, + "BBH": 0.5635, + "MATH Level 5": 0.1239, + "GPQA": 0.2945, + "MUSR": 0.4156, + "MMLU-PRO": 0.382 + } + }, + { + "model_id": "jaspionjader/bh-44", + "name": "bh-44", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4706, + "BBH": 0.5643, + "MATH Level 5": 0.1216, + "GPQA": 0.2961, + "MUSR": 0.4249, + "MMLU-PRO": 0.3834 + } + }, + { + "model_id": "jaspionjader/bh-46", + "name": "bh-46", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4727, + "BBH": 0.5632, + "MATH Level 5": 0.1276, + "GPQA": 0.2961, + "MUSR": 0.4262, + "MMLU-PRO": 0.3822 + } + }, + { + "model_id": "jaspionjader/bh-47", + "name": "bh-47", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4652, + "BBH": 0.5546, + "MATH Level 5": 0.1276, + "GPQA": 0.2945, + "MUSR": 0.4156, + "MMLU-PRO": 0.3855 + } + }, + { + "model_id": "jaspionjader/bh-48", + "name": "bh-48", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4688, + "BBH": 0.5541, + "MATH Level 5": 0.1254, + "GPQA": 0.2945, + "MUSR": 0.4209, + "MMLU-PRO": 0.386 + } + }, + { + "model_id": "jaspionjader/bh-49", + "name": "bh-49", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4725, + "BBH": 0.554, + "MATH Level 5": 0.1201, + "GPQA": 0.2945, + "MUSR": 0.4129, + "MMLU-PRO": 0.3808 + } + }, + { + "model_id": "jaspionjader/bh-5", + "name": "bh-5", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4652, + "BBH": 0.5882, + "MATH Level 5": 0.1057, + "GPQA": 0.2995, + "MUSR": 0.4186, + "MMLU-PRO": 0.3702 + } + }, + { + "model_id": "jaspionjader/bh-50", + "name": "bh-50", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4725, + "BBH": 0.5553, + "MATH Level 5": 0.1208, + "GPQA": 0.2936, + "MUSR": 0.4169, + "MMLU-PRO": 0.3842 + } + }, + { + "model_id": "jaspionjader/bh-51", + "name": "bh-51", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.463, + "BBH": 0.5557, + "MATH Level 5": 0.1239, + "GPQA": 0.2928, + "MUSR": 0.4168, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "jaspionjader/bh-52", + "name": "bh-52", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4536, + "BBH": 0.5444, + "MATH Level 5": 0.1201, + "GPQA": 0.2919, + "MUSR": 0.4169, + "MMLU-PRO": 0.3843 + } + }, + { + "model_id": "jaspionjader/bh-53", + "name": "bh-53", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.478, + "BBH": 0.5494, + "MATH Level 5": 0.1269, + "GPQA": 0.2987, + "MUSR": 0.4196, + "MMLU-PRO": 0.3858 + } + }, + { + "model_id": "jaspionjader/bh-54", + "name": "bh-54", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4841, + "BBH": 0.5548, + "MATH Level 5": 0.1292, + "GPQA": 0.2945, + "MUSR": 0.4155, + "MMLU-PRO": 0.3825 + } + }, + { + "model_id": "jaspionjader/bh-55", + "name": "bh-55", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4709, + "BBH": 0.555, + "MATH Level 5": 0.1284, + "GPQA": 0.3062, + "MUSR": 0.4222, + "MMLU-PRO": 0.3846 + } + }, + { + "model_id": "jaspionjader/bh-56", + "name": "bh-56", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.46, + "BBH": 0.5447, + "MATH Level 5": 0.1231, + "GPQA": 0.3003, + "MUSR": 0.4116, + "MMLU-PRO": 0.3844 + } + }, + { + "model_id": "jaspionjader/bh-57", + "name": "bh-57", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4405, + "BBH": 0.5425, + "MATH Level 5": 0.1261, + "GPQA": 0.3037, + "MUSR": 0.421, + "MMLU-PRO": 0.3896 + } + }, + { + "model_id": "jaspionjader/bh-58", + "name": "bh-58", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.463, + "BBH": 0.5446, + "MATH Level 5": 0.1322, + "GPQA": 0.3062, + "MUSR": 0.4183, + "MMLU-PRO": 0.3896 + } + }, + { + "model_id": "jaspionjader/bh-59", + "name": "bh-59", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4341, + "BBH": 0.5512, + "MATH Level 5": 0.1541, + "GPQA": 0.3154, + "MUSR": 0.417, + "MMLU-PRO": 0.3838 + } + }, + { + "model_id": "jaspionjader/bh-6", + "name": "bh-6", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4621, + "BBH": 0.5891, + "MATH Level 5": 0.1088, + "GPQA": 0.2995, + "MUSR": 0.4199, + "MMLU-PRO": 0.3698 + } + }, + { + "model_id": "jaspionjader/bh-60", + "name": "bh-60", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4207, + "BBH": 0.5369, + "MATH Level 5": 0.1579, + "GPQA": 0.3255, + "MUSR": 0.4289, + "MMLU-PRO": 0.3689 + } + }, + { + "model_id": "jaspionjader/bh-61", + "name": "bh-61", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4247, + "BBH": 0.5271, + "MATH Level 5": 0.1707, + "GPQA": 0.3188, + "MUSR": 0.4356, + "MMLU-PRO": 0.3679 + } + }, + { + "model_id": "jaspionjader/bh-62", + "name": "bh-62", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.415, + "BBH": 0.5379, + "MATH Level 5": 0.1624, + "GPQA": 0.3205, + "MUSR": 0.4289, + "MMLU-PRO": 0.3719 + } + }, + { + "model_id": "jaspionjader/bh-63", + "name": "bh-63", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4308, + "BBH": 0.4917, + "MATH Level 5": 0.111, + "GPQA": 0.3029, + "MUSR": 0.4313, + "MMLU-PRO": 0.3248 + } + }, + { + "model_id": "jaspionjader/bh-64", + "name": "bh-64", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.414, + "BBH": 0.536, + "MATH Level 5": 0.1548, + "GPQA": 0.3213, + "MUSR": 0.4355, + "MMLU-PRO": 0.3693 + } + }, + { + "model_id": "jaspionjader/bh-7", + "name": "bh-7", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4624, + "BBH": 0.5861, + "MATH Level 5": 0.114, + "GPQA": 0.3037, + "MUSR": 0.4119, + "MMLU-PRO": 0.3715 + } + }, + { + "model_id": "jaspionjader/bh-8", + "name": "bh-8", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4597, + "BBH": 0.59, + "MATH Level 5": 0.1178, + "GPQA": 0.3012, + "MUSR": 0.4265, + "MMLU-PRO": 0.372 + } + }, + { + "model_id": "jaspionjader/bh-9", + "name": "bh-9", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4509, + "BBH": 0.585, + "MATH Level 5": 0.1156, + "GPQA": 0.302, + "MUSR": 0.4146, + "MMLU-PRO": 0.3703 + } + }, + { + "model_id": "jaspionjader/dp-6-8b", + "name": "dp-6-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4806, + "BBH": 0.53, + "MATH Level 5": 0.1329, + "GPQA": 0.3079, + "MUSR": 0.4434, + "MMLU-PRO": 0.3897 + } + }, + { + "model_id": "jaspionjader/dp-7-8b", + "name": "dp-7-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4498, + "BBH": 0.5291, + "MATH Level 5": 0.1261, + "GPQA": 0.3062, + "MUSR": 0.4407, + "MMLU-PRO": 0.3934 + } + }, + { + "model_id": "jaspionjader/ek-6", + "name": "ek-6", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4642, + "BBH": 0.5219, + "MATH Level 5": 0.1322, + "GPQA": 0.3087, + "MUSR": 0.4144, + "MMLU-PRO": 0.3861 + } + }, + { + "model_id": "jaspionjader/ek-7", + "name": "ek-7", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4767, + "BBH": 0.5194, + "MATH Level 5": 0.1329, + "GPQA": 0.3163, + "MUSR": 0.4171, + "MMLU-PRO": 0.3887 + } + }, + { + "model_id": "jaspionjader/f-1-8b", + "name": "f-1-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4983, + "BBH": 0.5141, + "MATH Level 5": 0.1284, + "GPQA": 0.3087, + "MUSR": 0.4527, + "MMLU-PRO": 0.3907 + } + }, + { + "model_id": "jaspionjader/f-2-8b", + "name": "f-2-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4824, + "BBH": 0.5294, + "MATH Level 5": 0.1171, + "GPQA": 0.2995, + "MUSR": 0.4501, + "MMLU-PRO": 0.3962 + } + }, + { + "model_id": "jaspionjader/f-3-8b", + "name": "f-3-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4803, + "BBH": 0.5275, + "MATH Level 5": 0.1216, + "GPQA": 0.3138, + "MUSR": 0.4421, + "MMLU-PRO": 0.3954 + } + }, + { + "model_id": "jaspionjader/f-4-8b", + "name": "f-4-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4797, + "BBH": 0.5289, + "MATH Level 5": 0.1148, + "GPQA": 0.3087, + "MUSR": 0.4514, + "MMLU-PRO": 0.3956 + } + }, + { + "model_id": "jaspionjader/f-5-8b", + "name": "f-5-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.5044, + "BBH": 0.5313, + "MATH Level 5": 0.1239, + "GPQA": 0.3087, + "MUSR": 0.4461, + "MMLU-PRO": 0.3949 + } + }, + { + "model_id": "jaspionjader/f-6-8b", + "name": "f-6-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4846, + "BBH": 0.5241, + "MATH Level 5": 0.1193, + "GPQA": 0.3079, + "MUSR": 0.4474, + "MMLU-PRO": 0.3939 + } + }, + { + "model_id": "jaspionjader/f-7-8b", + "name": "f-7-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4462, + "BBH": 0.5277, + "MATH Level 5": 0.1239, + "GPQA": 0.3129, + "MUSR": 0.4315, + "MMLU-PRO": 0.3936 + } + }, + { + "model_id": "jaspionjader/f-8-8b", + "name": "f-8-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4739, + "BBH": 0.5259, + "MATH Level 5": 0.1224, + "GPQA": 0.3096, + "MUSR": 0.4354, + "MMLU-PRO": 0.394 + } + }, + { + "model_id": "jaspionjader/f-9-8b", + "name": "f-9-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4602, + "BBH": 0.5292, + "MATH Level 5": 0.1299, + "GPQA": 0.3062, + "MUSR": 0.4461, + "MMLU-PRO": 0.3944 + } + }, + { + "model_id": "jaspionjader/fct-14-8b", + "name": "fct-14-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4129, + "BBH": 0.5206, + "MATH Level 5": 0.1201, + "GPQA": 0.3163, + "MUSR": 0.4186, + "MMLU-PRO": 0.3875 + } + }, + { + "model_id": "jaspionjader/fct-9-8b", + "name": "fct-9-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4354, + "BBH": 0.5205, + "MATH Level 5": 0.1193, + "GPQA": 0.3079, + "MUSR": 0.4291, + "MMLU-PRO": 0.3932 + } + }, + { + "model_id": "jaspionjader/fr-1-8b", + "name": "fr-1-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4211, + "BBH": 0.5142, + "MATH Level 5": 0.1118, + "GPQA": 0.3054, + "MUSR": 0.4277, + "MMLU-PRO": 0.361 + } + }, + { + "model_id": "jaspionjader/fr-10-8b", + "name": "fr-10-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4402, + "BBH": 0.5207, + "MATH Level 5": 0.1224, + "GPQA": 0.3171, + "MUSR": 0.4119, + "MMLU-PRO": 0.3863 + } + }, + { + "model_id": "jaspionjader/fr-3-8b", + "name": "fr-3-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4326, + "BBH": 0.5255, + "MATH Level 5": 0.1133, + "GPQA": 0.3054, + "MUSR": 0.4198, + "MMLU-PRO": 0.3863 + } + }, + { + "model_id": "jaspionjader/gamma-Kosmos-EVAA-8B", + "name": "gamma-Kosmos-EVAA-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.425, + "BBH": 0.5253, + "MATH Level 5": 0.0899, + "GPQA": 0.3138, + "MUSR": 0.4412, + "MMLU-PRO": 0.3776 + } + }, + { + "model_id": "jaspionjader/gamma-Kosmos-EVAA-v2-8B", + "name": "gamma-Kosmos-EVAA-v2-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4233, + "BBH": 0.5262, + "MATH Level 5": 0.1057, + "GPQA": 0.3205, + "MUSR": 0.4344, + "MMLU-PRO": 0.3756 + } + }, + { + "model_id": "jaspionjader/gamma-Kosmos-EVAA-v3-8B", + "name": "gamma-Kosmos-EVAA-v3-8B", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4333, + "BBH": 0.5278, + "MATH Level 5": 0.111, + "GPQA": 0.3129, + "MUSR": 0.4263, + "MMLU-PRO": 0.3898 + } + }, + { + "model_id": "jaspionjader/knf-2-8b", + "name": "knf-2-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.425, + "BBH": 0.5207, + "MATH Level 5": 0.1201, + "GPQA": 0.3104, + "MUSR": 0.4185, + "MMLU-PRO": 0.3875 + } + }, + { + "model_id": "jaspionjader/knfp-2-8b", + "name": "knfp-2-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.5327, + "BBH": 0.5305, + "MATH Level 5": 0.1427, + "GPQA": 0.2928, + "MUSR": 0.4185, + "MMLU-PRO": 0.3726 + } + }, + { + "model_id": "jaspionjader/knfp-3-8b", + "name": "knfp-3-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4946, + "BBH": 0.52, + "MATH Level 5": 0.1224, + "GPQA": 0.307, + "MUSR": 0.4171, + "MMLU-PRO": 0.3881 + } + }, + { + "model_id": "jaspionjader/kstc-1-8b", + "name": "kstc-1-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4643, + "BBH": 0.5209, + "MATH Level 5": 0.1171, + "GPQA": 0.3171, + "MUSR": 0.4158, + "MMLU-PRO": 0.3892 + } + }, + { + "model_id": "jaspionjader/kstc-11-8b", + "name": "kstc-11-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4757, + "BBH": 0.5189, + "MATH Level 5": 0.1201, + "GPQA": 0.3029, + "MUSR": 0.4118, + "MMLU-PRO": 0.3879 + } + }, + { + "model_id": "jaspionjader/kstc-4-8b", + "name": "kstc-4-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.477, + "BBH": 0.5216, + "MATH Level 5": 0.1239, + "GPQA": 0.3037, + "MUSR": 0.4118, + "MMLU-PRO": 0.3869 + } + }, + { + "model_id": "jaspionjader/kstc-5-8b", + "name": "kstc-5-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4721, + "BBH": 0.5211, + "MATH Level 5": 0.1299, + "GPQA": 0.3154, + "MUSR": 0.4224, + "MMLU-PRO": 0.3892 + } + }, + { + "model_id": "jaspionjader/kstc-6-8b", + "name": "kstc-6-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4944, + "BBH": 0.5231, + "MATH Level 5": 0.1246, + "GPQA": 0.2995, + "MUSR": 0.4105, + "MMLU-PRO": 0.3857 + } + }, + { + "model_id": "jaspionjader/kstc-8-8b", + "name": "kstc-8-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.491, + "BBH": 0.5239, + "MATH Level 5": 0.1307, + "GPQA": 0.3054, + "MUSR": 0.4211, + "MMLU-PRO": 0.3889 + } + }, + { + "model_id": "jaspionjader/kstc-9-8b", + "name": "kstc-9-8b", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4861, + "BBH": 0.5238, + "MATH Level 5": 0.136, + "GPQA": 0.3012, + "MUSR": 0.4118, + "MMLU-PRO": 0.3872 + } + }, + { + "model_id": "jaspionjader/slu-10", + "name": "slu-10", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.436, + "BBH": 0.5096, + "MATH Level 5": 0.0974, + "GPQA": 0.3138, + "MUSR": 0.392, + "MMLU-PRO": 0.3664 + } + }, + { + "model_id": "jaspionjader/slu-11", + "name": "slu-11", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.3725, + "BBH": 0.489, + "MATH Level 5": 0.0559, + "GPQA": 0.3037, + "MUSR": 0.3919, + "MMLU-PRO": 0.3382 + } + }, + { + "model_id": "jaspionjader/slu-13", + "name": "slu-13", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4378, + "BBH": 0.5097, + "MATH Level 5": 0.0808, + "GPQA": 0.3079, + "MUSR": 0.3814, + "MMLU-PRO": 0.358 + } + }, + { + "model_id": "jaspionjader/slu-14", + "name": "slu-14", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4107, + "BBH": 0.5089, + "MATH Level 5": 0.0974, + "GPQA": 0.3079, + "MUSR": 0.396, + "MMLU-PRO": 0.3627 + } + }, + { + "model_id": "jaspionjader/slu-17", + "name": "slu-17", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4217, + "BBH": 0.5071, + "MATH Level 5": 0.0853, + "GPQA": 0.3087, + "MUSR": 0.3761, + "MMLU-PRO": 0.3619 + } + }, + { + "model_id": "jaspionjader/slu-2", + "name": "slu-2", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4016, + "BBH": 0.5008, + "MATH Level 5": 0.0634, + "GPQA": 0.2987, + "MUSR": 0.3959, + "MMLU-PRO": 0.3506 + } + }, + { + "model_id": "jaspionjader/slu-20", + "name": "slu-20", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4393, + "BBH": 0.5061, + "MATH Level 5": 0.0869, + "GPQA": 0.3087, + "MUSR": 0.3933, + "MMLU-PRO": 0.3665 + } + }, + { + "model_id": "jaspionjader/slu-22", + "name": "slu-22", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4321, + "BBH": 0.5082, + "MATH Level 5": 0.0793, + "GPQA": 0.3163, + "MUSR": 0.3893, + "MMLU-PRO": 0.365 + } + }, + { + "model_id": "jaspionjader/slu-23", + "name": "slu-23", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4478, + "BBH": 0.5132, + "MATH Level 5": 0.0944, + "GPQA": 0.3045, + "MUSR": 0.4092, + "MMLU-PRO": 0.3725 + } + }, + { + "model_id": "jaspionjader/slu-25", + "name": "slu-25", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.45, + "BBH": 0.5095, + "MATH Level 5": 0.0838, + "GPQA": 0.3087, + "MUSR": 0.3946, + "MMLU-PRO": 0.3684 + } + }, + { + "model_id": "jaspionjader/slu-29", + "name": "slu-29", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4431, + "BBH": 0.5096, + "MATH Level 5": 0.0869, + "GPQA": 0.307, + "MUSR": 0.3933, + "MMLU-PRO": 0.3669 + } + }, + { + "model_id": "jaspionjader/slu-32", + "name": "slu-32", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4516, + "BBH": 0.5167, + "MATH Level 5": 0.1073, + "GPQA": 0.302, + "MUSR": 0.4039, + "MMLU-PRO": 0.3766 + } + }, + { + "model_id": "jaspionjader/slu-33", + "name": "slu-33", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4457, + "BBH": 0.5081, + "MATH Level 5": 0.0997, + "GPQA": 0.3121, + "MUSR": 0.3867, + "MMLU-PRO": 0.3679 + } + }, + { + "model_id": "jaspionjader/slu-34", + "name": "slu-34", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4351, + "BBH": 0.5077, + "MATH Level 5": 0.0997, + "GPQA": 0.3079, + "MUSR": 0.388, + "MMLU-PRO": 0.372 + } + }, + { + "model_id": "jaspionjader/slu-35", + "name": "slu-35", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4242, + "BBH": 0.5103, + "MATH Level 5": 0.1012, + "GPQA": 0.3121, + "MUSR": 0.3946, + "MMLU-PRO": 0.3676 + } + }, + { + "model_id": "jaspionjader/slu-36", + "name": "slu-36", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4518, + "BBH": 0.5087, + "MATH Level 5": 0.0906, + "GPQA": 0.3121, + "MUSR": 0.3933, + "MMLU-PRO": 0.3711 + } + }, + { + "model_id": "jaspionjader/slu-37", + "name": "slu-37", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4534, + "BBH": 0.51, + "MATH Level 5": 0.0974, + "GPQA": 0.307, + "MUSR": 0.3946, + "MMLU-PRO": 0.3695 + } + }, + { + "model_id": "jaspionjader/slu-6", + "name": "slu-6", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4117, + "BBH": 0.5099, + "MATH Level 5": 0.0944, + "GPQA": 0.3029, + "MUSR": 0.4066, + "MMLU-PRO": 0.3611 + } + }, + { + "model_id": "jaspionjader/slu-mix-1", + "name": "slu-mix-1", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4569, + "BBH": 0.524, + "MATH Level 5": 0.1118, + "GPQA": 0.3003, + "MUSR": 0.4277, + "MMLU-PRO": 0.393 + } + }, + { + "model_id": "jaspionjader/sof-1", + "name": "sof-1", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4314, + "BBH": 0.501, + "MATH Level 5": 0.114, + "GPQA": 0.3029, + "MUSR": 0.4082, + "MMLU-PRO": 0.3674 + } + }, + { + "model_id": "jaspionjader/sof-10", + "name": "sof-10", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4648, + "BBH": 0.5197, + "MATH Level 5": 0.1239, + "GPQA": 0.3062, + "MUSR": 0.4091, + "MMLU-PRO": 0.3874 + } + }, + { + "model_id": "jaspionjader/sof-3", + "name": "sof-3", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4637, + "BBH": 0.5206, + "MATH Level 5": 0.1276, + "GPQA": 0.297, + "MUSR": 0.4131, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "jaspionjader/sof-6", + "name": "sof-6", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4354, + "BBH": 0.5209, + "MATH Level 5": 0.1299, + "GPQA": 0.2995, + "MUSR": 0.4171, + "MMLU-PRO": 0.3844 + } + }, + { + "model_id": "jaspionjader/test-10", + "name": "test-10", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4578, + "BBH": 0.5316, + "MATH Level 5": 0.114, + "GPQA": 0.3196, + "MUSR": 0.4251, + "MMLU-PRO": 0.3936 + } + }, + { + "model_id": "jaspionjader/test-11", + "name": "test-11", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4541, + "BBH": 0.535, + "MATH Level 5": 0.1201, + "GPQA": 0.3238, + "MUSR": 0.429, + "MMLU-PRO": 0.3939 + } + }, + { + "model_id": "jaspionjader/test-12", + "name": "test-12", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4368, + "BBH": 0.5347, + "MATH Level 5": 0.108, + "GPQA": 0.3188, + "MUSR": 0.425, + "MMLU-PRO": 0.3935 + } + }, + { + "model_id": "jaspionjader/test-13", + "name": "test-13", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4581, + "BBH": 0.5318, + "MATH Level 5": 0.1057, + "GPQA": 0.3163, + "MUSR": 0.4264, + "MMLU-PRO": 0.3935 + } + }, + { + "model_id": "jaspionjader/test-14", + "name": "test-14", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4444, + "BBH": 0.5323, + "MATH Level 5": 0.1103, + "GPQA": 0.3146, + "MUSR": 0.4317, + "MMLU-PRO": 0.393 + } + }, + { + "model_id": "jaspionjader/test-15", + "name": "test-15", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4365, + "BBH": 0.5328, + "MATH Level 5": 0.1118, + "GPQA": 0.3121, + "MUSR": 0.4264, + "MMLU-PRO": 0.393 + } + }, + { + "model_id": "jaspionjader/test-16", + "name": "test-16", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4599, + "BBH": 0.533, + "MATH Level 5": 0.1095, + "GPQA": 0.3138, + "MUSR": 0.4225, + "MMLU-PRO": 0.393 + } + }, + { + "model_id": "jaspionjader/test-17", + "name": "test-17", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4267, + "BBH": 0.5329, + "MATH Level 5": 0.1103, + "GPQA": 0.3129, + "MUSR": 0.429, + "MMLU-PRO": 0.3929 + } + }, + { + "model_id": "jaspionjader/test-18", + "name": "test-18", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4392, + "BBH": 0.5317, + "MATH Level 5": 0.1148, + "GPQA": 0.3121, + "MUSR": 0.4251, + "MMLU-PRO": 0.393 + } + }, + { + "model_id": "jaspionjader/test-19", + "name": "test-19", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4401, + "BBH": 0.5319, + "MATH Level 5": 0.1095, + "GPQA": 0.3096, + "MUSR": 0.4264, + "MMLU-PRO": 0.3929 + } + }, + { + "model_id": "jaspionjader/test-20", + "name": "test-20", + "developer": "jaspionjader", + "scores": { + "IFEval": 0.4529, + "BBH": 0.5327, + "MATH Level 5": 0.1118, + "GPQA": 0.3138, + "MUSR": 0.4251, + "MMLU-PRO": 0.392 + } + }, + { + "model_id": "jayasuryajsk/Qwen2.5-3B-reasoner", + "name": "Qwen2.5-3B-reasoner", + "developer": "jayasuryajsk", + "scores": { + "IFEval": 0.416, + "BBH": 0.4651, + "MATH Level 5": 0.2085, + "GPQA": 0.302, + "MUSR": 0.4123, + "MMLU-PRO": 0.3482 + } + }, + { + "model_id": "jeanmichela/o-distil-qwen", + "name": "o-distil-qwen", + "developer": "jeanmichela", + "scores": { + "IFEval": 0.4482, + "BBH": 0.59, + "MATH Level 5": 0.565, + "GPQA": 0.3935, + "MUSR": 0.534, + "MMLU-PRO": 0.4658 + } + }, + { + "model_id": "jebcarter/psyonic-cetacean-20B", + "name": "psyonic-cetacean-20B", + "developer": "jebcarter", + "scores": { + "IFEval": 0.2544, + "BBH": 0.4907, + "MATH Level 5": 0.0181, + "GPQA": 0.2735, + "MUSR": 0.4661, + "MMLU-PRO": 0.2886 + } + }, + { + "model_id": "jebish7/Llama-3-Nanda-10B-Chat", + "name": "Llama-3-Nanda-10B-Chat", + "developer": "jebish7", + "scores": { + "IFEval": 0.2953, + "BBH": 0.4959, + "MATH Level 5": 0.0559, + "GPQA": 0.3012, + "MUSR": 0.4356, + "MMLU-PRO": 0.3157 + } + }, + { + "model_id": "jebish7/Llama-3.1-8B-Instruct", + "name": "Llama-3.1-8B-Instruct", + "developer": "jebish7", + "scores": { + "IFEval": 0.5058, + "BBH": 0.5088, + "MATH Level 5": 0.1548, + "GPQA": 0.3213, + "MUSR": 0.3998, + "MMLU-PRO": 0.3777 + } + }, + { + "model_id": "jebish7/Nemotron-4-Mini-Hindi-4B-Base", + "name": "Nemotron-4-Mini-Hindi-4B-Base", + "developer": "jebish7", + "scores": { + "IFEval": 0.2285, + "BBH": 0.3924, + "MATH Level 5": 0.0272, + "GPQA": 0.2836, + "MUSR": 0.4249, + "MMLU-PRO": 0.2503 + } + }, + { + "model_id": "jebish7/Nemotron-4-Mini-Hindi-4B-Instruct", + "name": "Nemotron-4-Mini-Hindi-4B-Instruct", + "developer": "jebish7", + "scores": { + "IFEval": 0.3345, + "BBH": 0.4041, + "MATH Level 5": 0.0287, + "GPQA": 0.3087, + "MUSR": 0.4153, + "MMLU-PRO": 0.2595 + } + }, + { + "model_id": "jebish7/Nemotron-Mini-4B-Instruct", + "name": "Nemotron-Mini-4B-Instruct", + "developer": "jebish7", + "scores": { + "IFEval": 0.3709, + "BBH": 0.4244, + "MATH Level 5": 0.0325, + "GPQA": 0.276, + "MUSR": 0.4727, + "MMLU-PRO": 0.2783 + } + }, + { + "model_id": "jebish7/aya-expanse-8b", + "name": "aya-expanse-8b", + "developer": "jebish7", + "scores": { + "IFEval": 0.3791, + "BBH": 0.4969, + "MATH Level 5": 0.0816, + "GPQA": 0.2836, + "MUSR": 0.3869, + "MMLU-PRO": 0.3103 + } + }, + { + "model_id": "jebish7/gemma-2-2b-it", + "name": "gemma-2-2b-it", + "developer": "jebish7", + "scores": { + "IFEval": 0.1272, + "BBH": 0.4395, + "MATH Level 5": 0.034, + "GPQA": 0.297, + "MUSR": 0.4244, + "MMLU-PRO": 0.2715 + } + }, + { + "model_id": "jebish7/gemma-2-9b-it", + "name": "gemma-2-9b-it", + "developer": "jebish7", + "scores": { + "IFEval": 0.1557, + "BBH": 0.5949, + "MATH Level 5": 0.0846, + "GPQA": 0.3473, + "MUSR": 0.4554, + "MMLU-PRO": 0.4143 + } + }, + { + "model_id": "jebish7/qwen2.5-0.5B-IHA-Hin", + "name": "qwen2.5-0.5B-IHA-Hin", + "developer": "jebish7", + "scores": { + "IFEval": 0.1416, + "BBH": 0.2989, + "MATH Level 5": 0.0, + "GPQA": 0.2525, + "MUSR": 0.3475, + "MMLU-PRO": 0.1094 + } + }, + { + "model_id": "jeffmeloy/Qwen-7B-nerd-uncensored-v1.0", + "name": "Qwen-7B-nerd-uncensored-v1.0", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.6136, + "BBH": 0.5421, + "MATH Level 5": 0.287, + "GPQA": 0.328, + "MUSR": 0.4793, + "MMLU-PRO": 0.4363 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-minperplexity-2", + "name": "Qwen2.5-7B-minperplexity-2", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.5097, + "BBH": 0.5524, + "MATH Level 5": 0.3014, + "GPQA": 0.3112, + "MUSR": 0.4625, + "MMLU-PRO": 0.4346 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v0.9", + "name": "Qwen2.5-7B-nerd-uncensored-v0.9", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.6048, + "BBH": 0.547, + "MATH Level 5": 0.2946, + "GPQA": 0.323, + "MUSR": 0.482, + "MMLU-PRO": 0.4363 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.0", + "name": "Qwen2.5-7B-nerd-uncensored-v1.0", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.7695, + "BBH": 0.5418, + "MATH Level 5": 0.4713, + "GPQA": 0.2903, + "MUSR": 0.4551, + "MMLU-PRO": 0.4254 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.1", + "name": "Qwen2.5-7B-nerd-uncensored-v1.1", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.6626, + "BBH": 0.4864, + "MATH Level 5": 0.1329, + "GPQA": 0.2869, + "MUSR": 0.3843, + "MMLU-PRO": 0.385 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.2", + "name": "Qwen2.5-7B-nerd-uncensored-v1.2", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4965, + "BBH": 0.4946, + "MATH Level 5": 0.1208, + "GPQA": 0.3037, + "MUSR": 0.4172, + "MMLU-PRO": 0.3969 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.3", + "name": "Qwen2.5-7B-nerd-uncensored-v1.3", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4995, + "BBH": 0.5026, + "MATH Level 5": 0.1231, + "GPQA": 0.3129, + "MUSR": 0.4187, + "MMLU-PRO": 0.4016 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.4", + "name": "Qwen2.5-7B-nerd-uncensored-v1.4", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.6079, + "BBH": 0.5467, + "MATH Level 5": 0.281, + "GPQA": 0.3238, + "MUSR": 0.4714, + "MMLU-PRO": 0.4419 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.5", + "name": "Qwen2.5-7B-nerd-uncensored-v1.5", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.565, + "BBH": 0.5523, + "MATH Level 5": 0.2757, + "GPQA": 0.3272, + "MUSR": 0.4982, + "MMLU-PRO": 0.4448 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.7", + "name": "Qwen2.5-7B-nerd-uncensored-v1.7", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4202, + "BBH": 0.5392, + "MATH Level 5": 0.2915, + "GPQA": 0.3238, + "MUSR": 0.4848, + "MMLU-PRO": 0.428 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-nerd-uncensored-v1.8", + "name": "Qwen2.5-7B-nerd-uncensored-v1.8", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.6256, + "BBH": 0.5447, + "MATH Level 5": 0.2704, + "GPQA": 0.3238, + "MUSR": 0.4767, + "MMLU-PRO": 0.4343 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-olm-v1.0", + "name": "Qwen2.5-7B-olm-v1.0", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.5331, + "BBH": 0.566, + "MATH Level 5": 0.2863, + "GPQA": 0.3205, + "MUSR": 0.4278, + "MMLU-PRO": 0.4566 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-olm-v1.1", + "name": "Qwen2.5-7B-olm-v1.1", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4329, + "BBH": 0.5478, + "MATH Level 5": 0.3829, + "GPQA": 0.3087, + "MUSR": 0.4808, + "MMLU-PRO": 0.4354 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-olm-v1.2", + "name": "Qwen2.5-7B-olm-v1.2", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4203, + "BBH": 0.5533, + "MATH Level 5": 0.2847, + "GPQA": 0.3171, + "MUSR": 0.4688, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-olm-v1.3", + "name": "Qwen2.5-7B-olm-v1.3", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4219, + "BBH": 0.5532, + "MATH Level 5": 0.3104, + "GPQA": 0.3213, + "MUSR": 0.4701, + "MMLU-PRO": 0.447 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-olm-v1.4", + "name": "Qwen2.5-7B-olm-v1.4", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4545, + "BBH": 0.5582, + "MATH Level 5": 0.2923, + "GPQA": 0.3121, + "MUSR": 0.4622, + "MMLU-PRO": 0.4457 + } + }, + { + "model_id": "jeffmeloy/Qwen2.5-7B-olm-v1.5", + "name": "Qwen2.5-7B-olm-v1.5", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.4547, + "BBH": 0.5544, + "MATH Level 5": 0.2817, + "GPQA": 0.3398, + "MUSR": 0.4539, + "MMLU-PRO": 0.4399 + } + }, + { + "model_id": "jeffmeloy/jeffmeloy_Qwen2.5-7B-minperplexity-1", + "name": "jeffmeloy_Qwen2.5-7B-minperplexity-1", + "developer": "jeffmeloy", + "scores": { + "IFEval": 0.3757, + "BBH": 0.5582, + "MATH Level 5": 0.2915, + "GPQA": 0.3322, + "MUSR": 0.429, + "MMLU-PRO": 0.4368 + } + }, + { + "model_id": "jeonsworld/CarbonVillain-en-10.7B-v4", + "name": "CarbonVillain-en-10.7B-v4", + "developer": "jeonsworld", + "scores": { + "IFEval": 0.4579, + "BBH": 0.5168, + "MATH Level 5": 0.0468, + "GPQA": 0.3062, + "MUSR": 0.3965, + "MMLU-PRO": 0.3142 + } + }, + { + "model_id": "jiangxinyang-shanda/Homer-LLama3-8B", + "name": "Homer-LLama3-8B", + "developer": "jiangxinyang-shanda", + "scores": { + "IFEval": 0.3992, + "BBH": 0.5173, + "MATH Level 5": 0.0861, + "GPQA": 0.297, + "MUSR": 0.4056, + "MMLU-PRO": 0.3139 + } + }, + { + "model_id": "jieliu/Storm-7B", + "name": "Storm-7B", + "developer": "jieliu", + "scores": { + "IFEval": 0.3424, + "BBH": 0.5187, + "MATH Level 5": 0.0612, + "GPQA": 0.3079, + "MUSR": 0.4429, + "MMLU-PRO": 0.3119 + } + }, + { + "model_id": "jiviai/medX_v2", + "name": "medX_v2", + "developer": "jiviai", + "scores": { + "IFEval": 0.3743, + "BBH": 0.4509, + "MATH Level 5": 0.0544, + "GPQA": 0.323, + "MUSR": 0.3498, + "MMLU-PRO": 0.3428 + } + }, + { + "model_id": "jlzhou/Qwen2.5-3B-Infinity-Instruct-0625", + "name": "Qwen2.5-3B-Infinity-Instruct-0625", + "developer": "jlzhou", + "scores": { + "IFEval": 0.3558, + "BBH": 0.4774, + "MATH Level 5": 0.1367, + "GPQA": 0.2693, + "MUSR": 0.3981, + "MMLU-PRO": 0.3199 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.1-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.1-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4271, + "BBH": 0.5036, + "MATH Level 5": 0.0453, + "GPQA": 0.3221, + "MUSR": 0.4638, + "MMLU-PRO": 0.3739 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.1-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.1-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4253, + "BBH": 0.5019, + "MATH Level 5": 0.0967, + "GPQA": 0.3012, + "MUSR": 0.415, + "MMLU-PRO": 0.3724 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.3-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.3-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3377, + "BBH": 0.4917, + "MATH Level 5": 0.0106, + "GPQA": 0.3121, + "MUSR": 0.5018, + "MMLU-PRO": 0.3533 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.3-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.3-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4274, + "BBH": 0.5126, + "MATH Level 5": 0.0808, + "GPQA": 0.3087, + "MUSR": 0.4226, + "MMLU-PRO": 0.3739 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.5-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.5-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3204, + "BBH": 0.4884, + "MATH Level 5": 0.0038, + "GPQA": 0.302, + "MUSR": 0.5098, + "MMLU-PRO": 0.3344 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.5-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.5-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4396, + "BBH": 0.514, + "MATH Level 5": 0.0801, + "GPQA": 0.307, + "MUSR": 0.4398, + "MMLU-PRO": 0.3696 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.7-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.7-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.2814, + "BBH": 0.4854, + "MATH Level 5": 0.0023, + "GPQA": 0.2903, + "MUSR": 0.5163, + "MMLU-PRO": 0.3295 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.7-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.7-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4302, + "BBH": 0.5157, + "MATH Level 5": 0.0627, + "GPQA": 0.3079, + "MUSR": 0.4332, + "MMLU-PRO": 0.3663 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.9-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.9-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.279, + "BBH": 0.4861, + "MATH Level 5": 0.0015, + "GPQA": 0.2945, + "MUSR": 0.515, + "MMLU-PRO": 0.3305 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs-density-0.9-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs-density-0.9-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4223, + "BBH": 0.5154, + "MATH Level 5": 0.074, + "GPQA": 0.3079, + "MUSR": 0.4384, + "MMLU-PRO": 0.365 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.1-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.1-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4359, + "BBH": 0.5041, + "MATH Level 5": 0.0483, + "GPQA": 0.3104, + "MUSR": 0.4532, + "MMLU-PRO": 0.3762 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.1-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.1-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4202, + "BBH": 0.5011, + "MATH Level 5": 0.0982, + "GPQA": 0.3003, + "MUSR": 0.415, + "MMLU-PRO": 0.3699 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.3-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.3-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3518, + "BBH": 0.4999, + "MATH Level 5": 0.0234, + "GPQA": 0.3062, + "MUSR": 0.4871, + "MMLU-PRO": 0.3611 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.3-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.3-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4204, + "BBH": 0.5107, + "MATH Level 5": 0.0876, + "GPQA": 0.3045, + "MUSR": 0.4279, + "MMLU-PRO": 0.371 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.5-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.5-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3454, + "BBH": 0.4984, + "MATH Level 5": 0.0219, + "GPQA": 0.297, + "MUSR": 0.4911, + "MMLU-PRO": 0.3531 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.5-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.5-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4092, + "BBH": 0.5137, + "MATH Level 5": 0.0808, + "GPQA": 0.2953, + "MUSR": 0.4357, + "MMLU-PRO": 0.3669 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.7-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.7-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.2904, + "BBH": 0.4967, + "MATH Level 5": 0.0144, + "GPQA": 0.2995, + "MUSR": 0.4991, + "MMLU-PRO": 0.349 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.7-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.7-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4199, + "BBH": 0.5147, + "MATH Level 5": 0.0808, + "GPQA": 0.2987, + "MUSR": 0.4358, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.9-gamma-0.01", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.9-gamma-0.01", + "developer": "johnsutor", + "scores": { + "IFEval": 0.2913, + "BBH": 0.4918, + "MATH Level 5": 0.0106, + "GPQA": 0.3003, + "MUSR": 0.4977, + "MMLU-PRO": 0.3454 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_breadcrumbs_ties-density-0.9-gamma-0.1", + "name": "Llama-3-8B-Instruct_breadcrumbs_ties-density-0.9-gamma-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4162, + "BBH": 0.5139, + "MATH Level 5": 0.0778, + "GPQA": 0.297, + "MUSR": 0.4317, + "MMLU-PRO": 0.3625 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_dare_linear", + "name": "Llama-3-8B-Instruct_dare_linear", + "developer": "johnsutor", + "scores": { + "IFEval": 0.2145, + "BBH": 0.4283, + "MATH Level 5": 0.0, + "GPQA": 0.2961, + "MUSR": 0.4979, + "MMLU-PRO": 0.2414 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_dare_ties-density-0.1", + "name": "Llama-3-8B-Instruct_dare_ties-density-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.1891, + "BBH": 0.4119, + "MATH Level 5": 0.0008, + "GPQA": 0.2718, + "MUSR": 0.4658, + "MMLU-PRO": 0.2265 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_dare_ties-density-0.3", + "name": "Llama-3-8B-Instruct_dare_ties-density-0.3", + "developer": "johnsutor", + "scores": { + "IFEval": 0.2113, + "BBH": 0.4559, + "MATH Level 5": 0.0015, + "GPQA": 0.297, + "MUSR": 0.5069, + "MMLU-PRO": 0.304 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_dare_ties-density-0.7", + "name": "Llama-3-8B-Instruct_dare_ties-density-0.7", + "developer": "johnsutor", + "scores": { + "IFEval": 0.2034, + "BBH": 0.4723, + "MATH Level 5": 0.003, + "GPQA": 0.3037, + "MUSR": 0.511, + "MMLU-PRO": 0.3148 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_dare_ties-density-0.9", + "name": "Llama-3-8B-Instruct_dare_ties-density-0.9", + "developer": "johnsutor", + "scores": { + "IFEval": 0.2161, + "BBH": 0.4664, + "MATH Level 5": 0.0015, + "GPQA": 0.3079, + "MUSR": 0.523, + "MMLU-PRO": 0.3143 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_linear", + "name": "Llama-3-8B-Instruct_linear", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4308, + "BBH": 0.5031, + "MATH Level 5": 0.1005, + "GPQA": 0.2953, + "MUSR": 0.4097, + "MMLU-PRO": 0.3712 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_ties-density-0.1", + "name": "Llama-3-8B-Instruct_ties-density-0.1", + "developer": "johnsutor", + "scores": { + "IFEval": 0.4116, + "BBH": 0.5021, + "MATH Level 5": 0.0793, + "GPQA": 0.2886, + "MUSR": 0.4174, + "MMLU-PRO": 0.36 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_ties-density-0.3", + "name": "Llama-3-8B-Instruct_ties-density-0.3", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3626, + "BBH": 0.4906, + "MATH Level 5": 0.0672, + "GPQA": 0.2961, + "MUSR": 0.4025, + "MMLU-PRO": 0.3321 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_ties-density-0.5", + "name": "Llama-3-8B-Instruct_ties-density-0.5", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3797, + "BBH": 0.4793, + "MATH Level 5": 0.0612, + "GPQA": 0.3045, + "MUSR": 0.388, + "MMLU-PRO": 0.3175 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_ties-density-0.7", + "name": "Llama-3-8B-Instruct_ties-density-0.7", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3681, + "BBH": 0.4738, + "MATH Level 5": 0.0672, + "GPQA": 0.3096, + "MUSR": 0.3881, + "MMLU-PRO": 0.3152 + } + }, + { + "model_id": "johnsutor/Llama-3-8B-Instruct_ties-density-0.9", + "name": "Llama-3-8B-Instruct_ties-density-0.9", + "developer": "johnsutor", + "scores": { + "IFEval": 0.3858, + "BBH": 0.4735, + "MATH Level 5": 0.0619, + "GPQA": 0.2995, + "MUSR": 0.388, + "MMLU-PRO": 0.3182 + } + }, + { + "model_id": "jpacifico/Chocolatine-14B-Instruct-4k-DPO", + "name": "Chocolatine-14B-Instruct-4k-DPO", + "developer": "jpacifico", + "scores": { + "IFEval": 0.4689, + "BBH": 0.63, + "MATH Level 5": 0.1782, + "GPQA": 0.3414, + "MUSR": 0.4439, + "MMLU-PRO": 0.4764 + } + }, + { + "model_id": "jpacifico/Chocolatine-14B-Instruct-DPO-v1.2", + "name": "Chocolatine-14B-Instruct-DPO-v1.2", + "developer": "jpacifico", + "scores": { + "IFEval": 0.6852, + "BBH": 0.6438, + "MATH Level 5": 0.2092, + "GPQA": 0.3255, + "MUSR": 0.4268, + "MMLU-PRO": 0.4697 + } + }, + { + "model_id": "jpacifico/Chocolatine-14B-Instruct-DPO-v1.3", + "name": "Chocolatine-14B-Instruct-DPO-v1.3", + "developer": "jpacifico", + "scores": { + "IFEval": 0.704, + "BBH": 0.6846, + "MATH Level 5": 0.5619, + "GPQA": 0.3414, + "MUSR": 0.4234, + "MMLU-PRO": 0.5374 + } + }, + { + "model_id": "jpacifico/Chocolatine-2-14B-Instruct-DPO-v2.0b1", + "name": "Chocolatine-2-14B-Instruct-DPO-v2.0b1", + "developer": "jpacifico", + "scores": { + "IFEval": 0.1033, + "BBH": 0.6696, + "MATH Level 5": 0.2757, + "GPQA": 0.3758, + "MUSR": 0.4467, + "MMLU-PRO": 0.5124 + } + }, + { + "model_id": "jpacifico/Chocolatine-2-14B-Instruct-v2.0", + "name": "Chocolatine-2-14B-Instruct-v2.0", + "developer": "jpacifico", + "scores": { + "IFEval": 0.0885, + "BBH": 0.677, + "MATH Level 5": 0.4804, + "GPQA": 0.3876, + "MUSR": 0.5021, + "MMLU-PRO": 0.5302 + } + }, + { + "model_id": "jpacifico/Chocolatine-2-14B-Instruct-v2.0.1", + "name": "Chocolatine-2-14B-Instruct-v2.0.1", + "developer": "jpacifico", + "scores": { + "IFEval": 0.0742, + "BBH": 0.6736, + "MATH Level 5": 0.4796, + "GPQA": 0.3918, + "MUSR": 0.5008, + "MMLU-PRO": 0.5299 + } + }, + { + "model_id": "jpacifico/Chocolatine-2-14B-Instruct-v2.0.3", + "name": "Chocolatine-2-14B-Instruct-v2.0.3", + "developer": "jpacifico", + "scores": { + "IFEval": 0.7037, + "BBH": 0.6548, + "MATH Level 5": 0.4207, + "GPQA": 0.3792, + "MUSR": 0.4768, + "MMLU-PRO": 0.5374 + } + }, + { + "model_id": "jpacifico/Chocolatine-2-14B-Instruct-v2.0b2", + "name": "Chocolatine-2-14B-Instruct-v2.0b2", + "developer": "jpacifico", + "scores": { + "IFEval": 0.7241, + "BBH": 0.6476, + "MATH Level 5": 0.395, + "GPQA": 0.3834, + "MUSR": 0.4808, + "MMLU-PRO": 0.5369 + } + }, + { + "model_id": "jpacifico/Chocolatine-2-14B-Instruct-v2.0b3", + "name": "Chocolatine-2-14B-Instruct-v2.0b3", + "developer": "jpacifico", + "scores": { + "IFEval": 0.7323, + "BBH": 0.6469, + "MATH Level 5": 0.4109, + "GPQA": 0.3792, + "MUSR": 0.4781, + "MMLU-PRO": 0.5337 + } + }, + { + "model_id": "jpacifico/Chocolatine-3B-Instruct-DPO-Revised", + "name": "Chocolatine-3B-Instruct-DPO-Revised", + "developer": "jpacifico", + "scores": { + "IFEval": 0.5623, + "BBH": 0.554, + "MATH Level 5": 0.1805, + "GPQA": 0.3221, + "MUSR": 0.4453, + "MMLU-PRO": 0.3989 + } + }, + { + "model_id": "jpacifico/Chocolatine-3B-Instruct-DPO-v1.0", + "name": "Chocolatine-3B-Instruct-DPO-v1.0", + "developer": "jpacifico", + "scores": { + "IFEval": 0.3737, + "BBH": 0.5471, + "MATH Level 5": 0.1782, + "GPQA": 0.3154, + "MUSR": 0.4755, + "MMLU-PRO": 0.3937 + } + }, + { + "model_id": "jpacifico/Chocolatine-3B-Instruct-DPO-v1.2", + "name": "Chocolatine-3B-Instruct-DPO-v1.2", + "developer": "jpacifico", + "scores": { + "IFEval": 0.5455, + "BBH": 0.5487, + "MATH Level 5": 0.2047, + "GPQA": 0.3389, + "MUSR": 0.4154, + "MMLU-PRO": 0.3877 + } + }, + { + "model_id": "jpacifico/Distilucie-7B-Math-Instruct-DPO-v0.1", + "name": "Distilucie-7B-Math-Instruct-DPO-v0.1", + "developer": "jpacifico", + "scores": { + "IFEval": 0.3048, + "BBH": 0.3835, + "MATH Level 5": 0.0257, + "GPQA": 0.2995, + "MUSR": 0.3644, + "MMLU-PRO": 0.1809 + } + }, + { + "model_id": "jpacifico/Lucie-7B-Instruct-DPO-v1.1", + "name": "Lucie-7B-Instruct-DPO-v1.1", + "developer": "jpacifico", + "scores": { + "IFEval": 0.3121, + "BBH": 0.3781, + "MATH Level 5": 0.0234, + "GPQA": 0.2878, + "MUSR": 0.4016, + "MMLU-PRO": 0.1838 + } + }, + { + "model_id": "jpacifico/Lucie-7B-Instruct-DPO-v1.1.3", + "name": "Lucie-7B-Instruct-DPO-v1.1.3", + "developer": "jpacifico", + "scores": { + "IFEval": 0.3045, + "BBH": 0.3819, + "MATH Level 5": 0.0242, + "GPQA": 0.2861, + "MUSR": 0.3818, + "MMLU-PRO": 0.1764 + } + }, + { + "model_id": "jpacifico/Lucie-7B-Instruct-Merged-Model_Stock-v1.0", + "name": "Lucie-7B-Instruct-Merged-Model_Stock-v1.0", + "developer": "jpacifico", + "scores": { + "IFEval": 0.3234, + "BBH": 0.3802, + "MATH Level 5": 0.0242, + "GPQA": 0.2886, + "MUSR": 0.3844, + "MMLU-PRO": 0.1871 + } + }, + { + "model_id": "jpacifico/Lucie-7B-Instruct-Merged-Model_Stock-v1.1", + "name": "Lucie-7B-Instruct-Merged-Model_Stock-v1.1", + "developer": "jpacifico", + "scores": { + "IFEval": 0.3014, + "BBH": 0.3808, + "MATH Level 5": 0.0279, + "GPQA": 0.2827, + "MUSR": 0.375, + "MMLU-PRO": 0.1862 + } + }, + { + "model_id": "jpacifico/Lucie-Boosted-7B-Instruct", + "name": "Lucie-Boosted-7B-Instruct", + "developer": "jpacifico", + "scores": { + "IFEval": 0.2566, + "BBH": 0.3465, + "MATH Level 5": 0.0128, + "GPQA": 0.2668, + "MUSR": 0.3699, + "MMLU-PRO": 0.163 + } + }, + { + "model_id": "jsfs11/L3-8B-Stheno-slerp", + "name": "L3-8B-Stheno-slerp", + "developer": "jsfs11", + "scores": { + "IFEval": 0.6752, + "BBH": 0.5326, + "MATH Level 5": 0.0989, + "GPQA": 0.2852, + "MUSR": 0.3725, + "MMLU-PRO": 0.3649 + } + }, + { + "model_id": "jsfs11/MixtureofMerges-MoE-4x7b-v4", + "name": "MixtureofMerges-MoE-4x7b-v4", + "developer": "jsfs11", + "scores": { + "IFEval": 0.403, + "BBH": 0.5169, + "MATH Level 5": 0.0634, + "GPQA": 0.2861, + "MUSR": 0.4386, + "MMLU-PRO": 0.3032 + } + }, + { + "model_id": "jsfs11/MixtureofMerges-MoE-4x7b-v5", + "name": "MixtureofMerges-MoE-4x7b-v5", + "developer": "jsfs11", + "scores": { + "IFEval": 0.4199, + "BBH": 0.5198, + "MATH Level 5": 0.0755, + "GPQA": 0.2844, + "MUSR": 0.4305, + "MMLU-PRO": 0.3098 + } + }, + { + "model_id": "kaist-ai/janus-7b", + "name": "janus-7b", + "developer": "kaist-ai", + "scores": { + "IFEval": 0.3775, + "BBH": 0.4694, + "MATH Level 5": 0.0408, + "GPQA": 0.2727, + "MUSR": 0.4401, + "MMLU-PRO": 0.2874 + } + }, + { + "model_id": "kaist-ai/janus-dpo-7b", + "name": "janus-dpo-7b", + "developer": "kaist-ai", + "scores": { + "IFEval": 0.4003, + "BBH": 0.4773, + "MATH Level 5": 0.0415, + "GPQA": 0.2819, + "MUSR": 0.4387, + "MMLU-PRO": 0.2976 + } + }, + { + "model_id": "kaist-ai/janus-rm-7b", + "name": "janus-rm-7b", + "developer": "kaist-ai", + "scores": { + "IFEval": 0.1778, + "BBH": 0.3056, + "MATH Level 5": 0.0, + "GPQA": 0.2517, + "MUSR": 0.3883, + "MMLU-PRO": 0.1126 + } + }, + { + "model_id": "kaist-ai/mistral-orpo-capybara-7k", + "name": "mistral-orpo-capybara-7k", + "developer": "kaist-ai", + "scores": { + "IFEval": 0.5367, + "BBH": 0.4489, + "MATH Level 5": 0.0393, + "GPQA": 0.2861, + "MUSR": 0.3964, + "MMLU-PRO": 0.2971 + } + }, + { + "model_id": "kavonalds/BunderMaxx-0710", + "name": "BunderMaxx-0710", + "developer": "kavonalds", + "scores": { + "IFEval": 0.2701, + "BBH": 0.5566, + "MATH Level 5": 0.068, + "GPQA": 0.2802, + "MUSR": 0.3682, + "MMLU-PRO": 0.1449 + } + }, + { + "model_id": "kavonalds/BunderMaxx-1010", + "name": "BunderMaxx-1010", + "developer": "kavonalds", + "scores": { + "IFEval": 0.2981, + "BBH": 0.702, + "MATH Level 5": 0.105, + "GPQA": 0.2609, + "MUSR": 0.3484, + "MMLU-PRO": 0.1224 + } + }, + { + "model_id": "kavonalds/Lancer-1-1b-Instruct", + "name": "Lancer-1-1b-Instruct", + "developer": "kavonalds", + "scores": { + "IFEval": 0.5546, + "BBH": 0.3253, + "MATH Level 5": 0.0393, + "GPQA": 0.2617, + "MUSR": 0.3144, + "MMLU-PRO": 0.1568 + } + }, + { + "model_id": "kayfour/T3Q-Qwen2.5-7B-it-KOR-Safe", + "name": "T3Q-Qwen2.5-7B-it-KOR-Safe", + "developer": "kayfour", + "scores": { + "IFEval": 0.6081, + "BBH": 0.555, + "MATH Level 5": 0.3761, + "GPQA": 0.3213, + "MUSR": 0.4277, + "MMLU-PRO": 0.4464 + } + }, + { + "model_id": "keeeeenw/MicroLlama", + "name": "MicroLlama", + "developer": "keeeeenw", + "scores": { + "IFEval": 0.1985, + "BBH": 0.3007, + "MATH Level 5": 0.0113, + "GPQA": 0.2609, + "MUSR": 0.3698, + "MMLU-PRO": 0.1138 + } + }, + { + "model_id": "kekmodel/StopCarbon-10.7B-v5", + "name": "StopCarbon-10.7B-v5", + "developer": "kekmodel", + "scores": { + "IFEval": 0.4728, + "BBH": 0.5178, + "MATH Level 5": 0.0559, + "GPQA": 0.3062, + "MUSR": 0.4019, + "MMLU-PRO": 0.3157 + } + }, + { + "model_id": "kevin009/llamaRAGdrama", + "name": "llamaRAGdrama", + "developer": "kevin009", + "scores": { + "IFEval": 0.2598, + "BBH": 0.4007, + "MATH Level 5": 0.0431, + "GPQA": 0.2643, + "MUSR": 0.4316, + "MMLU-PRO": 0.2724 + } + }, + { + "model_id": "khoantap/cheap-moe-merge", + "name": "cheap-moe-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.4557, + "BBH": 0.5131, + "MATH Level 5": 0.0921, + "GPQA": 0.2953, + "MUSR": 0.4103, + "MMLU-PRO": 0.3339 + } + }, + { + "model_id": "khoantap/llama-3-8b-stock-merge", + "name": "llama-3-8b-stock-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.4812, + "BBH": 0.5162, + "MATH Level 5": 0.1616, + "GPQA": 0.318, + "MUSR": 0.3946, + "MMLU-PRO": 0.38 + } + }, + { + "model_id": "khoantap/llama-breadcrumbs-ties-merge", + "name": "llama-breadcrumbs-ties-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.2205, + "BBH": 0.5416, + "MATH Level 5": 0.1125, + "GPQA": 0.2659, + "MUSR": 0.4434, + "MMLU-PRO": 0.3172 + } + }, + { + "model_id": "khoantap/llama-evolve-ties-best-merge", + "name": "llama-evolve-ties-best-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.6744, + "BBH": 0.5414, + "MATH Level 5": 0.1563, + "GPQA": 0.3171, + "MUSR": 0.3946, + "MMLU-PRO": 0.386 + } + }, + { + "model_id": "khoantap/llama-linear-0.5-0.5-1-merge", + "name": "llama-linear-0.5-0.5-1-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.4812, + "BBH": 0.5643, + "MATH Level 5": 0.2054, + "GPQA": 0.307, + "MUSR": 0.4143, + "MMLU-PRO": 0.3833 + } + }, + { + "model_id": "khoantap/llama-linear-0.5-1-0.5-merge", + "name": "llama-linear-0.5-1-0.5-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.5032, + "BBH": 0.5951, + "MATH Level 5": 0.148, + "GPQA": 0.2936, + "MUSR": 0.4172, + "MMLU-PRO": 0.369 + } + }, + { + "model_id": "khoantap/llama-linear-1-0.5-0.5-merge", + "name": "llama-linear-1-0.5-0.5-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.4515, + "BBH": 0.5526, + "MATH Level 5": 0.2477, + "GPQA": 0.2928, + "MUSR": 0.4118, + "MMLU-PRO": 0.3635 + } + }, + { + "model_id": "khoantap/llama-slerp-merge", + "name": "llama-slerp-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.498, + "BBH": 0.5783, + "MATH Level 5": 0.0831, + "GPQA": 0.3029, + "MUSR": 0.4053, + "MMLU-PRO": 0.3678 + } + }, + { + "model_id": "khoantap/moe-out-merge", + "name": "moe-out-merge", + "developer": "khoantap", + "scores": { + "IFEval": 0.4505, + "BBH": 0.5151, + "MATH Level 5": 0.0929, + "GPQA": 0.2886, + "MUSR": 0.4063, + "MMLU-PRO": 0.3348 + } + }, + { + "model_id": "khulaifi95/Llama-3.1-8B-Reason-Blend-888k", + "name": "Llama-3.1-8B-Reason-Blend-888k", + "developer": "khulaifi95", + "scores": { + "IFEval": 0.5832, + "BBH": 0.479, + "MATH Level 5": 0.1156, + "GPQA": 0.2794, + "MUSR": 0.3379, + "MMLU-PRO": 0.31 + } + }, + { + "model_id": "kms7530/chemeng_llama-3-8b-Instruct-bnb-4bit_24_1_100_1", + "name": "chemeng_llama-3-8b-Instruct-bnb-4bit_24_1_100_1", + "developer": "kms7530", + "scores": { + "IFEval": 0.5455, + "BBH": 0.4289, + "MATH Level 5": 0.0619, + "GPQA": 0.2701, + "MUSR": 0.3821, + "MMLU-PRO": 0.2798 + } + }, + { + "model_id": "kms7530/chemeng_phi-3-mini-4k-instruct-bnb-4bit_16_4_100_1_nonmath", + "name": "chemeng_phi-3-mini-4k-instruct-bnb-4bit_16_4_100_1_nonmath", + "developer": "kms7530", + "scores": { + "IFEval": 0.4863, + "BBH": 0.4987, + "MATH Level 5": 0.108, + "GPQA": 0.3104, + "MUSR": 0.3983, + "MMLU-PRO": 0.3481 + } + }, + { + "model_id": "kms7530/chemeng_qwen-math-7b_24_1_100_1", + "name": "chemeng_qwen-math-7b_24_1_100_1", + "developer": "kms7530", + "scores": { + "IFEval": 0.2111, + "BBH": 0.3578, + "MATH Level 5": 0.2243, + "GPQA": 0.2441, + "MUSR": 0.3687, + "MMLU-PRO": 0.2158 + } + }, + { + "model_id": "kms7530/chemeng_qwen-math-7b_24_1_100_1_nonmath", + "name": "chemeng_qwen-math-7b_24_1_100_1_nonmath", + "developer": "kms7530", + "scores": { + "IFEval": 0.2584, + "BBH": 0.3893, + "MATH Level 5": 0.3097, + "GPQA": 0.2903, + "MUSR": 0.4087, + "MMLU-PRO": 0.2452 + } + }, + { + "model_id": "kno10/ende-chat-0.0.5", + "name": "ende-chat-0.0.5", + "developer": "kno10", + "scores": { + "IFEval": 0.3404, + "BBH": 0.3604, + "MATH Level 5": 0.0204, + "GPQA": 0.2651, + "MUSR": 0.3938, + "MMLU-PRO": 0.179 + } + }, + { + "model_id": "kno10/ende-chat-0.0.7", + "name": "ende-chat-0.0.7", + "developer": "kno10", + "scores": { + "IFEval": 0.4401, + "BBH": 0.3792, + "MATH Level 5": 0.0174, + "GPQA": 0.281, + "MUSR": 0.3861, + "MMLU-PRO": 0.1966 + } + }, + { + "model_id": "kyutai/helium-1-preview-2b", + "name": "helium-1-preview-2b", + "developer": "kyutai", + "scores": { + "IFEval": 0.2614, + "BBH": 0.3638, + "MATH Level 5": 0.0136, + "GPQA": 0.2785, + "MUSR": 0.355, + "MMLU-PRO": 0.1873 + } + }, + { + "model_id": "kz919/QwQ-0.5B-Distilled-SFT", + "name": "QwQ-0.5B-Distilled-SFT", + "developer": "kz919", + "scores": { + "IFEval": 0.3077, + "BBH": 0.3256, + "MATH Level 5": 0.074, + "GPQA": 0.2609, + "MUSR": 0.3409, + "MMLU-PRO": 0.1587 + } + }, + { + "model_id": "ladydaina/ECE-FDF", + "name": "ECE-FDF", + "developer": "ladydaina", + "scores": { + "IFEval": 0.3728, + "BBH": 0.515, + "MATH Level 5": 0.0816, + "GPQA": 0.2827, + "MUSR": 0.4504, + "MMLU-PRO": 0.3007 + } + }, + { + "model_id": "laislemke/LLaMA-2-vicuna-7b-slerp", + "name": "LLaMA-2-vicuna-7b-slerp", + "developer": "laislemke", + "scores": { + "IFEval": 0.2932, + "BBH": 0.2986, + "MATH Level 5": 0.0113, + "GPQA": 0.2735, + "MUSR": 0.3833, + "MMLU-PRO": 0.1342 + } + }, + { + "model_id": "lalainy/ECE-PRYMMAL-0.5B-FT-V5-MUSR", + "name": "ECE-PRYMMAL-0.5B-FT-V5-MUSR", + "developer": "lalainy", + "scores": { + "IFEval": 0.2138, + "BBH": 0.3269, + "MATH Level 5": 0.0453, + "GPQA": 0.2743, + "MUSR": 0.3262, + "MMLU-PRO": 0.1533 + } + }, + { + "model_id": "lalainy/ECE-PRYMMAL-0.5B-SLERP-V4", + "name": "ECE-PRYMMAL-0.5B-SLERP-V4", + "developer": "lalainy", + "scores": { + "IFEval": 0.1564, + "BBH": 0.2894, + "MATH Level 5": 0.0, + "GPQA": 0.2626, + "MUSR": 0.3789, + "MMLU-PRO": 0.1169 + } + }, + { + "model_id": "lalainy/ECE-PRYMMAL-YL-0.5B-SLERP-BIS-V1", + "name": "ECE-PRYMMAL-YL-0.5B-SLERP-BIS-V1", + "developer": "lalainy", + "scores": { + "IFEval": 0.1437, + "BBH": 0.3032, + "MATH Level 5": 0.0008, + "GPQA": 0.2349, + "MUSR": 0.3646, + "MMLU-PRO": 0.1121 + } + }, + { + "model_id": "lalainy/ECE-PRYMMAL-YL-1B-SLERP-V3", + "name": "ECE-PRYMMAL-YL-1B-SLERP-V3", + "developer": "lalainy", + "scores": { + "IFEval": 0.325, + "BBH": 0.4225, + "MATH Level 5": 0.0974, + "GPQA": 0.2945, + "MUSR": 0.4213, + "MMLU-PRO": 0.2931 + } + }, + { + "model_id": "lalainy/ECE-PRYMMAL-YL-1B-SLERP-V4", + "name": "ECE-PRYMMAL-YL-1B-SLERP-V4", + "developer": "lalainy", + "scores": { + "IFEval": 0.3324, + "BBH": 0.4171, + "MATH Level 5": 0.1005, + "GPQA": 0.2861, + "MUSR": 0.4306, + "MMLU-PRO": 0.2893 + } + }, + { + "model_id": "lalainy/ECE-PRYMMAL-YL-6B-SLERP-V1", + "name": "ECE-PRYMMAL-YL-6B-SLERP-V1", + "developer": "lalainy", + "scores": { + "IFEval": 0.3264, + "BBH": 0.4629, + "MATH Level 5": 0.1269, + "GPQA": 0.2886, + "MUSR": 0.4864, + "MMLU-PRO": 0.3214 + } + }, + { + "model_id": "lalainy/ECE-PRYMMAL-YL-6B-SLERP-V2", + "name": "ECE-PRYMMAL-YL-6B-SLERP-V2", + "developer": "lalainy", + "scores": { + "IFEval": 0.3249, + "BBH": 0.4629, + "MATH Level 5": 0.1269, + "GPQA": 0.2886, + "MUSR": 0.4864, + "MMLU-PRO": 0.3214 + } + }, + { + "model_id": "langgptai/Qwen-las-v0.1", + "name": "Qwen-las-v0.1", + "developer": "langgptai", + "scores": { + "IFEval": 0.3301, + "BBH": 0.3893, + "MATH Level 5": 0.037, + "GPQA": 0.2466, + "MUSR": 0.3701, + "MMLU-PRO": 0.2325 + } + }, + { + "model_id": "langgptai/qwen1.5-7b-chat-sa-v0.1", + "name": "qwen1.5-7b-chat-sa-v0.1", + "developer": "langgptai", + "scores": { + "IFEval": 0.4268, + "BBH": 0.4325, + "MATH Level 5": 0.0302, + "GPQA": 0.3121, + "MUSR": 0.3551, + "MMLU-PRO": 0.2993 + } + }, + { + "model_id": "lars1234/Mistral-Small-24B-Instruct-2501-writer", + "name": "Mistral-Small-24B-Instruct-2501-writer", + "developer": "lars1234", + "scores": { + "IFEval": 0.6565, + "BBH": 0.6733, + "MATH Level 5": 0.3557, + "GPQA": 0.3893, + "MUSR": 0.4645, + "MMLU-PRO": 0.5448 + } + }, + { + "model_id": "leafspark/Llama-3.1-8B-MultiReflection-Instruct", + "name": "Llama-3.1-8B-MultiReflection-Instruct", + "developer": "leafspark", + "scores": { + "IFEval": 0.7125, + "BBH": 0.5009, + "MATH Level 5": 0.1707, + "GPQA": 0.2928, + "MUSR": 0.3682, + "MMLU-PRO": 0.3724 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-9B", + "name": "Gemma-2-Ataraxy-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.3009, + "BBH": 0.5931, + "MATH Level 5": 0.0853, + "GPQA": 0.3347, + "MUSR": 0.4424, + "MMLU-PRO": 0.4226 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-Advanced-9B", + "name": "Gemma-2-Ataraxy-Advanced-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.5516, + "BBH": 0.5889, + "MATH Level 5": 0.1979, + "GPQA": 0.3356, + "MUSR": 0.3761, + "MMLU-PRO": 0.4244 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-Remix-9B", + "name": "Gemma-2-Ataraxy-Remix-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.7083, + "BBH": 0.5892, + "MATH Level 5": 0.2017, + "GPQA": 0.3389, + "MUSR": 0.4372, + "MMLU-PRO": 0.4239 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v2-9B", + "name": "Gemma-2-Ataraxy-v2-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.2136, + "BBH": 0.5766, + "MATH Level 5": 0.0846, + "GPQA": 0.3423, + "MUSR": 0.3484, + "MMLU-PRO": 0.4221 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v2a-9B", + "name": "Gemma-2-Ataraxy-v2a-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.1595, + "BBH": 0.5182, + "MATH Level 5": 0.0612, + "GPQA": 0.3398, + "MUSR": 0.3165, + "MMLU-PRO": 0.3515 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v2f-9B", + "name": "Gemma-2-Ataraxy-v2f-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.3791, + "BBH": 0.5193, + "MATH Level 5": 0.1163, + "GPQA": 0.3389, + "MUSR": 0.3231, + "MMLU-PRO": 0.3503 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v3-Advanced-9B", + "name": "Gemma-2-Ataraxy-v3-Advanced-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.6602, + "BBH": 0.5935, + "MATH Level 5": 0.1873, + "GPQA": 0.3364, + "MUSR": 0.445, + "MMLU-PRO": 0.4196 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v3b-9B", + "name": "Gemma-2-Ataraxy-v3b-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.6809, + "BBH": 0.5908, + "MATH Level 5": 0.2153, + "GPQA": 0.3331, + "MUSR": 0.4489, + "MMLU-PRO": 0.4205 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v3i-9B", + "name": "Gemma-2-Ataraxy-v3i-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.4203, + "BBH": 0.5626, + "MATH Level 5": 0.1533, + "GPQA": 0.328, + "MUSR": 0.3181, + "MMLU-PRO": 0.4166 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v3j-9B", + "name": "Gemma-2-Ataraxy-v3j-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.4169, + "BBH": 0.5632, + "MATH Level 5": 0.1692, + "GPQA": 0.328, + "MUSR": 0.318, + "MMLU-PRO": 0.4134 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v4-Advanced-9B", + "name": "Gemma-2-Ataraxy-v4-Advanced-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.7015, + "BBH": 0.6024, + "MATH Level 5": 0.2153, + "GPQA": 0.3389, + "MUSR": 0.4581, + "MMLU-PRO": 0.4367 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v4a-Advanced-9B", + "name": "Gemma-2-Ataraxy-v4a-Advanced-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.7135, + "BBH": 0.5988, + "MATH Level 5": 0.2115, + "GPQA": 0.344, + "MUSR": 0.4489, + "MMLU-PRO": 0.4309 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v4b-9B", + "name": "Gemma-2-Ataraxy-v4b-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.6878, + "BBH": 0.6039, + "MATH Level 5": 0.2334, + "GPQA": 0.3406, + "MUSR": 0.4555, + "MMLU-PRO": 0.4357 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v4c-9B", + "name": "Gemma-2-Ataraxy-v4c-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.6945, + "BBH": 0.6084, + "MATH Level 5": 0.2266, + "GPQA": 0.3339, + "MUSR": 0.4528, + "MMLU-PRO": 0.4395 + } + }, + { + "model_id": "lemon07r/Gemma-2-Ataraxy-v4d-9B", + "name": "Gemma-2-Ataraxy-v4d-9B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.725, + "BBH": 0.6054, + "MATH Level 5": 0.2334, + "GPQA": 0.3473, + "MUSR": 0.4541, + "MMLU-PRO": 0.4346 + } + }, + { + "model_id": "lemon07r/Llama-3-RedMagic4-8B", + "name": "Llama-3-RedMagic4-8B", + "developer": "lemon07r", + "scores": { + "IFEval": 0.4864, + "BBH": 0.4256, + "MATH Level 5": 0.0899, + "GPQA": 0.2903, + "MUSR": 0.3766, + "MMLU-PRO": 0.3676 + } + }, + { + "model_id": "lemon07r/llama-3-NeuralMahou-8b", + "name": "llama-3-NeuralMahou-8b", + "developer": "lemon07r", + "scores": { + "IFEval": 0.4901, + "BBH": 0.4184, + "MATH Level 5": 0.102, + "GPQA": 0.2886, + "MUSR": 0.3873, + "MMLU-PRO": 0.369 + } + }, + { + "model_id": "lesubra/ECE-EIFFEL-3B", + "name": "ECE-EIFFEL-3B", + "developer": "lesubra", + "scores": { + "IFEval": 0.3469, + "BBH": 0.5102, + "MATH Level 5": 0.1216, + "GPQA": 0.3314, + "MUSR": 0.4362, + "MMLU-PRO": 0.3821 + } + }, + { + "model_id": "lesubra/ECE-EIFFEL-3Bv2", + "name": "ECE-EIFFEL-3Bv2", + "developer": "lesubra", + "scores": { + "IFEval": 0.3013, + "BBH": 0.5424, + "MATH Level 5": 0.1186, + "GPQA": 0.3356, + "MUSR": 0.4443, + "MMLU-PRO": 0.3999 + } + }, + { + "model_id": "lesubra/ECE-EIFFEL-3Bv3", + "name": "ECE-EIFFEL-3Bv3", + "developer": "lesubra", + "scores": { + "IFEval": 0.3786, + "BBH": 0.5469, + "MATH Level 5": 0.1669, + "GPQA": 0.3297, + "MUSR": 0.4675, + "MMLU-PRO": 0.3975 + } + }, + { + "model_id": "lesubra/ECE-PRYMMAL-3B-SLERP-V1", + "name": "ECE-PRYMMAL-3B-SLERP-V1", + "developer": "lesubra", + "scores": { + "IFEval": 0.2933, + "BBH": 0.5341, + "MATH Level 5": 0.1662, + "GPQA": 0.3171, + "MUSR": 0.4595, + "MMLU-PRO": 0.39 + } + }, + { + "model_id": "lesubra/ECE-PRYMMAL-3B-SLERP-V2", + "name": "ECE-PRYMMAL-3B-SLERP-V2", + "developer": "lesubra", + "scores": { + "IFEval": 0.2933, + "BBH": 0.5341, + "MATH Level 5": 0.1662, + "GPQA": 0.3171, + "MUSR": 0.4595, + "MMLU-PRO": 0.39 + } + }, + { + "model_id": "lesubra/ECE-PRYMMAL-3B-SLERP_2-V1", + "name": "ECE-PRYMMAL-3B-SLERP_2-V1", + "developer": "lesubra", + "scores": { + "IFEval": 0.3649, + "BBH": 0.5411, + "MATH Level 5": 0.1677, + "GPQA": 0.3213, + "MUSR": 0.4661, + "MMLU-PRO": 0.399 + } + }, + { + "model_id": "lesubra/ECE-PRYMMAL-3B-SLERP_2-V2", + "name": "ECE-PRYMMAL-3B-SLERP_2-V2", + "developer": "lesubra", + "scores": { + "IFEval": 0.3664, + "BBH": 0.5411, + "MATH Level 5": 0.1677, + "GPQA": 0.3213, + "MUSR": 0.4661, + "MMLU-PRO": 0.399 + } + }, + { + "model_id": "lesubra/merge-test", + "name": "merge-test", + "developer": "lesubra", + "scores": { + "IFEval": 0.5383, + "BBH": 0.524, + "MATH Level 5": 0.1208, + "GPQA": 0.3221, + "MUSR": 0.4419, + "MMLU-PRO": 0.3874 + } + }, + { + "model_id": "lightblue/suzume-llama-3-8B-multilingual", + "name": "suzume-llama-3-8B-multilingual", + "developer": "lightblue", + "scores": { + "IFEval": 0.6678, + "BBH": 0.495, + "MATH Level 5": 0.0944, + "GPQA": 0.2836, + "MUSR": 0.3977, + "MMLU-PRO": 0.3383 + } + }, + { + "model_id": "lightblue/suzume-llama-3-8B-multilingual-orpo-borda-full", + "name": "suzume-llama-3-8B-multilingual-orpo-borda-full", + "developer": "lightblue", + "scores": { + "IFEval": 0.5817, + "BBH": 0.4714, + "MATH Level 5": 0.0763, + "GPQA": 0.2592, + "MUSR": 0.3222, + "MMLU-PRO": 0.331 + } + }, + { + "model_id": "lightblue/suzume-llama-3-8B-multilingual-orpo-borda-half", + "name": "suzume-llama-3-8B-multilingual-orpo-borda-half", + "developer": "lightblue", + "scores": { + "IFEval": 0.6249, + "BBH": 0.4707, + "MATH Level 5": 0.0906, + "GPQA": 0.245, + "MUSR": 0.3516, + "MMLU-PRO": 0.3614 + } + }, + { + "model_id": "lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top25", + "name": "suzume-llama-3-8B-multilingual-orpo-borda-top25", + "developer": "lightblue", + "scores": { + "IFEval": 0.6637, + "BBH": 0.4865, + "MATH Level 5": 0.1042, + "GPQA": 0.2727, + "MUSR": 0.3566, + "MMLU-PRO": 0.3684 + } + }, + { + "model_id": "lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top75", + "name": "suzume-llama-3-8B-multilingual-orpo-borda-top75", + "developer": "lightblue", + "scores": { + "IFEval": 0.6687, + "BBH": 0.4833, + "MATH Level 5": 0.0785, + "GPQA": 0.2727, + "MUSR": 0.3817, + "MMLU-PRO": 0.3769 + } + }, + { + "model_id": "lkoenig/BBAI_145_", + "name": "BBAI_145_", + "developer": "lkoenig", + "scores": { + "IFEval": 0.445, + "BBH": 0.5567, + "MATH Level 5": 0.361, + "GPQA": 0.3163, + "MUSR": 0.4382, + "MMLU-PRO": 0.449 + } + }, + { + "model_id": "lkoenig/BBAI_200_Gemma", + "name": "BBAI_200_Gemma", + "developer": "lkoenig", + "scores": { + "IFEval": 0.0705, + "BBH": 0.3449, + "MATH Level 5": 0.0, + "GPQA": 0.2668, + "MUSR": 0.3631, + "MMLU-PRO": 0.1679 + } + }, + { + "model_id": "lkoenig/BBAI_212_QwenLawLo", + "name": "BBAI_212_QwenLawLo", + "developer": "lkoenig", + "scores": { + "IFEval": 0.4566, + "BBH": 0.5574, + "MATH Level 5": 0.3603, + "GPQA": 0.3163, + "MUSR": 0.437, + "MMLU-PRO": 0.4489 + } + }, + { + "model_id": "lkoenig/BBAI_212_Qwencore", + "name": "BBAI_212_Qwencore", + "developer": "lkoenig", + "scores": { + "IFEval": 0.4384, + "BBH": 0.5569, + "MATH Level 5": 0.3489, + "GPQA": 0.3163, + "MUSR": 0.4343, + "MMLU-PRO": 0.449 + } + }, + { + "model_id": "lkoenig/BBAI_230_Xiaqwen", + "name": "BBAI_230_Xiaqwen", + "developer": "lkoenig", + "scores": { + "IFEval": 0.4649, + "BBH": 0.5578, + "MATH Level 5": 0.3663, + "GPQA": 0.3138, + "MUSR": 0.4422, + "MMLU-PRO": 0.4481 + } + }, + { + "model_id": "lkoenig/BBAI_375_QwenDyancabs", + "name": "BBAI_375_QwenDyancabs", + "developer": "lkoenig", + "scores": { + "IFEval": 0.4566, + "BBH": 0.5571, + "MATH Level 5": 0.3776, + "GPQA": 0.3129, + "MUSR": 0.4462, + "MMLU-PRO": 0.4476 + } + }, + { + "model_id": "lkoenig/BBAI_456_QwenKoen", + "name": "BBAI_456_QwenKoen", + "developer": "lkoenig", + "scores": { + "IFEval": 0.4529, + "BBH": 0.5553, + "MATH Level 5": 0.3686, + "GPQA": 0.3129, + "MUSR": 0.4395, + "MMLU-PRO": 0.4469 + } + }, + { + "model_id": "lkoenig/BBAI_7B_KoenQwenDyan", + "name": "BBAI_7B_KoenQwenDyan", + "developer": "lkoenig", + "scores": { + "IFEval": 0.5807, + "BBH": 0.5537, + "MATH Level 5": 0.3739, + "GPQA": 0.318, + "MUSR": 0.4369, + "MMLU-PRO": 0.446 + } + }, + { + "model_id": "lkoenig/BBAI_7B_Qwen2.5koen", + "name": "BBAI_7B_Qwen2.5koen", + "developer": "lkoenig", + "scores": { + "IFEval": 0.46, + "BBH": 0.5544, + "MATH Level 5": 0.3656, + "GPQA": 0.3129, + "MUSR": 0.4369, + "MMLU-PRO": 0.4485 + } + }, + { + "model_id": "lkoenig/BBAI_7B_QwenDyanKoenLo", + "name": "BBAI_7B_QwenDyanKoenLo", + "developer": "lkoenig", + "scores": { + "IFEval": 0.4663, + "BBH": 0.5562, + "MATH Level 5": 0.364, + "GPQA": 0.3188, + "MUSR": 0.4343, + "MMLU-PRO": 0.4465 + } + }, + { + "model_id": "lkoenig/BBAI_7B_QwenDyancabsLAW", + "name": "BBAI_7B_QwenDyancabsLAW", + "developer": "lkoenig", + "scores": { + "IFEval": 0.555, + "BBH": 0.5579, + "MATH Level 5": 0.3678, + "GPQA": 0.3188, + "MUSR": 0.4461, + "MMLU-PRO": 0.4471 + } + }, + { + "model_id": "llmat/Mistral-v0.3-7B-ORPO", + "name": "Mistral-v0.3-7B-ORPO", + "developer": "llmat", + "scores": { + "IFEval": 0.364, + "BBH": 0.4005, + "MATH Level 5": 0.0015, + "GPQA": 0.2693, + "MUSR": 0.3529, + "MMLU-PRO": 0.2301 + } + }, + { + "model_id": "llnYou/ECE-PRYMMAL-YL-1B-SLERP-V5", + "name": "ECE-PRYMMAL-YL-1B-SLERP-V5", + "developer": "llnYou", + "scores": { + "IFEval": 0.3313, + "BBH": 0.4233, + "MATH Level 5": 0.111, + "GPQA": 0.2861, + "MUSR": 0.3868, + "MMLU-PRO": 0.2931 + } + }, + { + "model_id": "llnYou/ECE-PRYMMAL-YL-1B-SLERP-V6", + "name": "ECE-PRYMMAL-YL-1B-SLERP-V6", + "developer": "llnYou", + "scores": { + "IFEval": 0.1388, + "BBH": 0.3944, + "MATH Level 5": 0.0023, + "GPQA": 0.2903, + "MUSR": 0.3928, + "MMLU-PRO": 0.235 + } + }, + { + "model_id": "llnYou/ECE-PRYMMAL-YL-3B-SLERP-V1", + "name": "ECE-PRYMMAL-YL-3B-SLERP-V1", + "developer": "llnYou", + "scores": { + "IFEval": 0.2346, + "BBH": 0.4018, + "MATH Level 5": 0.0091, + "GPQA": 0.2936, + "MUSR": 0.3364, + "MMLU-PRO": 0.285 + } + }, + { + "model_id": "llnYou/ECE-PRYMMAL-YL-3B-SLERP-V2", + "name": "ECE-PRYMMAL-YL-3B-SLERP-V2", + "developer": "llnYou", + "scores": { + "IFEval": 0.2309, + "BBH": 0.399, + "MATH Level 5": 0.0128, + "GPQA": 0.2768, + "MUSR": 0.3588, + "MMLU-PRO": 0.29 + } + }, + { + "model_id": "llnYou/ECE-PRYMMAL-YL-3B-SLERP-V3", + "name": "ECE-PRYMMAL-YL-3B-SLERP-V3", + "developer": "llnYou", + "scores": { + "IFEval": 0.3581, + "BBH": 0.5473, + "MATH Level 5": 0.1299, + "GPQA": 0.3045, + "MUSR": 0.4361, + "MMLU-PRO": 0.4043 + } + }, + { + "model_id": "lmsys/vicuna-13b-v1.3", + "name": "vicuna-13b-v1.3", + "developer": "lmsys", + "scores": { + "IFEval": 0.3344, + "BBH": 0.3384, + "MATH Level 5": 0.0144, + "GPQA": 0.2676, + "MUSR": 0.3727, + "MMLU-PRO": 0.2243 + } + }, + { + "model_id": "lmsys/vicuna-7b-v1.3", + "name": "vicuna-7b-v1.3", + "developer": "lmsys", + "scores": { + "IFEval": 0.2909, + "BBH": 0.3298, + "MATH Level 5": 0.0128, + "GPQA": 0.2424, + "MUSR": 0.3793, + "MMLU-PRO": 0.1838 + } + }, + { + "model_id": "lmsys/vicuna-7b-v1.5", + "name": "vicuna-7b-v1.5", + "developer": "lmsys", + "scores": { + "IFEval": 0.2352, + "BBH": 0.3947, + "MATH Level 5": 0.0136, + "GPQA": 0.2584, + "MUSR": 0.4231, + "MMLU-PRO": 0.2147 + } + }, + { + "model_id": "lodrick-the-lafted/llama-3.1-8b-instruct-ortho-v7", + "name": "llama-3.1-8b-instruct-ortho-v7", + "developer": "lodrick-the-lafted", + "scores": { + "IFEval": 0.3515, + "BBH": 0.3907, + "MATH Level 5": 0.0272, + "GPQA": 0.2727, + "MUSR": 0.3616, + "MMLU-PRO": 0.1974 + } + }, + { + "model_id": "lordjia/Llama-3-Cantonese-8B-Instruct", + "name": "Llama-3-Cantonese-8B-Instruct", + "developer": "lordjia", + "scores": { + "IFEval": 0.6669, + "BBH": 0.4814, + "MATH Level 5": 0.0891, + "GPQA": 0.2936, + "MUSR": 0.4046, + "MMLU-PRO": 0.3515 + } + }, + { + "model_id": "lordjia/Qwen2-Cantonese-7B-Instruct", + "name": "Qwen2-Cantonese-7B-Instruct", + "developer": "lordjia", + "scores": { + "IFEval": 0.5435, + "BBH": 0.5215, + "MATH Level 5": 0.256, + "GPQA": 0.2953, + "MUSR": 0.4004, + "MMLU-PRO": 0.3843 + } + }, + { + "model_id": "lt-asset/nova-1.3b", + "name": "nova-1.3b", + "developer": "lt-asset", + "scores": { + "IFEval": 0.1214, + "BBH": 0.317, + "MATH Level 5": 0.0121, + "GPQA": 0.2492, + "MUSR": 0.3698, + "MMLU-PRO": 0.1142 + } + }, + { + "model_id": "lunahr/thea-3b-50r-u1", + "name": "thea-3b-50r-u1", + "developer": "lunahr", + "scores": { + "IFEval": 0.603, + "BBH": 0.4105, + "MATH Level 5": 0.1042, + "GPQA": 0.2836, + "MUSR": 0.3182, + "MMLU-PRO": 0.2808 + } + }, + { + "model_id": "lunahr/thea-v2-3b-50r", + "name": "thea-v2-3b-50r", + "developer": "lunahr", + "scores": { + "IFEval": 0.3704, + "BBH": 0.4194, + "MATH Level 5": 0.0242, + "GPQA": 0.2609, + "MUSR": 0.3222, + "MMLU-PRO": 0.2409 + } + }, + { + "model_id": "m42-health/Llama3-Med42-70B", + "name": "Llama3-Med42-70B", + "developer": "m42-health", + "scores": { + "IFEval": 0.6291, + "BBH": 0.6688, + "MATH Level 5": 0.2258, + "GPQA": 0.3473, + "MUSR": 0.4629, + "MMLU-PRO": 0.4963 + } + }, + { + "model_id": "macadeliccc/Samantha-Qwen-2-7B", + "name": "Samantha-Qwen-2-7B", + "developer": "macadeliccc", + "scores": { + "IFEval": 0.4377, + "BBH": 0.5082, + "MATH Level 5": 0.2115, + "GPQA": 0.2727, + "MUSR": 0.4799, + "MMLU-PRO": 0.3779 + } + }, + { + "model_id": "macadeliccc/magistrate-3.2-3b-base", + "name": "magistrate-3.2-3b-base", + "developer": "macadeliccc", + "scores": { + "IFEval": 0.1159, + "BBH": 0.3343, + "MATH Level 5": 0.0113, + "GPQA": 0.2609, + "MUSR": 0.3976, + "MMLU-PRO": 0.1689 + } + }, + { + "model_id": "macadeliccc/magistrate-3.2-3b-it", + "name": "magistrate-3.2-3b-it", + "developer": "macadeliccc", + "scores": { + "IFEval": 0.2292, + "BBH": 0.3257, + "MATH Level 5": 0.0196, + "GPQA": 0.2475, + "MUSR": 0.3763, + "MMLU-PRO": 0.1592 + } + }, + { + "model_id": "magnifi/Phi3_intent_v56_3_w_unknown_5_lr_0.002", + "name": "Phi3_intent_v56_3_w_unknown_5_lr_0.002", + "developer": "magnifi", + "scores": { + "IFEval": 0.2018, + "BBH": 0.3282, + "MATH Level 5": 0.0, + "GPQA": 0.2643, + "MUSR": 0.4123, + "MMLU-PRO": 0.1472 + } + }, + { + "model_id": "maldv/Awqward2.5-32B-Instruct", + "name": "Awqward2.5-32B-Instruct", + "developer": "maldv", + "scores": { + "IFEval": 0.8255, + "BBH": 0.6974, + "MATH Level 5": 0.6231, + "GPQA": 0.3406, + "MUSR": 0.4275, + "MMLU-PRO": 0.5723 + } + }, + { + "model_id": "maldv/Lytta2.5-32B-Instruct", + "name": "Lytta2.5-32B-Instruct", + "developer": "maldv", + "scores": { + "IFEval": 0.2508, + "BBH": 0.56, + "MATH Level 5": 0.3444, + "GPQA": 0.2668, + "MUSR": 0.3769, + "MMLU-PRO": 0.5048 + } + }, + { + "model_id": "maldv/Qwentile2.5-32B-Instruct", + "name": "Qwentile2.5-32B-Instruct", + "developer": "maldv", + "scores": { + "IFEval": 0.7393, + "BBH": 0.6963, + "MATH Level 5": 0.5219, + "GPQA": 0.3842, + "MUSR": 0.4682, + "MMLU-PRO": 0.5879 + } + }, + { + "model_id": "maldv/badger-kappa-llama-3-8b", + "name": "badger-kappa-llama-3-8b", + "developer": "maldv", + "scores": { + "IFEval": 0.4695, + "BBH": 0.5085, + "MATH Level 5": 0.0861, + "GPQA": 0.3029, + "MUSR": 0.3765, + "MMLU-PRO": 0.3695 + } + }, + { + "model_id": "maldv/badger-lambda-llama-3-8b", + "name": "badger-lambda-llama-3-8b", + "developer": "maldv", + "scores": { + "IFEval": 0.4861, + "BBH": 0.4963, + "MATH Level 5": 0.0944, + "GPQA": 0.2819, + "MUSR": 0.3754, + "MMLU-PRO": 0.3767 + } + }, + { + "model_id": "maldv/badger-mu-llama-3-8b", + "name": "badger-mu-llama-3-8b", + "developer": "maldv", + "scores": { + "IFEval": 0.4919, + "BBH": 0.5143, + "MATH Level 5": 0.0559, + "GPQA": 0.2592, + "MUSR": 0.3555, + "MMLU-PRO": 0.3674 + } + }, + { + "model_id": "maldv/badger-writer-llama-3-8b", + "name": "badger-writer-llama-3-8b", + "developer": "maldv", + "scores": { + "IFEval": 0.5303, + "BBH": 0.4864, + "MATH Level 5": 0.0755, + "GPQA": 0.2894, + "MUSR": 0.3581, + "MMLU-PRO": 0.376 + } + }, + { + "model_id": "marcuscedricridia/Cheng-1", + "name": "Cheng-1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7789, + "BBH": 0.5525, + "MATH Level 5": 0.4894, + "GPQA": 0.2961, + "MUSR": 0.4073, + "MMLU-PRO": 0.4349 + } + }, + { + "model_id": "marcuscedricridia/Cheng-2", + "name": "Cheng-2", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.8337, + "BBH": 0.6499, + "MATH Level 5": 0.5438, + "GPQA": 0.3456, + "MUSR": 0.4193, + "MMLU-PRO": 0.5013 + } + }, + { + "model_id": "marcuscedricridia/Cheng-2-v1.1", + "name": "Cheng-2-v1.1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.827, + "BBH": 0.651, + "MATH Level 5": 0.5393, + "GPQA": 0.3431, + "MUSR": 0.4167, + "MMLU-PRO": 0.5076 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-MST", + "name": "Hush-Qwen2.5-7B-MST", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7488, + "BBH": 0.5458, + "MATH Level 5": 0.4245, + "GPQA": 0.3037, + "MUSR": 0.3914, + "MMLU-PRO": 0.4163 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-MST-v1.1", + "name": "Hush-Qwen2.5-7B-MST-v1.1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7445, + "BBH": 0.5559, + "MATH Level 5": 0.4653, + "GPQA": 0.3062, + "MUSR": 0.4073, + "MMLU-PRO": 0.4299 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-MST-v1.3", + "name": "Hush-Qwen2.5-7B-MST-v1.3", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7043, + "BBH": 0.5516, + "MATH Level 5": 0.4758, + "GPQA": 0.3146, + "MUSR": 0.4311, + "MMLU-PRO": 0.444 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-Preview", + "name": "Hush-Qwen2.5-7B-Preview", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7962, + "BBH": 0.5431, + "MATH Level 5": 0.3754, + "GPQA": 0.3112, + "MUSR": 0.4298, + "MMLU-PRO": 0.4364 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-RP-v1.4-1M", + "name": "Hush-Qwen2.5-7B-RP-v1.4-1M", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7728, + "BBH": 0.5295, + "MATH Level 5": 0.3369, + "GPQA": 0.2987, + "MUSR": 0.4433, + "MMLU-PRO": 0.4135 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-v1.1", + "name": "Hush-Qwen2.5-7B-v1.1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7889, + "BBH": 0.5384, + "MATH Level 5": 0.4381, + "GPQA": 0.3163, + "MUSR": 0.4179, + "MMLU-PRO": 0.4227 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-v1.2", + "name": "Hush-Qwen2.5-7B-v1.2", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7865, + "BBH": 0.5403, + "MATH Level 5": 0.4403, + "GPQA": 0.3146, + "MUSR": 0.4219, + "MMLU-PRO": 0.4197 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-v1.3", + "name": "Hush-Qwen2.5-7B-v1.3", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7856, + "BBH": 0.5327, + "MATH Level 5": 0.3323, + "GPQA": 0.3121, + "MUSR": 0.4246, + "MMLU-PRO": 0.4345 + } + }, + { + "model_id": "marcuscedricridia/Hush-Qwen2.5-7B-v1.4", + "name": "Hush-Qwen2.5-7B-v1.4", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7835, + "BBH": 0.5423, + "MATH Level 5": 0.426, + "GPQA": 0.3112, + "MUSR": 0.4232, + "MMLU-PRO": 0.4195 + } + }, + { + "model_id": "marcuscedricridia/Qwen2.5-7B-Preview", + "name": "Qwen2.5-7B-Preview", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7679, + "BBH": 0.536, + "MATH Level 5": 0.3444, + "GPQA": 0.3238, + "MUSR": 0.414, + "MMLU-PRO": 0.4258 + } + }, + { + "model_id": "marcuscedricridia/Yell-Qwen2.5-7B-Preview", + "name": "Yell-Qwen2.5-7B-Preview", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.5839, + "BBH": 0.5371, + "MATH Level 5": 0.1926, + "GPQA": 0.281, + "MUSR": 0.4046, + "MMLU-PRO": 0.3798 + } + }, + { + "model_id": "marcuscedricridia/Yell-Qwen2.5-7B-Preview-v1.1", + "name": "Yell-Qwen2.5-7B-Preview-v1.1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.5757, + "BBH": 0.5348, + "MATH Level 5": 0.1896, + "GPQA": 0.2861, + "MUSR": 0.4059, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "marcuscedricridia/absolute-o1-7b", + "name": "absolute-o1-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7516, + "BBH": 0.5469, + "MATH Level 5": 0.5083, + "GPQA": 0.3196, + "MUSR": 0.4114, + "MMLU-PRO": 0.4413 + } + }, + { + "model_id": "marcuscedricridia/cursa-o1-7b", + "name": "cursa-o1-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7628, + "BBH": 0.5466, + "MATH Level 5": 0.4955, + "GPQA": 0.307, + "MUSR": 0.4301, + "MMLU-PRO": 0.4392 + } + }, + { + "model_id": "marcuscedricridia/cursa-o1-7b-2-28-2025", + "name": "cursa-o1-7b-2-28-2025", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7467, + "BBH": 0.5384, + "MATH Level 5": 0.4811, + "GPQA": 0.307, + "MUSR": 0.4273, + "MMLU-PRO": 0.4365 + } + }, + { + "model_id": "marcuscedricridia/cursa-o1-7b-v1.1", + "name": "cursa-o1-7b-v1.1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7528, + "BBH": 0.5493, + "MATH Level 5": 0.4985, + "GPQA": 0.307, + "MUSR": 0.4259, + "MMLU-PRO": 0.4392 + } + }, + { + "model_id": "marcuscedricridia/cursa-o1-7b-v1.2-normalize-false", + "name": "cursa-o1-7b-v1.2-normalize-false", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7616, + "BBH": 0.5492, + "MATH Level 5": 0.4992, + "GPQA": 0.307, + "MUSR": 0.4273, + "MMLU-PRO": 0.4436 + } + }, + { + "model_id": "marcuscedricridia/cursor-o1-7b", + "name": "cursor-o1-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.4107, + "BBH": 0.5007, + "MATH Level 5": 0.1412, + "GPQA": 0.281, + "MUSR": 0.4101, + "MMLU-PRO": 0.3251 + } + }, + { + "model_id": "marcuscedricridia/cursorr-o1.2-7b", + "name": "cursorr-o1.2-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.166, + "BBH": 0.3068, + "MATH Level 5": 0.0, + "GPQA": 0.2542, + "MUSR": 0.3538, + "MMLU-PRO": 0.108 + } + }, + { + "model_id": "marcuscedricridia/etr1o-explicit-v1.1", + "name": "etr1o-explicit-v1.1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.288, + "BBH": 0.3132, + "MATH Level 5": 0.0045, + "GPQA": 0.2777, + "MUSR": 0.4111, + "MMLU-PRO": 0.1195 + } + }, + { + "model_id": "marcuscedricridia/etr1o-explicit-v1.2", + "name": "etr1o-explicit-v1.2", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.1504, + "BBH": 0.295, + "MATH Level 5": 0.0, + "GPQA": 0.2609, + "MUSR": 0.4031, + "MMLU-PRO": 0.1126 + } + }, + { + "model_id": "marcuscedricridia/etr1o-v1.1", + "name": "etr1o-v1.1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.1597, + "BBH": 0.31, + "MATH Level 5": 0.0, + "GPQA": 0.2567, + "MUSR": 0.4017, + "MMLU-PRO": 0.1157 + } + }, + { + "model_id": "marcuscedricridia/etr1o-v1.2", + "name": "etr1o-v1.2", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7287, + "BBH": 0.6349, + "MATH Level 5": 0.3588, + "GPQA": 0.3758, + "MUSR": 0.4714, + "MMLU-PRO": 0.5316 + } + }, + { + "model_id": "marcuscedricridia/fan-o1-7b", + "name": "fan-o1-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.4456, + "BBH": 0.4849, + "MATH Level 5": 0.1616, + "GPQA": 0.2844, + "MUSR": 0.3834, + "MMLU-PRO": 0.3274 + } + }, + { + "model_id": "marcuscedricridia/olmner-7b", + "name": "olmner-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7254, + "BBH": 0.5472, + "MATH Level 5": 0.463, + "GPQA": 0.3079, + "MUSR": 0.438, + "MMLU-PRO": 0.4309 + } + }, + { + "model_id": "marcuscedricridia/olmner-della-7b", + "name": "olmner-della-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7637, + "BBH": 0.5491, + "MATH Level 5": 0.4962, + "GPQA": 0.3012, + "MUSR": 0.4208, + "MMLU-PRO": 0.4386 + } + }, + { + "model_id": "marcuscedricridia/olmner-o1-7b", + "name": "olmner-o1-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7528, + "BBH": 0.5481, + "MATH Level 5": 0.4924, + "GPQA": 0.3012, + "MUSR": 0.4299, + "MMLU-PRO": 0.4386 + } + }, + { + "model_id": "marcuscedricridia/olmner-sbr-7b", + "name": "olmner-sbr-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.76, + "BBH": 0.5462, + "MATH Level 5": 0.4947, + "GPQA": 0.3087, + "MUSR": 0.4154, + "MMLU-PRO": 0.4412 + } + }, + { + "model_id": "marcuscedricridia/post-cursa-o1", + "name": "post-cursa-o1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7628, + "BBH": 0.548, + "MATH Level 5": 0.4872, + "GPQA": 0.3096, + "MUSR": 0.4351, + "MMLU-PRO": 0.4361 + } + }, + { + "model_id": "marcuscedricridia/pre-cursa-o1", + "name": "pre-cursa-o1", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7409, + "BBH": 0.5462, + "MATH Level 5": 0.5038, + "GPQA": 0.3096, + "MUSR": 0.426, + "MMLU-PRO": 0.4424 + } + }, + { + "model_id": "marcuscedricridia/pre-cursa-o1-v1.2", + "name": "pre-cursa-o1-v1.2", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7549, + "BBH": 0.5487, + "MATH Level 5": 0.5068, + "GPQA": 0.3129, + "MUSR": 0.4272, + "MMLU-PRO": 0.4402 + } + }, + { + "model_id": "marcuscedricridia/pre-cursa-o1-v1.3", + "name": "pre-cursa-o1-v1.3", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7507, + "BBH": 0.5455, + "MATH Level 5": 0.5076, + "GPQA": 0.3129, + "MUSR": 0.4271, + "MMLU-PRO": 0.442 + } + }, + { + "model_id": "marcuscedricridia/pre-cursa-o1-v1.4", + "name": "pre-cursa-o1-v1.4", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7488, + "BBH": 0.5493, + "MATH Level 5": 0.4834, + "GPQA": 0.3054, + "MUSR": 0.4285, + "MMLU-PRO": 0.4436 + } + }, + { + "model_id": "marcuscedricridia/pre-cursa-o1-v1.6", + "name": "pre-cursa-o1-v1.6", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7528, + "BBH": 0.5473, + "MATH Level 5": 0.5, + "GPQA": 0.3205, + "MUSR": 0.4234, + "MMLU-PRO": 0.4413 + } + }, + { + "model_id": "marcuscedricridia/r1o-et", + "name": "r1o-et", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.3597, + "BBH": 0.4209, + "MATH Level 5": 0.0793, + "GPQA": 0.2727, + "MUSR": 0.3579, + "MMLU-PRO": 0.258 + } + }, + { + "model_id": "marcuscedricridia/sbr-o1-7b", + "name": "sbr-o1-7b", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.7455, + "BBH": 0.5479, + "MATH Level 5": 0.4985, + "GPQA": 0.3104, + "MUSR": 0.4404, + "MMLU-PRO": 0.4355 + } + }, + { + "model_id": "marcuscedricridia/stray-r1o-et", + "name": "stray-r1o-et", + "developer": "marcuscedricridia", + "scores": { + "IFEval": 0.1562, + "BBH": 0.2967, + "MATH Level 5": 0.0045, + "GPQA": 0.2617, + "MUSR": 0.4086, + "MMLU-PRO": 0.1094 + } + }, + { + "model_id": "matouLeLoup/ECE-PRYMMAL-0.5B-FT-EnhancedMUSREnsembleV3", + "name": "ECE-PRYMMAL-0.5B-FT-EnhancedMUSREnsembleV3", + "developer": "matouLeLoup", + "scores": { + "IFEval": 0.1873, + "BBH": 0.3239, + "MATH Level 5": 0.0264, + "GPQA": 0.2609, + "MUSR": 0.3752, + "MMLU-PRO": 0.172 + } + }, + { + "model_id": "matouLeLoup/ECE-PRYMMAL-0.5B-FT-MUSR-ENSEMBLE-V2Mathis", + "name": "ECE-PRYMMAL-0.5B-FT-MUSR-ENSEMBLE-V2Mathis", + "developer": "matouLeLoup", + "scores": { + "IFEval": 0.1873, + "BBH": 0.3239, + "MATH Level 5": 0.0264, + "GPQA": 0.2609, + "MUSR": 0.3752, + "MMLU-PRO": 0.172 + } + }, + { + "model_id": "matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-ENSEMBLE-Mathis", + "name": "ECE-PRYMMAL-0.5B-FT-V4-MUSR-ENSEMBLE-Mathis", + "developer": "matouLeLoup", + "scores": { + "IFEval": 0.1873, + "BBH": 0.3239, + "MATH Level 5": 0.0264, + "GPQA": 0.2609, + "MUSR": 0.3752, + "MMLU-PRO": 0.172 + } + }, + { + "model_id": "matouLeLoup/ECE-PRYMMAL-0.5B-FT-V4-MUSR-Mathis", + "name": "ECE-PRYMMAL-0.5B-FT-V4-MUSR-Mathis", + "developer": "matouLeLoup", + "scores": { + "IFEval": 0.1882, + "BBH": 0.3233, + "MATH Level 5": 0.0272, + "GPQA": 0.2634, + "MUSR": 0.3685, + "MMLU-PRO": 0.172 + } + }, + { + "model_id": "matouLeLoup/ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis", + "name": "ECE-PRYMMAL-0.5B-FT-V5-MUSR-Mathis", + "developer": "matouLeLoup", + "scores": { + "IFEval": 0.1652, + "BBH": 0.3024, + "MATH Level 5": 0.0189, + "GPQA": 0.2567, + "MUSR": 0.4273, + "MMLU-PRO": 0.1116 + } + }, + { + "model_id": "mattshumer/Reflection-Llama-3.1-70B", + "name": "Reflection-Llama-3.1-70B", + "developer": "mattshumer", + "scores": { + "IFEval": 0.0045, + "BBH": 0.645, + "MATH Level 5": 0.2145, + "GPQA": 0.3633, + "MUSR": 0.4577, + "MMLU-PRO": 0.4955 + } + }, + { + "model_id": "mattshumer/ref_70_e3", + "name": "ref_70_e3", + "developer": "mattshumer", + "scores": { + "IFEval": 0.6294, + "BBH": 0.6501, + "MATH Level 5": 0.2795, + "GPQA": 0.3356, + "MUSR": 0.4328, + "MMLU-PRO": 0.5303 + } + }, + { + "model_id": "maywell/Qwen2-7B-Multilingual-RP", + "name": "Qwen2-7B-Multilingual-RP", + "developer": "maywell", + "scores": { + "IFEval": 0.4347, + "BBH": 0.5062, + "MATH Level 5": 0.2243, + "GPQA": 0.297, + "MUSR": 0.3696, + "MMLU-PRO": 0.3859 + } + }, + { + "model_id": "meditsolutions/Llama-3.1-MedIT-SUN-8B", + "name": "Llama-3.1-MedIT-SUN-8B", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.7837, + "BBH": 0.5187, + "MATH Level 5": 0.2092, + "GPQA": 0.3087, + "MUSR": 0.4056, + "MMLU-PRO": 0.3916 + } + }, + { + "model_id": "meditsolutions/Llama-3.2-SUN-1B-Instruct", + "name": "Llama-3.2-SUN-1B-Instruct", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.6413, + "BBH": 0.3474, + "MATH Level 5": 0.071, + "GPQA": 0.2424, + "MUSR": 0.3514, + "MMLU-PRO": 0.1781 + } + }, + { + "model_id": "meditsolutions/Llama-3.2-SUN-1B-chat", + "name": "Llama-3.2-SUN-1B-chat", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.5482, + "BBH": 0.3514, + "MATH Level 5": 0.0642, + "GPQA": 0.2617, + "MUSR": 0.3249, + "MMLU-PRO": 0.1838 + } + }, + { + "model_id": "meditsolutions/Llama-3.2-SUN-2.4B-checkpoint-26000", + "name": "Llama-3.2-SUN-2.4B-checkpoint-26000", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.2814, + "BBH": 0.3018, + "MATH Level 5": 0.0181, + "GPQA": 0.2777, + "MUSR": 0.4103, + "MMLU-PRO": 0.1345 + } + }, + { + "model_id": "meditsolutions/Llama-3.2-SUN-2.4B-checkpoint-34800", + "name": "Llama-3.2-SUN-2.4B-checkpoint-34800", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.2501, + "BBH": 0.3161, + "MATH Level 5": 0.0106, + "GPQA": 0.2861, + "MUSR": 0.4022, + "MMLU-PRO": 0.1357 + } + }, + { + "model_id": "meditsolutions/Llama-3.2-SUN-2.4B-v1.0.0", + "name": "Llama-3.2-SUN-2.4B-v1.0.0", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.5637, + "BBH": 0.3391, + "MATH Level 5": 0.0627, + "GPQA": 0.2576, + "MUSR": 0.3209, + "MMLU-PRO": 0.1543 + } + }, + { + "model_id": "meditsolutions/Llama-3.2-SUN-2.5B-chat", + "name": "Llama-3.2-SUN-2.5B-chat", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.5604, + "BBH": 0.3575, + "MATH Level 5": 0.071, + "GPQA": 0.2592, + "MUSR": 0.3155, + "MMLU-PRO": 0.1813 + } + }, + { + "model_id": "meditsolutions/Llama-3.2-SUN-HDIC-1B-Instruct", + "name": "Llama-3.2-SUN-HDIC-1B-Instruct", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.6827, + "BBH": 0.3508, + "MATH Level 5": 0.0619, + "GPQA": 0.2366, + "MUSR": 0.3594, + "MMLU-PRO": 0.1687 + } + }, + { + "model_id": "meditsolutions/MSH-Lite-7B-v1-Bielik-v2.3-Instruct-Llama-Prune", + "name": "MSH-Lite-7B-v1-Bielik-v2.3-Instruct-Llama-Prune", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.3655, + "BBH": 0.4035, + "MATH Level 5": 0.0264, + "GPQA": 0.3029, + "MUSR": 0.4253, + "MMLU-PRO": 0.219 + } + }, + { + "model_id": "meditsolutions/MSH-v1-Bielik-v2.3-Instruct-MedIT-merge", + "name": "MSH-v1-Bielik-v2.3-Instruct-MedIT-merge", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.5814, + "BBH": 0.5672, + "MATH Level 5": 0.2077, + "GPQA": 0.3456, + "MUSR": 0.4385, + "MMLU-PRO": 0.35 + } + }, + { + "model_id": "meditsolutions/MedIT-Mesh-3B-Instruct", + "name": "MedIT-Mesh-3B-Instruct", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.5814, + "BBH": 0.5576, + "MATH Level 5": 0.2032, + "GPQA": 0.3238, + "MUSR": 0.4048, + "MMLU-PRO": 0.4012 + } + }, + { + "model_id": "meditsolutions/SmolLM2-MedIT-Upscale-2B", + "name": "SmolLM2-MedIT-Upscale-2B", + "developer": "meditsolutions", + "scores": { + "IFEval": 0.6429, + "BBH": 0.3551, + "MATH Level 5": 0.0559, + "GPQA": 0.2643, + "MUSR": 0.3314, + "MMLU-PRO": 0.1971 + } + }, + { + "model_id": "meetkai/functionary-small-v3.1", + "name": "functionary-small-v3.1", + "developer": "meetkai", + "scores": { + "IFEval": 0.6275, + "BBH": 0.4982, + "MATH Level 5": 0.1571, + "GPQA": 0.2886, + "MUSR": 0.3834, + "MMLU-PRO": 0.3349 + } + }, + { + "model_id": "meraGPT/mera-mix-4x7B", + "name": "mera-mix-4x7B", + "developer": "meraGPT", + "scores": { + "IFEval": 0.4832, + "BBH": 0.4019, + "MATH Level 5": 0.0536, + "GPQA": 0.3045, + "MUSR": 0.4057, + "MMLU-PRO": 0.2748 + } + }, + { + "model_id": "mergekit-community/JAJUKA-WEWILLNEVERFORGETYOU-3B", + "name": "JAJUKA-WEWILLNEVERFORGETYOU-3B", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.4941, + "BBH": 0.437, + "MATH Level 5": 0.1246, + "GPQA": 0.2928, + "MUSR": 0.3656, + "MMLU-PRO": 0.3033 + } + }, + { + "model_id": "mergekit-community/SuperQwen-2.5-1.5B", + "name": "SuperQwen-2.5-1.5B", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.1336, + "BBH": 0.2907, + "MATH Level 5": 0.0196, + "GPQA": 0.2542, + "MUSR": 0.3355, + "MMLU-PRO": 0.1075 + } + }, + { + "model_id": "mergekit-community/VirtuosoSmall-InstructModelStock", + "name": "VirtuosoSmall-InstructModelStock", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.5238, + "BBH": 0.6518, + "MATH Level 5": 0.4094, + "GPQA": 0.3826, + "MUSR": 0.4756, + "MMLU-PRO": 0.5421 + } + }, + { + "model_id": "mergekit-community/diabolic6045_ELN-AOC-CAIN", + "name": "diabolic6045_ELN-AOC-CAIN", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.0862, + "BBH": 0.3126, + "MATH Level 5": 0.0121, + "GPQA": 0.2634, + "MUSR": 0.3658, + "MMLU-PRO": 0.1191 + } + }, + { + "model_id": "mergekit-community/mergekit-dare_ties-ajgjgea", + "name": "mergekit-dare_ties-ajgjgea", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.5263, + "BBH": 0.3495, + "MATH Level 5": 0.0642, + "GPQA": 0.2643, + "MUSR": 0.3289, + "MMLU-PRO": 0.1744 + } + }, + { + "model_id": "mergekit-community/mergekit-della-zgowfmf", + "name": "mergekit-della-zgowfmf", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.4828, + "BBH": 0.6591, + "MATH Level 5": 0.3618, + "GPQA": 0.3901, + "MUSR": 0.4834, + "MMLU-PRO": 0.5415 + } + }, + { + "model_id": "mergekit-community/mergekit-model_stock-azgztvm", + "name": "mergekit-model_stock-azgztvm", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.5062, + "BBH": 0.6543, + "MATH Level 5": 0.4373, + "GPQA": 0.3817, + "MUSR": 0.473, + "MMLU-PRO": 0.5406 + } + }, + { + "model_id": "mergekit-community/mergekit-slerp-fmrazcr", + "name": "mergekit-slerp-fmrazcr", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.4174, + "BBH": 0.5342, + "MATH Level 5": 0.1193, + "GPQA": 0.3112, + "MUSR": 0.4105, + "MMLU-PRO": 0.3777 + } + }, + { + "model_id": "mergekit-community/mergekit-ties-rraxdhv", + "name": "mergekit-ties-rraxdhv", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.1123, + "BBH": 0.5184, + "MATH Level 5": 0.04, + "GPQA": 0.3079, + "MUSR": 0.4202, + "MMLU-PRO": 0.391 + } + }, + { + "model_id": "mergekit-community/mergekit-ties-ykqemwr", + "name": "mergekit-ties-ykqemwr", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.36, + "BBH": 0.5455, + "MATH Level 5": 0.1224, + "GPQA": 0.3221, + "MUSR": 0.4198, + "MMLU-PRO": 0.3734 + } + }, + { + "model_id": "mergekit-community/sexeh_time_testing", + "name": "sexeh_time_testing", + "developer": "mergekit-community", + "scores": { + "IFEval": 0.7329, + "BBH": 0.5241, + "MATH Level 5": 0.0899, + "GPQA": 0.2911, + "MUSR": 0.3619, + "MMLU-PRO": 0.3667 + } + }, + { + "model_id": "meta-llama/Llama-2-13b-chat-hf", + "name": "Llama-2-13b-chat-hf", + "developer": "meta-llama", + "scores": { + "IFEval": 0.3985, + "BBH": 0.3343, + "MATH Level 5": 0.0136, + "GPQA": 0.2315, + "MUSR": 0.4007, + "MMLU-PRO": 0.1923 + } + }, + { + "model_id": "meta-llama/Llama-2-13b-hf", + "name": "Llama-2-13b-hf", + "developer": "meta-llama", + "scores": { + "IFEval": 0.2482, + "BBH": 0.4126, + "MATH Level 5": 0.0151, + "GPQA": 0.281, + "MUSR": 0.3538, + "MMLU-PRO": 0.2378 + } + }, + { + "model_id": "meta-llama/Llama-2-70b-chat-hf", + "name": "Llama-2-70b-chat-hf", + "developer": "meta-llama", + "scores": { + "IFEval": 0.4958, + "BBH": 0.3042, + "MATH Level 5": 0.0295, + "GPQA": 0.2643, + "MUSR": 0.3687, + "MMLU-PRO": 0.2433 + } + }, + { + "model_id": "meta-llama/Llama-2-70b-hf", + "name": "Llama-2-70b-hf", + "developer": "meta-llama", + "scores": { + "IFEval": 0.2407, + "BBH": 0.5473, + "MATH Level 5": 0.0325, + "GPQA": 0.3029, + "MUSR": 0.4124, + "MMLU-PRO": 0.3718 + } + }, + { + "model_id": "meta-llama/Llama-2-7b-chat-hf", + "name": "Llama-2-7b-chat-hf", + "developer": "meta-llama", + "scores": { + "IFEval": 0.3986, + "BBH": 0.3114, + "MATH Level 5": 0.0196, + "GPQA": 0.2534, + "MUSR": 0.3676, + "MMLU-PRO": 0.1688 + } + }, + { + "model_id": "meta-llama/Llama-2-7b-hf", + "name": "Llama-2-7b-hf", + "developer": "meta-llama", + "scores": { + "IFEval": 0.2519, + "BBH": 0.3496, + "MATH Level 5": 0.0174, + "GPQA": 0.2668, + "MUSR": 0.3701, + "MMLU-PRO": 0.1861 + } + }, + { + "model_id": "meta-llama/Llama-3.1-70B", + "name": "Llama-3.1-70B", + "developer": "meta-llama", + "scores": { + "IFEval": 0.1684, + "BBH": 0.626, + "MATH Level 5": 0.1843, + "GPQA": 0.3876, + "MUSR": 0.4572, + "MMLU-PRO": 0.4654 + } + }, + { + "model_id": "meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama-3.1-70B-Instruct", + "developer": "meta-llama", + "scores": { + "IFEval": 0.8669, + "BBH": 0.6917, + "MATH Level 5": 0.3807, + "GPQA": 0.3565, + "MUSR": 0.4581, + "MMLU-PRO": 0.5309 + } + }, + { + "model_id": "meta-llama/Llama-3.1-8B", + "name": "Llama-3.1-8B", + "developer": "meta-llama", + "scores": { + "IFEval": 0.1246, + "BBH": 0.466, + "MATH Level 5": 0.0657, + "GPQA": 0.3104, + "MUSR": 0.3812, + "MMLU-PRO": 0.3288 + } + }, + { + "model_id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama-3.1-8B-Instruct", + "developer": "meta-llama", + "scores": { + "IFEval": 0.4922, + "BBH": 0.5087, + "MATH Level 5": 0.1556, + "GPQA": 0.3154, + "MUSR": 0.3972, + "MMLU-PRO": 0.3798 + } + }, + { + "model_id": "meta-llama/Llama-3.2-1B", + "name": "Llama-3.2-1B", + "developer": "meta-llama", + "scores": { + "IFEval": 0.1478, + "BBH": 0.3115, + "MATH Level 5": 0.0121, + "GPQA": 0.2282, + "MUSR": 0.3447, + "MMLU-PRO": 0.1203 + } + }, + { + "model_id": "meta-llama/Llama-3.2-1B-Instruct", + "name": "Llama-3.2-1B-Instruct", + "developer": "meta-llama", + "scores": { + "IFEval": 0.5698, + "BBH": 0.3497, + "MATH Level 5": 0.0702, + "GPQA": 0.2752, + "MUSR": 0.3329, + "MMLU-PRO": 0.1682 + } + }, + { + "model_id": "meta-llama/Llama-3.2-3B", + "name": "Llama-3.2-3B", + "developer": "meta-llama", + "scores": { + "IFEval": 0.1337, + "BBH": 0.3905, + "MATH Level 5": 0.0189, + "GPQA": 0.2676, + "MUSR": 0.3577, + "MMLU-PRO": 0.2488 + } + }, + { + "model_id": "meta-llama/Llama-3.2-3B-Instruct", + "name": "Llama-3.2-3B-Instruct", + "developer": "meta-llama", + "scores": { + "IFEval": 0.7393, + "BBH": 0.461, + "MATH Level 5": 0.1767, + "GPQA": 0.2785, + "MUSR": 0.3529, + "MMLU-PRO": 0.3195 + } + }, + { + "model_id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "developer": "meta-llama", + "scores": { + "IFEval": 0.8998, + "BBH": 0.6919, + "MATH Level 5": 0.4834, + "GPQA": 0.3289, + "MUSR": 0.4461, + "MMLU-PRO": 0.5332 + } + }, + { + "model_id": "meta-llama/Meta-Llama-3-70B", + "name": "Meta-Llama-3-70B", + "developer": "meta-llama", + "scores": { + "IFEval": 0.1603, + "BBH": 0.6461, + "MATH Level 5": 0.1858, + "GPQA": 0.3977, + "MUSR": 0.4518, + "MMLU-PRO": 0.4709 + } + }, + { + "model_id": "meta-llama/Meta-Llama-3-70B-Instruct", + "name": "Meta-Llama-3-70B-Instruct", + "developer": "meta-llama", + "scores": { + "IFEval": 0.8099, + "BBH": 0.6547, + "MATH Level 5": 0.2447, + "GPQA": 0.2869, + "MUSR": 0.4154, + "MMLU-PRO": 0.5207 + } + }, + { + "model_id": "meta-llama/Meta-Llama-3-8B", + "name": "Meta-Llama-3-8B", + "developer": "meta-llama", + "scores": { + "IFEval": 0.1455, + "BBH": 0.4598, + "MATH Level 5": 0.0453, + "GPQA": 0.3054, + "MUSR": 0.3614, + "MMLU-PRO": 0.321 + } + }, + { + "model_id": "meta-llama/Meta-Llama-3-8B-Instruct", + "name": "Meta-Llama-3-8B-Instruct", + "developer": "meta-llama", + "scores": { + "IFEval": 0.7408, + "BBH": 0.4989, + "MATH Level 5": 0.0869, + "GPQA": 0.2592, + "MUSR": 0.3568, + "MMLU-PRO": 0.3664 + } + }, + { + "model_id": "mhl1/Qwen2.5-0.5B-cinstruct-stage1", + "name": "Qwen2.5-0.5B-cinstruct-stage1", + "developer": "mhl1", + "scores": { + "IFEval": 0.1482, + "BBH": 0.3256, + "MATH Level 5": 0.0128, + "GPQA": 0.2651, + "MUSR": 0.35, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "microsoft/DialoGPT-medium", + "name": "DialoGPT-medium", + "developer": "microsoft", + "scores": { + "IFEval": 0.1479, + "BBH": 0.3014, + "MATH Level 5": 0.0, + "GPQA": 0.2542, + "MUSR": 0.4287, + "MMLU-PRO": 0.1119 + } + }, + { + "model_id": "microsoft/Orca-2-13b", + "name": "Orca-2-13b", + "developer": "microsoft", + "scores": { + "IFEval": 0.3128, + "BBH": 0.4884, + "MATH Level 5": 0.0317, + "GPQA": 0.2802, + "MUSR": 0.513, + "MMLU-PRO": 0.2749 + } + }, + { + "model_id": "microsoft/Orca-2-7b", + "name": "Orca-2-7b", + "developer": "microsoft", + "scores": { + "IFEval": 0.2183, + "BBH": 0.4452, + "MATH Level 5": 0.0196, + "GPQA": 0.2609, + "MUSR": 0.5026, + "MMLU-PRO": 0.2319 + } + }, + { + "model_id": "microsoft/Phi-3-medium-128k-instruct", + "name": "Phi-3-medium-128k-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.604, + "BBH": 0.6382, + "MATH Level 5": 0.1918, + "GPQA": 0.3364, + "MUSR": 0.4129, + "MMLU-PRO": 0.4712 + } + }, + { + "model_id": "microsoft/Phi-3-medium-4k-instruct", + "name": "Phi-3-medium-4k-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.6423, + "BBH": 0.6412, + "MATH Level 5": 0.1956, + "GPQA": 0.3364, + "MUSR": 0.4258, + "MMLU-PRO": 0.4676 + } + }, + { + "model_id": "microsoft/Phi-3-mini-128k-instruct", + "name": "Phi-3-mini-128k-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.5976, + "BBH": 0.5575, + "MATH Level 5": 0.1405, + "GPQA": 0.318, + "MUSR": 0.3937, + "MMLU-PRO": 0.3734 + } + }, + { + "model_id": "microsoft/Phi-3-mini-4k-instruct", + "name": "Phi-3-mini-4k-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.5477, + "BBH": 0.5491, + "MATH Level 5": 0.1639, + "GPQA": 0.3322, + "MUSR": 0.4284, + "MMLU-PRO": 0.4022 + } + }, + { + "model_id": "microsoft/Phi-3-small-128k-instruct", + "name": "Phi-3-small-128k-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.6368, + "BBH": 0.6202, + "MATH Level 5": 0.2026, + "GPQA": 0.3171, + "MUSR": 0.4378, + "MMLU-PRO": 0.4491 + } + }, + { + "model_id": "microsoft/Phi-3-small-8k-instruct", + "name": "Phi-3-small-8k-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.6497, + "BBH": 0.6208, + "MATH Level 5": 0.1887, + "GPQA": 0.3121, + "MUSR": 0.4558, + "MMLU-PRO": 0.4506 + } + }, + { + "model_id": "microsoft/Phi-3.5-MoE-instruct", + "name": "Phi-3.5-MoE-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.6925, + "BBH": 0.6408, + "MATH Level 5": 0.3119, + "GPQA": 0.3557, + "MUSR": 0.4565, + "MMLU-PRO": 0.4658 + } + }, + { + "model_id": "microsoft/Phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.5775, + "BBH": 0.5518, + "MATH Level 5": 0.1964, + "GPQA": 0.3398, + "MUSR": 0.4021, + "MMLU-PRO": 0.3962 + } + }, + { + "model_id": "microsoft/Phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "developer": "microsoft", + "scores": { + "IFEval": 0.7378, + "BBH": 0.5689, + "MATH Level 5": 0.1699, + "GPQA": 0.3096, + "MUSR": 0.3873, + "MMLU-PRO": 0.3932 + } + }, + { + "model_id": "microsoft/phi-1", + "name": "phi-1", + "developer": "microsoft", + "scores": { + "IFEval": 0.2068, + "BBH": 0.3139, + "MATH Level 5": 0.0098, + "GPQA": 0.2651, + "MUSR": 0.3525, + "MMLU-PRO": 0.1162 + } + }, + { + "model_id": "microsoft/phi-1_5", + "name": "phi-1_5", + "developer": "microsoft", + "scores": { + "IFEval": 0.2033, + "BBH": 0.336, + "MATH Level 5": 0.0181, + "GPQA": 0.2676, + "MUSR": 0.3404, + "MMLU-PRO": 0.1691 + } + }, + { + "model_id": "microsoft/phi-2", + "name": "Phi-2", + "developer": "microsoft", + "scores": { + "IFEval": 0.2739, + "BBH": 0.4881, + "MATH Level 5": 0.0295, + "GPQA": 0.2718, + "MUSR": 0.4099, + "MMLU-PRO": 0.2628 + } + }, + { + "model_id": "microsoft/phi-4", + "name": "phi-4", + "developer": "microsoft", + "scores": { + "IFEval": 0.0488, + "BBH": 0.6703, + "MATH Level 5": 0.2787, + "GPQA": 0.401, + "MUSR": 0.5034, + "MMLU-PRO": 0.5295 + } + }, + { + "model_id": "migtissera/Llama-3-70B-Synthia-v3.5", + "name": "Llama-3-70B-Synthia-v3.5", + "developer": "migtissera", + "scores": { + "IFEval": 0.6076, + "BBH": 0.6489, + "MATH Level 5": 0.2115, + "GPQA": 0.3876, + "MUSR": 0.4922, + "MMLU-PRO": 0.4658 + } + }, + { + "model_id": "migtissera/Llama-3-8B-Synthia-v3.5", + "name": "Llama-3-8B-Synthia-v3.5", + "developer": "migtissera", + "scores": { + "IFEval": 0.507, + "BBH": 0.4888, + "MATH Level 5": 0.0657, + "GPQA": 0.2718, + "MUSR": 0.4044, + "MMLU-PRO": 0.303 + } + }, + { + "model_id": "migtissera/Tess-3-7B-SFT", + "name": "Tess-3-7B-SFT", + "developer": "migtissera", + "scores": { + "IFEval": 0.3946, + "BBH": 0.4607, + "MATH Level 5": 0.04, + "GPQA": 0.271, + "MUSR": 0.4113, + "MMLU-PRO": 0.3034 + } + }, + { + "model_id": "migtissera/Tess-3-Mistral-Nemo-12B", + "name": "Tess-3-Mistral-Nemo-12B", + "developer": "migtissera", + "scores": { + "IFEval": 0.3355, + "BBH": 0.4899, + "MATH Level 5": 0.0574, + "GPQA": 0.2508, + "MUSR": 0.4458, + "MMLU-PRO": 0.2565 + } + }, + { + "model_id": "migtissera/Tess-v2.5-Phi-3-medium-128k-14B", + "name": "Tess-v2.5-Phi-3-medium-128k-14B", + "developer": "migtissera", + "scores": { + "IFEval": 0.4539, + "BBH": 0.6207, + "MATH Level 5": 0.0506, + "GPQA": 0.3079, + "MUSR": 0.4113, + "MMLU-PRO": 0.3732 + } + }, + { + "model_id": "migtissera/Tess-v2.5.2-Qwen2-72B", + "name": "Tess-v2.5.2-Qwen2-72B", + "developer": "migtissera", + "scores": { + "IFEval": 0.4494, + "BBH": 0.6647, + "MATH Level 5": 0.2938, + "GPQA": 0.3507, + "MUSR": 0.4188, + "MMLU-PRO": 0.5561 + } + }, + { + "model_id": "migtissera/Trinity-2-Codestral-22B", + "name": "Trinity-2-Codestral-22B", + "developer": "migtissera", + "scores": { + "IFEval": 0.4202, + "BBH": 0.5593, + "MATH Level 5": 0.0967, + "GPQA": 0.3146, + "MUSR": 0.4111, + "MMLU-PRO": 0.3308 + } + }, + { + "model_id": "migtissera/Trinity-2-Codestral-22B-v0.2", + "name": "Trinity-2-Codestral-22B-v0.2", + "developer": "migtissera", + "scores": { + "IFEval": 0.4345, + "BBH": 0.5686, + "MATH Level 5": 0.0838, + "GPQA": 0.3003, + "MUSR": 0.4045, + "MMLU-PRO": 0.334 + } + }, + { + "model_id": "mindw96/DeepSeek-llama3.3-Bllossom-8B-DACON-LLM3", + "name": "DeepSeek-llama3.3-Bllossom-8B-DACON-LLM3", + "developer": "mindw96", + "scores": { + "IFEval": 0.1388, + "BBH": 0.3068, + "MATH Level 5": 0.0083, + "GPQA": 0.2508, + "MUSR": 0.3792, + "MMLU-PRO": 0.1106 + } + }, + { + "model_id": "minghaowu/Qwen1.5-1.8B-OpenHermes-2.5", + "name": "Qwen1.5-1.8B-OpenHermes-2.5", + "developer": "minghaowu", + "scores": { + "IFEval": 0.2778, + "BBH": 0.3375, + "MATH Level 5": 0.0242, + "GPQA": 0.2836, + "MUSR": 0.3529, + "MMLU-PRO": 0.1792 + } + }, + { + "model_id": "ministral/Ministral-3b-instruct", + "name": "Ministral-3b-instruct", + "developer": "ministral", + "scores": { + "IFEval": 0.1358, + "BBH": 0.3192, + "MATH Level 5": 0.0083, + "GPQA": 0.2517, + "MUSR": 0.3382, + "MMLU-PRO": 0.1093 + } + }, + { + "model_id": "mistral-community/Mistral-7B-v0.2", + "name": "Mistral-7B-v0.2", + "developer": "mistral-community", + "scores": { + "IFEval": 0.2266, + "BBH": 0.451, + "MATH Level 5": 0.0302, + "GPQA": 0.2919, + "MUSR": 0.4032, + "MMLU-PRO": 0.2953 + } + }, + { + "model_id": "mistral-community/Mixtral-8x22B-v0.1", + "name": "Mixtral-8x22B-v0.1", + "developer": "mistral-community", + "scores": { + "IFEval": 0.3167, + "BBH": 0.38, + "MATH Level 5": 0.1543, + "GPQA": 0.33, + "MUSR": 0.3533, + "MMLU-PRO": 0.36 + } + }, + { + "model_id": "mistral-community/mixtral-8x22B-v0.3", + "name": "mixtral-8x22B-v0.3", + "developer": "mistral-community", + "scores": { + "IFEval": 0.2583, + "BBH": 0.625, + "MATH Level 5": 0.1835, + "GPQA": 0.3775, + "MUSR": 0.4037, + "MMLU-PRO": 0.4639 + } + }, + { + "model_id": "mistralai/Codestral-22B-v0.1", + "name": "Codestral-22B-v0.1", + "developer": "mistralai", + "scores": { + "IFEval": 0.5772, + "BBH": 0.5139, + "MATH Level 5": 0.1005, + "GPQA": 0.2987, + "MUSR": 0.4187, + "MMLU-PRO": 0.3156 + } + }, + { + "model_id": "mistralai/Ministral-8B-Instruct-2410", + "name": "Ministral-8B-Instruct-2410", + "developer": "mistralai", + "scores": { + "IFEval": 0.5896, + "BBH": 0.4762, + "MATH Level 5": 0.1956, + "GPQA": 0.2844, + "MUSR": 0.4138, + "MMLU-PRO": 0.3291 + } + }, + { + "model_id": "mistralai/Mistral-7B-Instruct-v0.1", + "name": "Mistral-7B-Instruct-v0.1", + "developer": "mistralai", + "scores": { + "IFEval": 0.4487, + "BBH": 0.3355, + "MATH Level 5": 0.0227, + "GPQA": 0.25, + "MUSR": 0.3848, + "MMLU-PRO": 0.2414 + } + }, + { + "model_id": "mistralai/Mistral-7B-Instruct-v0.2", + "name": "Mistral-7B-Instruct-v0.2", + "developer": "mistralai", + "scores": { + "IFEval": 0.5496, + "BBH": 0.446, + "MATH Level 5": 0.0302, + "GPQA": 0.276, + "MUSR": 0.3966, + "MMLU-PRO": 0.2717 + } + }, + { + "model_id": "mistralai/Mistral-7B-Instruct-v0.3", + "name": "Mistral-7B-Instruct-v0.3", + "developer": "mistralai", + "scores": { + "IFEval": 0.5465, + "BBH": 0.4722, + "MATH Level 5": 0.0385, + "GPQA": 0.2794, + "MUSR": 0.3739, + "MMLU-PRO": 0.3075 + } + }, + { + "model_id": "mistralai/Mistral-7B-v0.1", + "name": "Mistral-7B-v0.1", + "developer": "mistralai", + "scores": { + "IFEval": 0.2386, + "BBH": 0.4419, + "MATH Level 5": 0.0295, + "GPQA": 0.2919, + "MUSR": 0.4139, + "MMLU-PRO": 0.3013 + } + }, + { + "model_id": "mistralai/Mistral-7B-v0.3", + "name": "Mistral-7B-v0.3", + "developer": "mistralai", + "scores": { + "IFEval": 0.2266, + "BBH": 0.4517, + "MATH Level 5": 0.0302, + "GPQA": 0.2919, + "MUSR": 0.4032, + "MMLU-PRO": 0.2953 + } + }, + { + "model_id": "mistralai/Mistral-Large-Instruct-2411", + "name": "Mistral-Large-Instruct-2411", + "developer": "mistralai", + "scores": { + "IFEval": 0.8401, + "BBH": 0.6747, + "MATH Level 5": 0.4955, + "GPQA": 0.4371, + "MUSR": 0.454, + "MMLU-PRO": 0.5562 + } + }, + { + "model_id": "mistralai/Mistral-Nemo-Base-2407", + "name": "Mistral-Nemo-Base-2407", + "developer": "mistralai", + "scores": { + "IFEval": 0.163, + "BBH": 0.5035, + "MATH Level 5": 0.0597, + "GPQA": 0.2936, + "MUSR": 0.3921, + "MMLU-PRO": 0.3472 + } + }, + { + "model_id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral-Nemo-Instruct-2407", + "developer": "mistralai", + "scores": { + "IFEval": 0.638, + "BBH": 0.5037, + "MATH Level 5": 0.1269, + "GPQA": 0.2903, + "MUSR": 0.39, + "MMLU-PRO": 0.3517 + } + }, + { + "model_id": "mistralai/Mistral-Small-24B-Base-2501", + "name": "Mistral-Small-24B-Base-2501", + "developer": "mistralai", + "scores": { + "IFEval": 0.1672, + "BBH": 0.6442, + "MATH Level 5": 0.1971, + "GPQA": 0.3876, + "MUSR": 0.4237, + "MMLU-PRO": 0.5406 + } + }, + { + "model_id": "mistralai/Mistral-Small-Instruct-2409", + "name": "Mistral-Small-Instruct-2409", + "developer": "mistralai", + "scores": { + "IFEval": 0.667, + "BBH": 0.5213, + "MATH Level 5": 0.1435, + "GPQA": 0.3238, + "MUSR": 0.3632, + "MMLU-PRO": 0.396 + } + }, + { + "model_id": "mistralai/Mixtral-8x22B-Instruct-v0.1", + "name": "Mixtral-8x22B-Instruct-v0.1", + "developer": "mistralai", + "scores": { + "IFEval": 0.7184, + "BBH": 0.6125, + "MATH Level 5": 0.1873, + "GPQA": 0.3733, + "MUSR": 0.4311, + "MMLU-PRO": 0.4483 + } + }, + { + "model_id": "mistralai/Mixtral-8x22B-v0.1", + "name": "Mixtral-8x22B-v0.1", + "developer": "mistralai", + "scores": { + "IFEval": 0.2583, + "BBH": 0.624, + "MATH Level 5": 0.1835, + "GPQA": 0.3758, + "MUSR": 0.4037, + "MMLU-PRO": 0.4639 + } + }, + { + "model_id": "mistralai/Mixtral-8x7B-Instruct-v0.1", + "name": "Mixtral-8x7B-Instruct-v0.1", + "developer": "mistralai", + "scores": { + "IFEval": 0.5599, + "BBH": 0.4962, + "MATH Level 5": 0.0914, + "GPQA": 0.3029, + "MUSR": 0.4203, + "MMLU-PRO": 0.3692 + } + }, + { + "model_id": "mistralai/Mixtral-8x7B-v0.1", + "name": "Mixtral-8x7B-v0.1", + "developer": "mistralai", + "scores": { + "IFEval": 0.2415, + "BBH": 0.5087, + "MATH Level 5": 0.102, + "GPQA": 0.3138, + "MUSR": 0.4321, + "MMLU-PRO": 0.385 + } + }, + { + "model_id": "mixtao/MixTAO-7Bx2-MoE-v8.1", + "name": "MixTAO-7Bx2-MoE-v8.1", + "developer": "mixtao", + "scores": { + "IFEval": 0.4162, + "BBH": 0.5189, + "MATH Level 5": 0.0906, + "GPQA": 0.2844, + "MUSR": 0.4463, + "MMLU-PRO": 0.3123 + } + }, + { + "model_id": "mkurman/llama-3.2-MEDIT-3B-o1", + "name": "llama-3.2-MEDIT-3B-o1", + "developer": "mkurman", + "scores": { + "IFEval": 0.4382, + "BBH": 0.44, + "MATH Level 5": 0.1307, + "GPQA": 0.2659, + "MUSR": 0.3565, + "MMLU-PRO": 0.2741 + } + }, + { + "model_id": "mkurman/phi-4-MedIT-11B-exp-1", + "name": "phi-4-MedIT-11B-exp-1", + "developer": "mkurman", + "scores": { + "IFEval": 0.5948, + "BBH": 0.5414, + "MATH Level 5": 0.0899, + "GPQA": 0.3012, + "MUSR": 0.3848, + "MMLU-PRO": 0.3825 + } + }, + { + "model_id": "mkurman/phi4-MedIT-10B-o1", + "name": "phi4-MedIT-10B-o1", + "developer": "mkurman", + "scores": { + "IFEval": 0.3463, + "BBH": 0.5198, + "MATH Level 5": 0.1148, + "GPQA": 0.2458, + "MUSR": 0.3968, + "MMLU-PRO": 0.3507 + } + }, + { + "model_id": "mkxu/llama-3-8b-instruct-fpo", + "name": "llama-3-8b-instruct-fpo", + "developer": "mkxu", + "scores": { + "IFEval": 0.679, + "BBH": 0.4959, + "MATH Level 5": 0.0733, + "GPQA": 0.2777, + "MUSR": 0.3658, + "MMLU-PRO": 0.3605 + } + }, + { + "model_id": "mkxu/llama-3-8b-po1", + "name": "llama-3-8b-po1", + "developer": "mkxu", + "scores": { + "IFEval": 0.4081, + "BBH": 0.4976, + "MATH Level 5": 0.0702, + "GPQA": 0.297, + "MUSR": 0.3804, + "MMLU-PRO": 0.3562 + } + }, + { + "model_id": "mlabonne/AlphaMonarch-7B", + "name": "AlphaMonarch-7B", + "developer": "mlabonne", + "scores": { + "IFEval": 0.4939, + "BBH": 0.4626, + "MATH Level 5": 0.0408, + "GPQA": 0.2701, + "MUSR": 0.4121, + "MMLU-PRO": 0.2473 + } + }, + { + "model_id": "mlabonne/Beyonder-4x7B-v3", + "name": "Beyonder-4x7B-v3", + "developer": "mlabonne", + "scores": { + "IFEval": 0.5608, + "BBH": 0.4671, + "MATH Level 5": 0.0536, + "GPQA": 0.2852, + "MUSR": 0.4045, + "MMLU-PRO": 0.2512 + } + }, + { + "model_id": "mlabonne/BigQwen2.5-52B-Instruct", + "name": "BigQwen2.5-52B-Instruct", + "developer": "mlabonne", + "scores": { + "IFEval": 0.7913, + "BBH": 0.7121, + "MATH Level 5": 0.5476, + "GPQA": 0.302, + "MUSR": 0.4113, + "MMLU-PRO": 0.5519 + } + }, + { + "model_id": "mlabonne/BigQwen2.5-Echo-47B-Instruct", + "name": "BigQwen2.5-Echo-47B-Instruct", + "developer": "mlabonne", + "scores": { + "IFEval": 0.7357, + "BBH": 0.6125, + "MATH Level 5": 0.4381, + "GPQA": 0.3146, + "MUSR": 0.4125, + "MMLU-PRO": 0.4734 + } + }, + { + "model_id": "mlabonne/ChimeraLlama-3-8B-v2", + "name": "ChimeraLlama-3-8B-v2", + "developer": "mlabonne", + "scores": { + "IFEval": 0.4469, + "BBH": 0.5046, + "MATH Level 5": 0.0906, + "GPQA": 0.2852, + "MUSR": 0.3791, + "MMLU-PRO": 0.3569 + } + }, + { + "model_id": "mlabonne/ChimeraLlama-3-8B-v3", + "name": "ChimeraLlama-3-8B-v3", + "developer": "mlabonne", + "scores": { + "IFEval": 0.4408, + "BBH": 0.4978, + "MATH Level 5": 0.0884, + "GPQA": 0.2919, + "MUSR": 0.4004, + "MMLU-PRO": 0.3669 + } + }, + { + "model_id": "mlabonne/Daredevil-8B", + "name": "Daredevil-8B", + "developer": "mlabonne", + "scores": { + "IFEval": 0.4548, + "BBH": 0.5194, + "MATH Level 5": 0.1065, + "GPQA": 0.3079, + "MUSR": 0.3939, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "mlabonne/Daredevil-8B-abliterated", + "name": "Daredevil-8B-abliterated", + "developer": "mlabonne", + "scores": { + "IFEval": 0.4426, + "BBH": 0.4254, + "MATH Level 5": 0.0944, + "GPQA": 0.2903, + "MUSR": 0.407, + "MMLU-PRO": 0.3701 + } + }, + { + "model_id": "mlabonne/Hermes-3-Llama-3.1-70B-lorablated", + "name": "Hermes-3-Llama-3.1-70B-lorablated", + "developer": "mlabonne", + "scores": { + "IFEval": 0.3424, + "BBH": 0.6693, + "MATH Level 5": 0.2243, + "GPQA": 0.3658, + "MUSR": 0.5029, + "MMLU-PRO": 0.4679 + } + }, + { + "model_id": "mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated", + "name": "Meta-Llama-3.1-8B-Instruct-abliterated", + "developer": "mlabonne", + "scores": { + "IFEval": 0.7329, + "BBH": 0.4874, + "MATH Level 5": 0.0687, + "GPQA": 0.2567, + "MUSR": 0.3649, + "MMLU-PRO": 0.3503 + } + }, + { + "model_id": "mlabonne/NeuralBeagle14-7B", + "name": "NeuralBeagle14-7B", + "developer": "mlabonne", + "scores": { + "IFEval": 0.4935, + "BBH": 0.4628, + "MATH Level 5": 0.0521, + "GPQA": 0.2819, + "MUSR": 0.4319, + "MMLU-PRO": 0.2601 + } + }, + { + "model_id": "mlabonne/NeuralDaredevil-8B-abliterated", + "name": "NeuralDaredevil-8B-abliterated", + "developer": "mlabonne", + "scores": { + "IFEval": 0.7561, + "BBH": 0.5111, + "MATH Level 5": 0.0906, + "GPQA": 0.3062, + "MUSR": 0.4019, + "MMLU-PRO": 0.3841 + } + }, + { + "model_id": "mlabonne/OrpoLlama-3-8B", + "name": "OrpoLlama-3-8B", + "developer": "mlabonne", + "scores": { + "IFEval": 0.3653, + "BBH": 0.4424, + "MATH Level 5": 0.0559, + "GPQA": 0.2794, + "MUSR": 0.3579, + "MMLU-PRO": 0.2705 + } + }, + { + "model_id": "mlabonne/phixtral-2x2_8", + "name": "phixtral-2x2_8", + "developer": "mlabonne", + "scores": { + "IFEval": 0.3431, + "BBH": 0.4889, + "MATH Level 5": 0.0355, + "GPQA": 0.2651, + "MUSR": 0.3644, + "MMLU-PRO": 0.2551 + } + }, + { + "model_id": "mlx-community/Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1-float32", + "name": "Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1-float32", + "developer": "mlx-community", + "scores": { + "IFEval": 0.3369, + "BBH": 0.3292, + "MATH Level 5": 0.0846, + "GPQA": 0.2576, + "MUSR": 0.3249, + "MMLU-PRO": 0.1638 + } + }, + { + "model_id": "mlx-community/Mistral-Small-24B-Instruct-2501-bf16", + "name": "Mistral-Small-24B-Instruct-2501-bf16", + "developer": "mlx-community", + "scores": { + "IFEval": 0.6283, + "BBH": 0.6713, + "MATH Level 5": 0.3225, + "GPQA": 0.3951, + "MUSR": 0.4618, + "MMLU-PRO": 0.5395 + } + }, + { + "model_id": "mmnga/Llama-3-70B-japanese-suzume-vector-v0.1", + "name": "Llama-3-70B-japanese-suzume-vector-v0.1", + "developer": "mmnga", + "scores": { + "IFEval": 0.4649, + "BBH": 0.6542, + "MATH Level 5": 0.2326, + "GPQA": 0.2861, + "MUSR": 0.4141, + "MMLU-PRO": 0.5224 + } + }, + { + "model_id": "mobiuslabsgmbh/DeepSeek-R1-ReDistill-Llama3-8B-v1.1", + "name": "DeepSeek-R1-ReDistill-Llama3-8B-v1.1", + "developer": "mobiuslabsgmbh", + "scores": { + "IFEval": 0.3704, + "BBH": 0.3473, + "MATH Level 5": 0.3285, + "GPQA": 0.271, + "MUSR": 0.3396, + "MMLU-PRO": 0.2198 + } + }, + { + "model_id": "mobiuslabsgmbh/DeepSeek-R1-ReDistill-Qwen-7B-v1.1", + "name": "DeepSeek-R1-ReDistill-Qwen-7B-v1.1", + "developer": "mobiuslabsgmbh", + "scores": { + "IFEval": 0.3473, + "BBH": 0.3698, + "MATH Level 5": 0.3497, + "GPQA": 0.2651, + "MUSR": 0.4009, + "MMLU-PRO": 0.2326 + } + }, + { + "model_id": "moeru-ai/L3.1-Moe-2x8B-v0.2", + "name": "L3.1-Moe-2x8B-v0.2", + "developer": "moeru-ai", + "scores": { + "IFEval": 0.7348, + "BBH": 0.5256, + "MATH Level 5": 0.1699, + "GPQA": 0.3003, + "MUSR": 0.4199, + "MMLU-PRO": 0.3858 + } + }, + { + "model_id": "moeru-ai/L3.1-Moe-4x8B-v0.1", + "name": "L3.1-Moe-4x8B-v0.1", + "developer": "moeru-ai", + "scores": { + "IFEval": 0.4332, + "BBH": 0.4939, + "MATH Level 5": 0.1299, + "GPQA": 0.2592, + "MUSR": 0.3609, + "MMLU-PRO": 0.3454 + } + }, + { + "model_id": "moeru-ai/L3.1-Moe-4x8B-v0.2", + "name": "L3.1-Moe-4x8B-v0.2", + "developer": "moeru-ai", + "scores": { + "IFEval": 0.5407, + "BBH": 0.4466, + "MATH Level 5": 0.1035, + "GPQA": 0.2668, + "MUSR": 0.3234, + "MMLU-PRO": 0.2763 + } + }, + { + "model_id": "monsterapi/Llama-3_1-8B-Instruct-orca-ORPO", + "name": "Llama-3_1-8B-Instruct-orca-ORPO", + "developer": "monsterapi", + "scores": { + "IFEval": 0.2273, + "BBH": 0.2865, + "MATH Level 5": 0.0, + "GPQA": 0.2492, + "MUSR": 0.3445, + "MMLU-PRO": 0.1168 + } + }, + { + "model_id": "monsterapi/gemma-2-2b-LoRA-MonsterInstruct", + "name": "gemma-2-2b-LoRA-MonsterInstruct", + "developer": "monsterapi", + "scores": { + "IFEval": 0.3903, + "BBH": 0.365, + "MATH Level 5": 0.0506, + "GPQA": 0.2701, + "MUSR": 0.3644, + "MMLU-PRO": 0.1987 + } + }, + { + "model_id": "mosaicml/mpt-7b", + "name": "mpt-7b", + "developer": "mosaicml", + "scores": { + "IFEval": 0.2152, + "BBH": 0.33, + "MATH Level 5": 0.0159, + "GPQA": 0.2601, + "MUSR": 0.3672, + "MMLU-PRO": 0.1206 + } + }, + { + "model_id": "mosama/Qwen2.5-1.5B-Instruct-CoT-Reflection", + "name": "Qwen2.5-1.5B-Instruct-CoT-Reflection", + "developer": "mosama", + "scores": { + "IFEval": 0.287, + "BBH": 0.4109, + "MATH Level 5": 0.0272, + "GPQA": 0.2617, + "MUSR": 0.3212, + "MMLU-PRO": 0.2651 + } + }, + { + "model_id": "mrdayl/OpenCogito", + "name": "OpenCogito", + "developer": "mrdayl", + "scores": { + "IFEval": 0.3934, + "BBH": 0.472, + "MATH Level 5": 0.2183, + "GPQA": 0.3003, + "MUSR": 0.424, + "MMLU-PRO": 0.3452 + } + }, + { + "model_id": "mrdayl/OpenCognito", + "name": "OpenCognito", + "developer": "mrdayl", + "scores": { + "IFEval": 0.4062, + "BBH": 0.4706, + "MATH Level 5": 0.2115, + "GPQA": 0.2978, + "MUSR": 0.4293, + "MMLU-PRO": 0.3443 + } + }, + { + "model_id": "mrdayl/OpenCognito-r1", + "name": "OpenCognito-r1", + "developer": "mrdayl", + "scores": { + "IFEval": 0.4241, + "BBH": 0.4673, + "MATH Level 5": 0.1903, + "GPQA": 0.2995, + "MUSR": 0.4241, + "MMLU-PRO": 0.3475 + } + }, + { + "model_id": "mrdayl/OpenCognito-r2", + "name": "OpenCognito-r2", + "developer": "mrdayl", + "scores": { + "IFEval": 0.3959, + "BBH": 0.4688, + "MATH Level 5": 0.2024, + "GPQA": 0.3062, + "MUSR": 0.4202, + "MMLU-PRO": 0.3462 + } + }, + { + "model_id": "mrdayl/OpenThink", + "name": "OpenThink", + "developer": "mrdayl", + "scores": { + "IFEval": 0.2054, + "BBH": 0.346, + "MATH Level 5": 0.2885, + "GPQA": 0.2827, + "MUSR": 0.3289, + "MMLU-PRO": 0.185 + } + }, + { + "model_id": "mrm8488/phi-4-14B-grpo-gsm8k-3e", + "name": "phi-4-14B-grpo-gsm8k-3e", + "developer": "mrm8488", + "scores": { + "IFEval": 0.6885, + "BBH": 0.6805, + "MATH Level 5": 0.4524, + "GPQA": 0.3356, + "MUSR": 0.3994, + "MMLU-PRO": 0.5268 + } + }, + { + "model_id": "mrm8488/phi-4-14B-grpo-limo", + "name": "phi-4-14B-grpo-limo", + "developer": "mrm8488", + "scores": { + "IFEval": 0.6812, + "BBH": 0.6785, + "MATH Level 5": 0.4569, + "GPQA": 0.3364, + "MUSR": 0.3981, + "MMLU-PRO": 0.5261 + } + }, + { + "model_id": "mukaj/Llama-3.1-Hawkish-8B", + "name": "Llama-3.1-Hawkish-8B", + "developer": "mukaj", + "scores": { + "IFEval": 0.672, + "BBH": 0.4884, + "MATH Level 5": 0.2432, + "GPQA": 0.2903, + "MUSR": 0.3967, + "MMLU-PRO": 0.3331 + } + }, + { + "model_id": "natong19/Mistral-Nemo-Instruct-2407-abliterated", + "name": "Mistral-Nemo-Instruct-2407-abliterated", + "developer": "natong19", + "scores": { + "IFEval": 0.6392, + "BBH": 0.5048, + "MATH Level 5": 0.1322, + "GPQA": 0.2869, + "MUSR": 0.4033, + "MMLU-PRO": 0.3518 + } + }, + { + "model_id": "natong19/Qwen2-7B-Instruct-abliterated", + "name": "Qwen2-7B-Instruct-abliterated", + "developer": "natong19", + "scores": { + "IFEval": 0.5837, + "BBH": 0.5553, + "MATH Level 5": 0.2764, + "GPQA": 0.3012, + "MUSR": 0.4034, + "MMLU-PRO": 0.3842 + } + }, + { + "model_id": "nazimali/Mistral-Nemo-Kurdish", + "name": "Mistral-Nemo-Kurdish", + "developer": "nazimali", + "scores": { + "IFEval": 0.3401, + "BBH": 0.5133, + "MATH Level 5": 0.0959, + "GPQA": 0.3012, + "MUSR": 0.4116, + "MMLU-PRO": 0.3235 + } + }, + { + "model_id": "nazimali/Mistral-Nemo-Kurdish-Instruct", + "name": "Mistral-Nemo-Kurdish-Instruct", + "developer": "nazimali", + "scores": { + "IFEval": 0.4964, + "BBH": 0.4699, + "MATH Level 5": 0.0045, + "GPQA": 0.2827, + "MUSR": 0.3979, + "MMLU-PRO": 0.3063 + } + }, + { + "model_id": "nbeerbower/BigKartoffel-mistral-nemo-20B", + "name": "BigKartoffel-mistral-nemo-20B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.5857, + "BBH": 0.5515, + "MATH Level 5": 0.0264, + "GPQA": 0.2869, + "MUSR": 0.428, + "MMLU-PRO": 0.353 + } + }, + { + "model_id": "nbeerbower/DoppelKartoffel-Mistral-Nemo-23B", + "name": "DoppelKartoffel-Mistral-Nemo-23B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.5191, + "BBH": 0.5218, + "MATH Level 5": 0.031, + "GPQA": 0.2752, + "MUSR": 0.3795, + "MMLU-PRO": 0.308 + } + }, + { + "model_id": "nbeerbower/DoublePotato-Mistral-Nemo-13B", + "name": "DoublePotato-Mistral-Nemo-13B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6796, + "BBH": 0.5438, + "MATH Level 5": 0.04, + "GPQA": 0.3012, + "MUSR": 0.46, + "MMLU-PRO": 0.3596 + } + }, + { + "model_id": "nbeerbower/Dumpling-Qwen2.5-1.5B", + "name": "Dumpling-Qwen2.5-1.5B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3699, + "BBH": 0.416, + "MATH Level 5": 0.1171, + "GPQA": 0.2685, + "MUSR": 0.3728, + "MMLU-PRO": 0.2772 + } + }, + { + "model_id": "nbeerbower/Dumpling-Qwen2.5-14B", + "name": "Dumpling-Qwen2.5-14B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6064, + "BBH": 0.6451, + "MATH Level 5": 0.3097, + "GPQA": 0.3012, + "MUSR": 0.4354, + "MMLU-PRO": 0.517 + } + }, + { + "model_id": "nbeerbower/Dumpling-Qwen2.5-7B-1k-r16", + "name": "Dumpling-Qwen2.5-7B-1k-r16", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.486, + "BBH": 0.5214, + "MATH Level 5": 0.2364, + "GPQA": 0.2701, + "MUSR": 0.423, + "MMLU-PRO": 0.3959 + } + }, + { + "model_id": "nbeerbower/Dumpling-Qwen2.5-7B-1k-r64-2e-5", + "name": "Dumpling-Qwen2.5-7B-1k-r64-2e-5", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.4179, + "BBH": 0.5301, + "MATH Level 5": 0.2115, + "GPQA": 0.2701, + "MUSR": 0.4486, + "MMLU-PRO": 0.4122 + } + }, + { + "model_id": "nbeerbower/EVA-abliterated-TIES-Qwen2.5-1.5B", + "name": "EVA-abliterated-TIES-Qwen2.5-1.5B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.4115, + "BBH": 0.3997, + "MATH Level 5": 0.1375, + "GPQA": 0.2651, + "MUSR": 0.3502, + "MMLU-PRO": 0.2712 + } + }, + { + "model_id": "nbeerbower/EVA-abliterated-TIES-Qwen2.5-14B", + "name": "EVA-abliterated-TIES-Qwen2.5-14B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.7836, + "BBH": 0.6372, + "MATH Level 5": 0.5045, + "GPQA": 0.3549, + "MUSR": 0.4407, + "MMLU-PRO": 0.5211 + } + }, + { + "model_id": "nbeerbower/Flammades-Mistral-Nemo-12B", + "name": "Flammades-Mistral-Nemo-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3842, + "BBH": 0.53, + "MATH Level 5": 0.0755, + "GPQA": 0.3037, + "MUSR": 0.4806, + "MMLU-PRO": 0.3661 + } + }, + { + "model_id": "nbeerbower/Gemma2-Gutenberg-Doppel-9B", + "name": "Gemma2-Gutenberg-Doppel-9B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.7171, + "BBH": 0.587, + "MATH Level 5": 0.1979, + "GPQA": 0.3297, + "MUSR": 0.4608, + "MMLU-PRO": 0.4127 + } + }, + { + "model_id": "nbeerbower/Gutensuppe-mistral-nemo-12B", + "name": "Gutensuppe-mistral-nemo-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.2916, + "BBH": 0.5487, + "MATH Level 5": 0.1329, + "GPQA": 0.3372, + "MUSR": 0.429, + "MMLU-PRO": 0.368 + } + }, + { + "model_id": "nbeerbower/Hermes2-Gutenberg2-Mistral-7B", + "name": "Hermes2-Gutenberg2-Mistral-7B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3721, + "BBH": 0.4981, + "MATH Level 5": 0.0574, + "GPQA": 0.2894, + "MUSR": 0.4623, + "MMLU-PRO": 0.2993 + } + }, + { + "model_id": "nbeerbower/Kartoffel-Deepfry-12B", + "name": "Kartoffel-Deepfry-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.5022, + "BBH": 0.5365, + "MATH Level 5": 0.0604, + "GPQA": 0.2961, + "MUSR": 0.4792, + "MMLU-PRO": 0.3582 + } + }, + { + "model_id": "nbeerbower/Llama-3.1-Nemotron-lorablated-70B", + "name": "Llama-3.1-Nemotron-lorablated-70B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.7229, + "BBH": 0.6825, + "MATH Level 5": 0.3338, + "GPQA": 0.3909, + "MUSR": 0.4682, + "MMLU-PRO": 0.5343 + } + }, + { + "model_id": "nbeerbower/Llama3.1-Gutenberg-Doppel-70B", + "name": "Llama3.1-Gutenberg-Doppel-70B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.7092, + "BBH": 0.6661, + "MATH Level 5": 0.2122, + "GPQA": 0.3448, + "MUSR": 0.4897, + "MMLU-PRO": 0.4737 + } + }, + { + "model_id": "nbeerbower/Lyra-Gutenberg-mistral-nemo-12B", + "name": "Lyra-Gutenberg-mistral-nemo-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3495, + "BBH": 0.5586, + "MATH Level 5": 0.1012, + "GPQA": 0.3339, + "MUSR": 0.4357, + "MMLU-PRO": 0.3628 + } + }, + { + "model_id": "nbeerbower/Lyra4-Gutenberg-12B", + "name": "Lyra4-Gutenberg-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.2212, + "BBH": 0.5387, + "MATH Level 5": 0.1299, + "GPQA": 0.3188, + "MUSR": 0.4038, + "MMLU-PRO": 0.3571 + } + }, + { + "model_id": "nbeerbower/Lyra4-Gutenberg2-12B", + "name": "Lyra4-Gutenberg2-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.2585, + "BBH": 0.5345, + "MATH Level 5": 0.1171, + "GPQA": 0.3129, + "MUSR": 0.3972, + "MMLU-PRO": 0.3565 + } + }, + { + "model_id": "nbeerbower/Mahou-1.5-mistral-nemo-12B-lorablated", + "name": "Mahou-1.5-mistral-nemo-12B-lorablated", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6825, + "BBH": 0.5496, + "MATH Level 5": 0.0891, + "GPQA": 0.2794, + "MUSR": 0.4522, + "MMLU-PRO": 0.3574 + } + }, + { + "model_id": "nbeerbower/Mistral-Gutenberg-Doppel-7B-FFT", + "name": "Mistral-Gutenberg-Doppel-7B-FFT", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.5717, + "BBH": 0.4076, + "MATH Level 5": 0.0249, + "GPQA": 0.2836, + "MUSR": 0.4059, + "MMLU-PRO": 0.2729 + } + }, + { + "model_id": "nbeerbower/Mistral-Nemo-Gutenberg-Doppel-12B", + "name": "Mistral-Nemo-Gutenberg-Doppel-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3567, + "BBH": 0.5275, + "MATH Level 5": 0.1216, + "GPQA": 0.3163, + "MUSR": 0.4132, + "MMLU-PRO": 0.3579 + } + }, + { + "model_id": "nbeerbower/Mistral-Nemo-Gutenberg-Doppel-12B-v2", + "name": "Mistral-Nemo-Gutenberg-Doppel-12B-v2", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6536, + "BBH": 0.5374, + "MATH Level 5": 0.1156, + "GPQA": 0.271, + "MUSR": 0.4233, + "MMLU-PRO": 0.3546 + } + }, + { + "model_id": "nbeerbower/Mistral-Nemo-Moderne-12B-FFT-experimental", + "name": "Mistral-Nemo-Moderne-12B-FFT-experimental", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3352, + "BBH": 0.5234, + "MATH Level 5": 0.077, + "GPQA": 0.281, + "MUSR": 0.3715, + "MMLU-PRO": 0.3455 + } + }, + { + "model_id": "nbeerbower/Mistral-Nemo-Prism-12B", + "name": "Mistral-Nemo-Prism-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6858, + "BBH": 0.5475, + "MATH Level 5": 0.0869, + "GPQA": 0.3079, + "MUSR": 0.4626, + "MMLU-PRO": 0.3581 + } + }, + { + "model_id": "nbeerbower/Mistral-Nemo-Prism-12B-v2", + "name": "Mistral-Nemo-Prism-12B-v2", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6974, + "BBH": 0.5492, + "MATH Level 5": 0.0891, + "GPQA": 0.3054, + "MUSR": 0.46, + "MMLU-PRO": 0.3567 + } + }, + { + "model_id": "nbeerbower/Mistral-Nemo-Prism-12B-v7", + "name": "Mistral-Nemo-Prism-12B-v7", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6962, + "BBH": 0.5521, + "MATH Level 5": 0.0869, + "GPQA": 0.2995, + "MUSR": 0.4639, + "MMLU-PRO": 0.359 + } + }, + { + "model_id": "nbeerbower/Mistral-Small-Drummer-22B", + "name": "Mistral-Small-Drummer-22B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6331, + "BBH": 0.5793, + "MATH Level 5": 0.1888, + "GPQA": 0.3431, + "MUSR": 0.4064, + "MMLU-PRO": 0.4095 + } + }, + { + "model_id": "nbeerbower/Mistral-Small-Gutenberg-Doppel-22B", + "name": "Mistral-Small-Gutenberg-Doppel-22B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.4893, + "BBH": 0.5859, + "MATH Level 5": 0.2183, + "GPQA": 0.3465, + "MUSR": 0.3971, + "MMLU-PRO": 0.4124 + } + }, + { + "model_id": "nbeerbower/Nemo-Loony-12B-experimental", + "name": "Nemo-Loony-12B-experimental", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3734, + "BBH": 0.3822, + "MATH Level 5": 0.0151, + "GPQA": 0.2701, + "MUSR": 0.3341, + "MMLU-PRO": 0.1589 + } + }, + { + "model_id": "nbeerbower/Nemoties-ChatML-12B", + "name": "Nemoties-ChatML-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6382, + "BBH": 0.547, + "MATH Level 5": 0.0785, + "GPQA": 0.297, + "MUSR": 0.4509, + "MMLU-PRO": 0.3551 + } + }, + { + "model_id": "nbeerbower/Qwen2.5-Gutenberg-Doppel-14B", + "name": "Qwen2.5-Gutenberg-Doppel-14B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.8091, + "BBH": 0.6382, + "MATH Level 5": 0.5415, + "GPQA": 0.3331, + "MUSR": 0.4101, + "MMLU-PRO": 0.4921 + } + }, + { + "model_id": "nbeerbower/SmolNemo-12B-FFT-experimental", + "name": "SmolNemo-12B-FFT-experimental", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3348, + "BBH": 0.3336, + "MATH Level 5": 0.0128, + "GPQA": 0.2601, + "MUSR": 0.3847, + "MMLU-PRO": 0.1217 + } + }, + { + "model_id": "nbeerbower/Stella-mistral-nemo-12B-v2", + "name": "Stella-mistral-nemo-12B-v2", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3274, + "BBH": 0.5484, + "MATH Level 5": 0.1163, + "GPQA": 0.3322, + "MUSR": 0.4304, + "MMLU-PRO": 0.3684 + } + }, + { + "model_id": "nbeerbower/gemma2-gutenberg-27B", + "name": "gemma2-gutenberg-27B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.2947, + "BBH": 0.3797, + "MATH Level 5": 0.0189, + "GPQA": 0.2727, + "MUSR": 0.3727, + "MMLU-PRO": 0.1982 + } + }, + { + "model_id": "nbeerbower/gemma2-gutenberg-9B", + "name": "gemma2-gutenberg-9B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.2796, + "BBH": 0.5951, + "MATH Level 5": 0.0808, + "GPQA": 0.3381, + "MUSR": 0.4595, + "MMLU-PRO": 0.4192 + } + }, + { + "model_id": "nbeerbower/llama-3-gutenberg-8B", + "name": "llama-3-gutenberg-8B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.4372, + "BBH": 0.4994, + "MATH Level 5": 0.0785, + "GPQA": 0.3012, + "MUSR": 0.4073, + "MMLU-PRO": 0.3831 + } + }, + { + "model_id": "nbeerbower/llama3.1-cc-8B", + "name": "llama3.1-cc-8B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.5068, + "BBH": 0.4871, + "MATH Level 5": 0.071, + "GPQA": 0.2852, + "MUSR": 0.3885, + "MMLU-PRO": 0.3347 + } + }, + { + "model_id": "nbeerbower/llama3.1-kartoffeldes-70B", + "name": "llama3.1-kartoffeldes-70B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.823, + "BBH": 0.6894, + "MATH Level 5": 0.3218, + "GPQA": 0.3515, + "MUSR": 0.4646, + "MMLU-PRO": 0.4988 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-bophades-12B", + "name": "mistral-nemo-bophades-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6794, + "BBH": 0.4988, + "MATH Level 5": 0.1231, + "GPQA": 0.2852, + "MUSR": 0.4178, + "MMLU-PRO": 0.3501 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-bophades3-12B", + "name": "mistral-nemo-bophades3-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6578, + "BBH": 0.5449, + "MATH Level 5": 0.0846, + "GPQA": 0.3121, + "MUSR": 0.4604, + "MMLU-PRO": 0.3371 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-cc-12B", + "name": "mistral-nemo-cc-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.1435, + "BBH": 0.5399, + "MATH Level 5": 0.0257, + "GPQA": 0.3154, + "MUSR": 0.4424, + "MMLU-PRO": 0.3598 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-gutades-12B", + "name": "mistral-nemo-gutades-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3425, + "BBH": 0.5407, + "MATH Level 5": 0.1178, + "GPQA": 0.3154, + "MUSR": 0.404, + "MMLU-PRO": 0.3561 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-gutenberg-12B", + "name": "mistral-nemo-gutenberg-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3504, + "BBH": 0.5281, + "MATH Level 5": 0.1163, + "GPQA": 0.307, + "MUSR": 0.4171, + "MMLU-PRO": 0.3562 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-gutenberg-12B-v2", + "name": "mistral-nemo-gutenberg-12B-v2", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.6203, + "BBH": 0.5397, + "MATH Level 5": 0.1088, + "GPQA": 0.2777, + "MUSR": 0.4287, + "MMLU-PRO": 0.3499 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-gutenberg-12B-v3", + "name": "mistral-nemo-gutenberg-12B-v3", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.2183, + "BBH": 0.5441, + "MATH Level 5": 0.0597, + "GPQA": 0.3146, + "MUSR": 0.445, + "MMLU-PRO": 0.3644 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-gutenberg-12B-v4", + "name": "mistral-nemo-gutenberg-12B-v4", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.2379, + "BBH": 0.5269, + "MATH Level 5": 0.1261, + "GPQA": 0.3163, + "MUSR": 0.4104, + "MMLU-PRO": 0.3575 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-gutenberg2-12B-test", + "name": "mistral-nemo-gutenberg2-12B-test", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.3385, + "BBH": 0.5255, + "MATH Level 5": 0.1163, + "GPQA": 0.3171, + "MUSR": 0.4157, + "MMLU-PRO": 0.3555 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-kartoffel-12B", + "name": "mistral-nemo-kartoffel-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.7032, + "BBH": 0.5484, + "MATH Level 5": 0.0853, + "GPQA": 0.3045, + "MUSR": 0.4653, + "MMLU-PRO": 0.3585 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-narwhal-12B", + "name": "mistral-nemo-narwhal-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.5549, + "BBH": 0.5057, + "MATH Level 5": 0.0582, + "GPQA": 0.271, + "MUSR": 0.3847, + "MMLU-PRO": 0.3483 + } + }, + { + "model_id": "nbeerbower/mistral-nemo-wissenschaft-12B", + "name": "mistral-nemo-wissenschaft-12B", + "developer": "nbeerbower", + "scores": { + "IFEval": 0.652, + "BBH": 0.504, + "MATH Level 5": 0.1216, + "GPQA": 0.2928, + "MUSR": 0.4178, + "MMLU-PRO": 0.3532 + } + }, + { + "model_id": "nbrahme/IndusQ", + "name": "IndusQ", + "developer": "nbrahme", + "scores": { + "IFEval": 0.244, + "BBH": 0.3062, + "MATH Level 5": 0.0008, + "GPQA": 0.2651, + "MUSR": 0.3366, + "MMLU-PRO": 0.112 + } + }, + { + "model_id": "necva/IE-cont-Llama3.1-8B", + "name": "IE-cont-Llama3.1-8B", + "developer": "necva", + "scores": { + "IFEval": 0.2049, + "BBH": 0.2912, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3575, + "MMLU-PRO": 0.1167 + } + }, + { + "model_id": "necva/replica-IEPile", + "name": "replica-IEPile", + "developer": "necva", + "scores": { + "IFEval": 0.4678, + "BBH": 0.4779, + "MATH Level 5": 0.1239, + "GPQA": 0.3062, + "MUSR": 0.3998, + "MMLU-PRO": 0.3561 + } + }, + { + "model_id": "neopolita/jessi-v0.1-bf16-falcon3-7b-instruct", + "name": "jessi-v0.1-bf16-falcon3-7b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7527, + "BBH": 0.5516, + "MATH Level 5": 0.3807, + "GPQA": 0.3029, + "MUSR": 0.4825, + "MMLU-PRO": 0.3924 + } + }, + { + "model_id": "neopolita/jessi-v0.1-falcon3-10b-instruct", + "name": "jessi-v0.1-falcon3-10b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7552, + "BBH": 0.5953, + "MATH Level 5": 0.2002, + "GPQA": 0.3188, + "MUSR": 0.4279, + "MMLU-PRO": 0.4188 + } + }, + { + "model_id": "neopolita/jessi-v0.1-qwen2.5-7b-instruct", + "name": "jessi-v0.1-qwen2.5-7b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7327, + "BBH": 0.5292, + "MATH Level 5": 0.4086, + "GPQA": 0.297, + "MUSR": 0.3914, + "MMLU-PRO": 0.4228 + } + }, + { + "model_id": "neopolita/jessi-v0.1-virtuoso-small", + "name": "jessi-v0.1-virtuoso-small", + "developer": "neopolita", + "scores": { + "IFEval": 0.7959, + "BBH": 0.6443, + "MATH Level 5": 0.3399, + "GPQA": 0.3305, + "MUSR": 0.4362, + "MMLU-PRO": 0.513 + } + }, + { + "model_id": "neopolita/jessi-v0.2-falcon3-10b-instruct", + "name": "jessi-v0.2-falcon3-10b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7768, + "BBH": 0.6205, + "MATH Level 5": 0.2122, + "GPQA": 0.3289, + "MUSR": 0.4281, + "MMLU-PRO": 0.4354 + } + }, + { + "model_id": "neopolita/jessi-v0.2-falcon3-7b-instruct", + "name": "jessi-v0.2-falcon3-7b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.5771, + "BBH": 0.5363, + "MATH Level 5": 0.2538, + "GPQA": 0.3171, + "MUSR": 0.4479, + "MMLU-PRO": 0.3905 + } + }, + { + "model_id": "neopolita/jessi-v0.3-falcon3-7b-instruct", + "name": "jessi-v0.3-falcon3-7b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7509, + "BBH": 0.5388, + "MATH Level 5": 0.1888, + "GPQA": 0.3196, + "MUSR": 0.4692, + "MMLU-PRO": 0.397 + } + }, + { + "model_id": "neopolita/jessi-v0.4-falcon3-7b-instruct", + "name": "jessi-v0.4-falcon3-7b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7604, + "BBH": 0.5522, + "MATH Level 5": 0.3769, + "GPQA": 0.3029, + "MUSR": 0.4971, + "MMLU-PRO": 0.4004 + } + }, + { + "model_id": "neopolita/jessi-v0.5-falcon3-7b-instruct", + "name": "jessi-v0.5-falcon3-7b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7412, + "BBH": 0.559, + "MATH Level 5": 0.3739, + "GPQA": 0.3112, + "MUSR": 0.4865, + "MMLU-PRO": 0.3966 + } + }, + { + "model_id": "neopolita/jessi-v0.6-falcon3-7b-instruct", + "name": "jessi-v0.6-falcon3-7b-instruct", + "developer": "neopolita", + "scores": { + "IFEval": 0.7402, + "BBH": 0.5509, + "MATH Level 5": 0.3565, + "GPQA": 0.3003, + "MUSR": 0.4904, + "MMLU-PRO": 0.3957 + } + }, + { + "model_id": "neopolita/loki-v0.1-virtuoso", + "name": "loki-v0.1-virtuoso", + "developer": "neopolita", + "scores": { + "IFEval": 0.7819, + "BBH": 0.6467, + "MATH Level 5": 0.3391, + "GPQA": 0.3507, + "MUSR": 0.4375, + "MMLU-PRO": 0.5129 + } + }, + { + "model_id": "netcat420/DeepSeek-R1-Distill-Qwen-MFANN-Slerp-7b", + "name": "DeepSeek-R1-Distill-Qwen-MFANN-Slerp-7b", + "developer": "netcat420", + "scores": { + "IFEval": 0.115, + "BBH": 0.2877, + "MATH Level 5": 0.0015, + "GPQA": 0.2643, + "MUSR": 0.3724, + "MMLU-PRO": 0.109 + } + }, + { + "model_id": "netcat420/DeepSeek-R1-MFANN-TIES-unretrained-7b", + "name": "DeepSeek-R1-MFANN-TIES-unretrained-7b", + "developer": "netcat420", + "scores": { + "IFEval": 0.2587, + "BBH": 0.3086, + "MATH Level 5": 0.0121, + "GPQA": 0.255, + "MUSR": 0.3527, + "MMLU-PRO": 0.1145 + } + }, + { + "model_id": "netcat420/Llama3.1-MFANN-8b", + "name": "Llama3.1-MFANN-8b", + "developer": "netcat420", + "scores": { + "IFEval": 0.297, + "BBH": 0.4281, + "MATH Level 5": 0.0295, + "GPQA": 0.2878, + "MUSR": 0.3379, + "MMLU-PRO": 0.2725 + } + }, + { + "model_id": "netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V2", + "name": "MFANN-Llama3.1-Abliterated-SLERP-TIES-V2", + "developer": "netcat420", + "scores": { + "IFEval": 0.421, + "BBH": 0.4924, + "MATH Level 5": 0.0763, + "GPQA": 0.297, + "MUSR": 0.3728, + "MMLU-PRO": 0.3522 + } + }, + { + "model_id": "netcat420/MFANN-Llama3.1-Abliterated-SLERP-TIES-V3", + "name": "MFANN-Llama3.1-Abliterated-SLERP-TIES-V3", + "developer": "netcat420", + "scores": { + "IFEval": 0.4238, + "BBH": 0.4914, + "MATH Level 5": 0.0755, + "GPQA": 0.297, + "MUSR": 0.3741, + "MMLU-PRO": 0.349 + } + }, + { + "model_id": "netcat420/MFANN-Llama3.1-Abliterated-SLERP-V4", + "name": "MFANN-Llama3.1-Abliterated-SLERP-V4", + "developer": "netcat420", + "scores": { + "IFEval": 0.4169, + "BBH": 0.4909, + "MATH Level 5": 0.068, + "GPQA": 0.3054, + "MUSR": 0.3821, + "MMLU-PRO": 0.3516 + } + }, + { + "model_id": "netcat420/MFANN-Llama3.1-Abliterated-SLERP-V5", + "name": "MFANN-Llama3.1-Abliterated-SLERP-V5", + "developer": "netcat420", + "scores": { + "IFEval": 0.4329, + "BBH": 0.4952, + "MATH Level 5": 0.0816, + "GPQA": 0.2936, + "MUSR": 0.3781, + "MMLU-PRO": 0.3445 + } + }, + { + "model_id": "netcat420/MFANN-Llama3.1-Abliterated-Slerp-TIES", + "name": "MFANN-Llama3.1-Abliterated-Slerp-TIES", + "developer": "netcat420", + "scores": { + "IFEval": 0.4293, + "BBH": 0.4968, + "MATH Level 5": 0.0665, + "GPQA": 0.2919, + "MUSR": 0.3687, + "MMLU-PRO": 0.3531 + } + }, + { + "model_id": "netcat420/MFANN-Llama3.1-Abliterated-Slerp-V3.2", + "name": "MFANN-Llama3.1-Abliterated-Slerp-V3.2", + "developer": "netcat420", + "scores": { + "IFEval": 0.4128, + "BBH": 0.4978, + "MATH Level 5": 0.0702, + "GPQA": 0.2878, + "MUSR": 0.3754, + "MMLU-PRO": 0.3527 + } + }, + { + "model_id": "netcat420/MFANN-SFT", + "name": "MFANN-SFT", + "developer": "netcat420", + "scores": { + "IFEval": 0.3682, + "BBH": 0.4852, + "MATH Level 5": 0.0597, + "GPQA": 0.3163, + "MUSR": 0.3725, + "MMLU-PRO": 0.3336 + } + }, + { + "model_id": "netcat420/MFANN-abliterated-phi2-merge-unretrained", + "name": "MFANN-abliterated-phi2-merge-unretrained", + "developer": "netcat420", + "scores": { + "IFEval": 0.3005, + "BBH": 0.4104, + "MATH Level 5": 0.0287, + "GPQA": 0.2609, + "MUSR": 0.3183, + "MMLU-PRO": 0.1478 + } + }, + { + "model_id": "netcat420/MFANN-llama3.1-Abliterated-SLERP", + "name": "MFANN-llama3.1-Abliterated-SLERP", + "developer": "netcat420", + "scores": { + "IFEval": 0.2591, + "BBH": 0.4574, + "MATH Level 5": 0.0483, + "GPQA": 0.2735, + "MUSR": 0.3809, + "MMLU-PRO": 0.2928 + } + }, + { + "model_id": "netcat420/MFANN-llama3.1-abliterated-SLERP-v3", + "name": "MFANN-llama3.1-abliterated-SLERP-v3", + "developer": "netcat420", + "scores": { + "IFEval": 0.3799, + "BBH": 0.4931, + "MATH Level 5": 0.0642, + "GPQA": 0.2911, + "MUSR": 0.366, + "MMLU-PRO": 0.3531 + } + }, + { + "model_id": "netcat420/MFANN-llama3.1-abliterated-SLERP-v3.1", + "name": "MFANN-llama3.1-abliterated-SLERP-v3.1", + "developer": "netcat420", + "scores": { + "IFEval": 0.4202, + "BBH": 0.4921, + "MATH Level 5": 0.0695, + "GPQA": 0.2928, + "MUSR": 0.3686, + "MMLU-PRO": 0.3543 + } + }, + { + "model_id": "netcat420/MFANN-llama3.1-abliterated-v2", + "name": "MFANN-llama3.1-abliterated-v2", + "developer": "netcat420", + "scores": { + "IFEval": 0.4429, + "BBH": 0.4941, + "MATH Level 5": 0.074, + "GPQA": 0.2928, + "MUSR": 0.3845, + "MMLU-PRO": 0.3491 + } + }, + { + "model_id": "netcat420/MFANN-phigments-slerp-V2", + "name": "MFANN-phigments-slerp-V2", + "developer": "netcat420", + "scores": { + "IFEval": 0.3232, + "BBH": 0.4827, + "MATH Level 5": 0.0317, + "GPQA": 0.2727, + "MUSR": 0.4037, + "MMLU-PRO": 0.2717 + } + }, + { + "model_id": "netcat420/MFANN-phigments-slerp-V3.2", + "name": "MFANN-phigments-slerp-V3.2", + "developer": "netcat420", + "scores": { + "IFEval": 0.3524, + "BBH": 0.4809, + "MATH Level 5": 0.0332, + "GPQA": 0.2836, + "MUSR": 0.3708, + "MMLU-PRO": 0.2705 + } + }, + { + "model_id": "netcat420/MFANN-phigments-slerp-V3.3", + "name": "MFANN-phigments-slerp-V3.3", + "developer": "netcat420", + "scores": { + "IFEval": 0.3691, + "BBH": 0.4895, + "MATH Level 5": 0.0332, + "GPQA": 0.2752, + "MUSR": 0.3892, + "MMLU-PRO": 0.2803 + } + }, + { + "model_id": "netcat420/MFANN3b", + "name": "MFANN3b", + "developer": "netcat420", + "scores": { + "IFEval": 0.2524, + "BBH": 0.4433, + "MATH Level 5": 0.0219, + "GPQA": 0.2919, + "MUSR": 0.3606, + "MMLU-PRO": 0.2306 + } + }, + { + "model_id": "netcat420/MFANN3bv0.15", + "name": "MFANN3bv0.15", + "developer": "netcat420", + "scores": { + "IFEval": 0.2012, + "BBH": 0.4539, + "MATH Level 5": 0.0264, + "GPQA": 0.2517, + "MUSR": 0.3958, + "MMLU-PRO": 0.2468 + } + }, + { + "model_id": "netcat420/MFANN3bv0.18", + "name": "MFANN3bv0.18", + "developer": "netcat420", + "scores": { + "IFEval": 0.2206, + "BBH": 0.4514, + "MATH Level 5": 0.0249, + "GPQA": 0.2576, + "MUSR": 0.4024, + "MMLU-PRO": 0.25 + } + }, + { + "model_id": "netcat420/MFANN3bv0.19", + "name": "MFANN3bv0.19", + "developer": "netcat420", + "scores": { + "IFEval": 0.2258, + "BBH": 0.4516, + "MATH Level 5": 0.0227, + "GPQA": 0.2576, + "MUSR": 0.4024, + "MMLU-PRO": 0.252 + } + }, + { + "model_id": "netcat420/MFANN3bv0.20", + "name": "MFANN3bv0.20", + "developer": "netcat420", + "scores": { + "IFEval": 0.2193, + "BBH": 0.4493, + "MATH Level 5": 0.0264, + "GPQA": 0.2592, + "MUSR": 0.4077, + "MMLU-PRO": 0.25 + } + }, + { + "model_id": "netcat420/MFANN3bv0.21", + "name": "MFANN3bv0.21", + "developer": "netcat420", + "scores": { + "IFEval": 0.1909, + "BBH": 0.447, + "MATH Level 5": 0.0317, + "GPQA": 0.2643, + "MUSR": 0.3759, + "MMLU-PRO": 0.2393 + } + }, + { + "model_id": "netcat420/MFANN3bv0.22", + "name": "MFANN3bv0.22", + "developer": "netcat420", + "scores": { + "IFEval": 0.1979, + "BBH": 0.4485, + "MATH Level 5": 0.0264, + "GPQA": 0.2617, + "MUSR": 0.3521, + "MMLU-PRO": 0.2517 + } + }, + { + "model_id": "netcat420/MFANN3bv0.23", + "name": "MFANN3bv0.23", + "developer": "netcat420", + "scores": { + "IFEval": 0.2048, + "BBH": 0.4495, + "MATH Level 5": 0.0249, + "GPQA": 0.2517, + "MUSR": 0.3427, + "MMLU-PRO": 0.2418 + } + }, + { + "model_id": "netcat420/MFANN3bv0.24", + "name": "MFANN3bv0.24", + "developer": "netcat420", + "scores": { + "IFEval": 0.22, + "BBH": 0.4407, + "MATH Level 5": 0.0279, + "GPQA": 0.2584, + "MUSR": 0.3521, + "MMLU-PRO": 0.2352 + } + }, + { + "model_id": "netcat420/MFANN3bv1.1", + "name": "MFANN3bv1.1", + "developer": "netcat420", + "scores": { + "IFEval": 0.2507, + "BBH": 0.3397, + "MATH Level 5": 0.0204, + "GPQA": 0.2668, + "MUSR": 0.3223, + "MMLU-PRO": 0.1159 + } + }, + { + "model_id": "netcat420/MFANN3bv1.2", + "name": "MFANN3bv1.2", + "developer": "netcat420", + "scores": { + "IFEval": 0.2686, + "BBH": 0.366, + "MATH Level 5": 0.0264, + "GPQA": 0.2634, + "MUSR": 0.3156, + "MMLU-PRO": 0.145 + } + }, + { + "model_id": "netcat420/MFANN3bv1.3", + "name": "MFANN3bv1.3", + "developer": "netcat420", + "scores": { + "IFEval": 0.2547, + "BBH": 0.4456, + "MATH Level 5": 0.0211, + "GPQA": 0.2576, + "MUSR": 0.3299, + "MMLU-PRO": 0.2276 + } + }, + { + "model_id": "netcat420/MFANN3bv1.4", + "name": "MFANN3bv1.4", + "developer": "netcat420", + "scores": { + "IFEval": 0.3524, + "BBH": 0.4809, + "MATH Level 5": 0.037, + "GPQA": 0.2827, + "MUSR": 0.3708, + "MMLU-PRO": 0.2705 + } + }, + { + "model_id": "netcat420/MFANNv0.19", + "name": "MFANNv0.19", + "developer": "netcat420", + "scores": { + "IFEval": 0.3057, + "BBH": 0.4731, + "MATH Level 5": 0.0415, + "GPQA": 0.307, + "MUSR": 0.3527, + "MMLU-PRO": 0.2473 + } + }, + { + "model_id": "netcat420/MFANNv0.20", + "name": "MFANNv0.20", + "developer": "netcat420", + "scores": { + "IFEval": 0.3479, + "BBH": 0.4574, + "MATH Level 5": 0.0498, + "GPQA": 0.2903, + "MUSR": 0.3874, + "MMLU-PRO": 0.3202 + } + }, + { + "model_id": "netcat420/MFANNv0.21", + "name": "MFANNv0.21", + "developer": "netcat420", + "scores": { + "IFEval": 0.3233, + "BBH": 0.4576, + "MATH Level 5": 0.0574, + "GPQA": 0.2785, + "MUSR": 0.3993, + "MMLU-PRO": 0.3031 + } + }, + { + "model_id": "netcat420/MFANNv0.22.1", + "name": "MFANNv0.22.1", + "developer": "netcat420", + "scores": { + "IFEval": 0.3089, + "BBH": 0.4661, + "MATH Level 5": 0.0536, + "GPQA": 0.276, + "MUSR": 0.3753, + "MMLU-PRO": 0.3343 + } + }, + { + "model_id": "netcat420/MFANNv0.23", + "name": "MFANNv0.23", + "developer": "netcat420", + "scores": { + "IFEval": 0.3127, + "BBH": 0.4898, + "MATH Level 5": 0.0498, + "GPQA": 0.2844, + "MUSR": 0.3768, + "MMLU-PRO": 0.3388 + } + }, + { + "model_id": "netcat420/MFANNv0.24", + "name": "MFANNv0.24", + "developer": "netcat420", + "scores": { + "IFEval": 0.3162, + "BBH": 0.479, + "MATH Level 5": 0.0612, + "GPQA": 0.2844, + "MUSR": 0.3754, + "MMLU-PRO": 0.3348 + } + }, + { + "model_id": "netcat420/MFANNv0.25", + "name": "MFANNv0.25", + "developer": "netcat420", + "scores": { + "IFEval": 0.3467, + "BBH": 0.4794, + "MATH Level 5": 0.0582, + "GPQA": 0.2802, + "MUSR": 0.3688, + "MMLU-PRO": 0.3343 + } + }, + { + "model_id": "netcat420/Qwen2.5-7B-nerd-uncensored-v0.9-MFANN", + "name": "Qwen2.5-7B-nerd-uncensored-v0.9-MFANN", + "developer": "netcat420", + "scores": { + "IFEval": 0.5878, + "BBH": 0.5237, + "MATH Level 5": 0.3376, + "GPQA": 0.281, + "MUSR": 0.3926, + "MMLU-PRO": 0.3904 + } + }, + { + "model_id": "netcat420/Qwen2.5-7b-MFANN-slerp", + "name": "Qwen2.5-7b-MFANN-slerp", + "developer": "netcat420", + "scores": { + "IFEval": 0.6532, + "BBH": 0.5089, + "MATH Level 5": 0.287, + "GPQA": 0.2953, + "MUSR": 0.4073, + "MMLU-PRO": 0.3417 + } + }, + { + "model_id": "netcat420/Qwen2.5-7b-nerd-uncensored-MFANN-slerp", + "name": "Qwen2.5-7b-nerd-uncensored-MFANN-slerp", + "developer": "netcat420", + "scores": { + "IFEval": 0.1564, + "BBH": 0.292, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3792, + "MMLU-PRO": 0.11 + } + }, + { + "model_id": "netcat420/Qwen2.5-Coder-Scholar-7B-Abliterated-MFANN", + "name": "Qwen2.5-Coder-Scholar-7B-Abliterated-MFANN", + "developer": "netcat420", + "scores": { + "IFEval": 0.5742, + "BBH": 0.5071, + "MATH Level 5": 0.2568, + "GPQA": 0.2928, + "MUSR": 0.4058, + "MMLU-PRO": 0.3157 + } + }, + { + "model_id": "netcat420/Qwen2.5-Coder-Scholar-7B-Abliterated-MFANN-Slerp-Unretrained", + "name": "Qwen2.5-Coder-Scholar-7B-Abliterated-MFANN-Slerp-Unretrained", + "developer": "netcat420", + "scores": { + "IFEval": 0.6486, + "BBH": 0.5066, + "MATH Level 5": 0.2991, + "GPQA": 0.2987, + "MUSR": 0.4152, + "MMLU-PRO": 0.3432 + } + }, + { + "model_id": "netcat420/Qwen2.5-DeepSeek-R1-MFANN-Slerp-7b", + "name": "Qwen2.5-DeepSeek-R1-MFANN-Slerp-7b", + "developer": "netcat420", + "scores": { + "IFEval": 0.2676, + "BBH": 0.3789, + "MATH Level 5": 0.0181, + "GPQA": 0.2324, + "MUSR": 0.3528, + "MMLU-PRO": 0.1677 + } + }, + { + "model_id": "netcat420/Qwen2.5-MFANN-7b", + "name": "Qwen2.5-MFANN-7b", + "developer": "netcat420", + "scores": { + "IFEval": 0.6097, + "BBH": 0.5054, + "MATH Level 5": 0.2787, + "GPQA": 0.2861, + "MUSR": 0.4021, + "MMLU-PRO": 0.3233 + } + }, + { + "model_id": "netcat420/qwen2.5-MFANN-7b-SLERP-V1.2", + "name": "qwen2.5-MFANN-7b-SLERP-V1.2", + "developer": "netcat420", + "scores": { + "IFEval": 0.6606, + "BBH": 0.5111, + "MATH Level 5": 0.287, + "GPQA": 0.297, + "MUSR": 0.4259, + "MMLU-PRO": 0.3438 + } + }, + { + "model_id": "netcat420/qwen2.5-MFANN-7b-SLERPv1.1", + "name": "qwen2.5-MFANN-7b-SLERPv1.1", + "developer": "netcat420", + "scores": { + "IFEval": 0.6555, + "BBH": 0.5075, + "MATH Level 5": 0.2968, + "GPQA": 0.2903, + "MUSR": 0.4126, + "MMLU-PRO": 0.3448 + } + }, + { + "model_id": "netcat420/qwen2.5-MFANN-7b-v1.1", + "name": "qwen2.5-MFANN-7b-v1.1", + "developer": "netcat420", + "scores": { + "IFEval": 0.6088, + "BBH": 0.4967, + "MATH Level 5": 0.2825, + "GPQA": 0.276, + "MUSR": 0.4114, + "MMLU-PRO": 0.3248 + } + }, + { + "model_id": "netease-youdao/Confucius-o1-14B", + "name": "Confucius-o1-14B", + "developer": "netease-youdao", + "scores": { + "IFEval": 0.6378, + "BBH": 0.63, + "MATH Level 5": 0.4313, + "GPQA": 0.3649, + "MUSR": 0.4338, + "MMLU-PRO": 0.5265 + } + }, + { + "model_id": "newsbang/Homer-7B-v0.1", + "name": "Homer-7B-v0.1", + "developer": "newsbang", + "scores": { + "IFEval": 0.6109, + "BBH": 0.5601, + "MATH Level 5": 0.386, + "GPQA": 0.3247, + "MUSR": 0.4357, + "MMLU-PRO": 0.4475 + } + }, + { + "model_id": "newsbang/Homer-7B-v0.2", + "name": "Homer-7B-v0.2", + "developer": "newsbang", + "scores": { + "IFEval": 0.7494, + "BBH": 0.5517, + "MATH Level 5": 0.2477, + "GPQA": 0.3322, + "MUSR": 0.4298, + "MMLU-PRO": 0.441 + } + }, + { + "model_id": "newsbang/Homer-v0.3-Qwen2.5-7B", + "name": "Homer-v0.3-Qwen2.5-7B", + "developer": "newsbang", + "scores": { + "IFEval": 0.5154, + "BBH": 0.5481, + "MATH Level 5": 0.3089, + "GPQA": 0.3339, + "MUSR": 0.4744, + "MMLU-PRO": 0.4456 + } + }, + { + "model_id": "newsbang/Homer-v0.4-Qwen2.5-7B", + "name": "Homer-v0.4-Qwen2.5-7B", + "developer": "newsbang", + "scores": { + "IFEval": 0.7999, + "BBH": 0.5533, + "MATH Level 5": 0.2779, + "GPQA": 0.3154, + "MUSR": 0.4311, + "MMLU-PRO": 0.4363 + } + }, + { + "model_id": "newsbang/Homer-v0.5-Qwen2.5-7B", + "name": "Homer-v0.5-Qwen2.5-7B", + "developer": "newsbang", + "scores": { + "IFEval": 0.7881, + "BBH": 0.554, + "MATH Level 5": 0.3724, + "GPQA": 0.3029, + "MUSR": 0.4193, + "MMLU-PRO": 0.4369 + } + }, + { + "model_id": "newsbang/Homer-v1.0-Qwen2.5-72B", + "name": "Homer-v1.0-Qwen2.5-72B", + "developer": "newsbang", + "scores": { + "IFEval": 0.7628, + "BBH": 0.731, + "MATH Level 5": 0.4902, + "GPQA": 0.4161, + "MUSR": 0.4677, + "MMLU-PRO": 0.6145 + } + }, + { + "model_id": "newsbang/Homer-v1.0-Qwen2.5-7B", + "name": "Homer-v1.0-Qwen2.5-7B", + "developer": "newsbang", + "scores": { + "IFEval": 0.6393, + "BBH": 0.5655, + "MATH Level 5": 0.3323, + "GPQA": 0.3221, + "MUSR": 0.4278, + "MMLU-PRO": 0.4535 + } + }, + { + "model_id": "nguyentd/FinancialAdvice-Qwen2.5-7B", + "name": "FinancialAdvice-Qwen2.5-7B", + "developer": "nguyentd", + "scores": { + "IFEval": 0.4496, + "BBH": 0.4731, + "MATH Level 5": 0.1148, + "GPQA": 0.2945, + "MUSR": 0.4025, + "MMLU-PRO": 0.3752 + } + }, + { + "model_id": "ngxson/MiniThinky-1B-Llama-3.2", + "name": "MiniThinky-1B-Llama-3.2", + "developer": "ngxson", + "scores": { + "IFEval": 0.2771, + "BBH": 0.3142, + "MATH Level 5": 0.0574, + "GPQA": 0.2391, + "MUSR": 0.3434, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "ngxson/MiniThinky-v2-1B-Llama-3.2", + "name": "MiniThinky-v2-1B-Llama-3.2", + "developer": "ngxson", + "scores": { + "IFEval": 0.2963, + "BBH": 0.3205, + "MATH Level 5": 0.0287, + "GPQA": 0.2399, + "MUSR": 0.3356, + "MMLU-PRO": 0.1116 + } + }, + { + "model_id": "nhyha/N3N_Delirium-v1_1030_0227", + "name": "N3N_Delirium-v1_1030_0227", + "developer": "nhyha", + "scores": { + "IFEval": 0.8023, + "BBH": 0.5891, + "MATH Level 5": 0.2107, + "GPQA": 0.3372, + "MUSR": 0.4098, + "MMLU-PRO": 0.415 + } + }, + { + "model_id": "nhyha/N3N_Llama-3.1-8B-Instruct_1028_0216", + "name": "N3N_Llama-3.1-8B-Instruct_1028_0216", + "developer": "nhyha", + "scores": { + "IFEval": 0.4796, + "BBH": 0.5054, + "MATH Level 5": 0.1707, + "GPQA": 0.3062, + "MUSR": 0.405, + "MMLU-PRO": 0.3638 + } + }, + { + "model_id": "nhyha/N3N_gemma-2-9b-it_20241029_1532", + "name": "N3N_gemma-2-9b-it_20241029_1532", + "developer": "nhyha", + "scores": { + "IFEval": 0.6752, + "BBH": 0.5863, + "MATH Level 5": 0.2122, + "GPQA": 0.3406, + "MUSR": 0.4594, + "MMLU-PRO": 0.4122 + } + }, + { + "model_id": "nhyha/N3N_gemma-2-9b-it_20241110_2026", + "name": "N3N_gemma-2-9b-it_20241110_2026", + "developer": "nhyha", + "scores": { + "IFEval": 0.6283, + "BBH": 0.5867, + "MATH Level 5": 0.1609, + "GPQA": 0.3364, + "MUSR": 0.4073, + "MMLU-PRO": 0.402 + } + }, + { + "model_id": "nhyha/merge_Qwen2.5-7B-Instruct_20241023_0314", + "name": "merge_Qwen2.5-7B-Instruct_20241023_0314", + "developer": "nhyha", + "scores": { + "IFEval": 0.5695, + "BBH": 0.5559, + "MATH Level 5": 0.3542, + "GPQA": 0.3213, + "MUSR": 0.4251, + "MMLU-PRO": 0.4542 + } + }, + { + "model_id": "nidum/Nidum-Limitless-Gemma-2B", + "name": "Nidum-Limitless-Gemma-2B", + "developer": "nidum", + "scores": { + "IFEval": 0.2424, + "BBH": 0.3079, + "MATH Level 5": 0.0136, + "GPQA": 0.2643, + "MUSR": 0.374, + "MMLU-PRO": 0.1174 + } + }, + { + "model_id": "nisten/franqwenstein-35b", + "name": "franqwenstein-35b", + "developer": "nisten", + "scores": { + "IFEval": 0.3799, + "BBH": 0.6647, + "MATH Level 5": 0.3406, + "GPQA": 0.4035, + "MUSR": 0.494, + "MMLU-PRO": 0.5731 + } + }, + { + "model_id": "nisten/tqwendo-36b", + "name": "tqwendo-36b", + "developer": "nisten", + "scores": { + "IFEval": 0.6778, + "BBH": 0.6432, + "MATH Level 5": 0.4154, + "GPQA": 0.3314, + "MUSR": 0.443, + "MMLU-PRO": 0.4381 + } + }, + { + "model_id": "nlpguy/Lion-Lamarck-v.1.0.8", + "name": "Lion-Lamarck-v.1.0.8", + "developer": "nlpguy", + "scores": { + "IFEval": 0.4509, + "BBH": 0.5869, + "MATH Level 5": 0.5544, + "GPQA": 0.3582, + "MUSR": 0.4673, + "MMLU-PRO": 0.4643 + } + }, + { + "model_id": "nlpguy/Lion-Lamarck-v.1.0.9", + "name": "Lion-Lamarck-v.1.0.9", + "developer": "nlpguy", + "scores": { + "IFEval": 0.3409, + "BBH": 0.5918, + "MATH Level 5": 0.5642, + "GPQA": 0.3901, + "MUSR": 0.53, + "MMLU-PRO": 0.4704 + } + }, + { + "model_id": "nlpguy/Lion-Lamarck-v.1.1.0", + "name": "Lion-Lamarck-v.1.1.0", + "developer": "nlpguy", + "scores": { + "IFEval": 0.3658, + "BBH": 0.5962, + "MATH Level 5": 0.5755, + "GPQA": 0.3926, + "MUSR": 0.5325, + "MMLU-PRO": 0.4631 + } + }, + { + "model_id": "nlpguy/Miisce-one", + "name": "Miisce-one", + "developer": "nlpguy", + "scores": { + "IFEval": 0.6066, + "BBH": 0.6505, + "MATH Level 5": 0.4169, + "GPQA": 0.3859, + "MUSR": 0.482, + "MMLU-PRO": 0.5412 + } + }, + { + "model_id": "nlpguy/Mistral-NeMo-Minitron-Upscale-v1", + "name": "Mistral-NeMo-Minitron-Upscale-v1", + "developer": "nlpguy", + "scores": { + "IFEval": 0.1648, + "BBH": 0.4468, + "MATH Level 5": 0.0144, + "GPQA": 0.2802, + "MUSR": 0.3804, + "MMLU-PRO": 0.2537 + } + }, + { + "model_id": "nlpguy/Mistral-NeMo-Minitron-Upscale-v2", + "name": "Mistral-NeMo-Minitron-Upscale-v2", + "developer": "nlpguy", + "scores": { + "IFEval": 0.1573, + "BBH": 0.395, + "MATH Level 5": 0.0128, + "GPQA": 0.2735, + "MUSR": 0.3791, + "MMLU-PRO": 0.1927 + } + }, + { + "model_id": "nlpguy/Mistral-NeMo-Minitron-Upscale-v3", + "name": "Mistral-NeMo-Minitron-Upscale-v3", + "developer": "nlpguy", + "scores": { + "IFEval": 0.1412, + "BBH": 0.3052, + "MATH Level 5": 0.0113, + "GPQA": 0.2592, + "MUSR": 0.4098, + "MMLU-PRO": 0.1171 + } + }, + { + "model_id": "nlpguy/StableProse", + "name": "StableProse", + "developer": "nlpguy", + "scores": { + "IFEval": 0.1972, + "BBH": 0.5117, + "MATH Level 5": 0.065, + "GPQA": 0.3029, + "MUSR": 0.4067, + "MMLU-PRO": 0.3468 + } + }, + { + "model_id": "nlpguy/StarFusion-alpha1", + "name": "StarFusion-alpha1", + "developer": "nlpguy", + "scores": { + "IFEval": 0.566, + "BBH": 0.4429, + "MATH Level 5": 0.0718, + "GPQA": 0.2953, + "MUSR": 0.4081, + "MMLU-PRO": 0.3191 + } + }, + { + "model_id": "noname0202/Llama-3.2-4x3B-Instruct", + "name": "Llama-3.2-4x3B-Instruct", + "developer": "noname0202", + "scores": { + "IFEval": 0.7067, + "BBH": 0.4647, + "MATH Level 5": 0.1586, + "GPQA": 0.2727, + "MUSR": 0.3674, + "MMLU-PRO": 0.3285 + } + }, + { + "model_id": "noname0202/gemma-2-2b-it-ties", + "name": "gemma-2-2b-it-ties", + "developer": "noname0202", + "scores": { + "IFEval": 0.1266, + "BBH": 0.4206, + "MATH Level 5": 0.0242, + "GPQA": 0.2701, + "MUSR": 0.3929, + "MMLU-PRO": 0.2561 + } + }, + { + "model_id": "noname0202/gemma-2-9b-sft-jp-en-zh-v1", + "name": "gemma-2-9b-sft-jp-en-zh-v1", + "developer": "noname0202", + "scores": { + "IFEval": 0.2988, + "BBH": 0.4519, + "MATH Level 5": 0.0891, + "GPQA": 0.307, + "MUSR": 0.408, + "MMLU-PRO": 0.3125 + } + }, + { + "model_id": "noname0202/gemma-2-9b-sft-jp-en-zh-v2", + "name": "gemma-2-9b-sft-jp-en-zh-v2", + "developer": "noname0202", + "scores": { + "IFEval": 0.3993, + "BBH": 0.4515, + "MATH Level 5": 0.1042, + "GPQA": 0.2878, + "MUSR": 0.3612, + "MMLU-PRO": 0.3675 + } + }, + { + "model_id": "noname0202/llama-math-1b-r16-0to512tokens-test", + "name": "llama-math-1b-r16-0to512tokens-test", + "developer": "noname0202", + "scores": { + "IFEval": 0.547, + "BBH": 0.3488, + "MATH Level 5": 0.0816, + "GPQA": 0.2668, + "MUSR": 0.3143, + "MMLU-PRO": 0.1728 + } + }, + { + "model_id": "noname0202/llama-math-1b-r32-0to512tokens-test", + "name": "llama-math-1b-r32-0to512tokens-test", + "developer": "noname0202", + "scores": { + "IFEval": 0.5683, + "BBH": 0.3495, + "MATH Level 5": 0.0906, + "GPQA": 0.2651, + "MUSR": 0.3209, + "MMLU-PRO": 0.176 + } + }, + { + "model_id": "noname0202/llama-math-1b-r32-test", + "name": "llama-math-1b-r32-test", + "developer": "noname0202", + "scores": { + "IFEval": 0.5819, + "BBH": 0.3486, + "MATH Level 5": 0.0725, + "GPQA": 0.2617, + "MUSR": 0.3156, + "MMLU-PRO": 0.1781 + } + }, + { + "model_id": "noname0202/llama-math-1b-r8-512tokens-test", + "name": "llama-math-1b-r8-512tokens-test", + "developer": "noname0202", + "scores": { + "IFEval": 0.5792, + "BBH": 0.3496, + "MATH Level 5": 0.0816, + "GPQA": 0.2685, + "MUSR": 0.3169, + "MMLU-PRO": 0.1753 + } + }, + { + "model_id": "notbdq/Qwen2.5-14B-Instruct-1M-GRPO-Reasoning", + "name": "Qwen2.5-14B-Instruct-1M-GRPO-Reasoning", + "developer": "notbdq", + "scores": { + "IFEval": 0.8414, + "BBH": 0.6198, + "MATH Level 5": 0.5302, + "GPQA": 0.3431, + "MUSR": 0.418, + "MMLU-PRO": 0.485 + } + }, + { + "model_id": "nothingiisreal/L3.1-8B-Celeste-V1.5", + "name": "L3.1-8B-Celeste-V1.5", + "developer": "nothingiisreal", + "scores": { + "IFEval": 0.7327, + "BBH": 0.5012, + "MATH Level 5": 0.1465, + "GPQA": 0.2844, + "MUSR": 0.3749, + "MMLU-PRO": 0.3704 + } + }, + { + "model_id": "nothingiisreal/MN-12B-Starcannon-v2", + "name": "MN-12B-Starcannon-v2", + "developer": "nothingiisreal", + "scores": { + "IFEval": 0.3925, + "BBH": 0.5004, + "MATH Level 5": 0.0597, + "GPQA": 0.2785, + "MUSR": 0.3978, + "MMLU-PRO": 0.3128 + } + }, + { + "model_id": "nothingiisreal/MN-12B-Starcannon-v3", + "name": "MN-12B-Starcannon-v3", + "developer": "nothingiisreal", + "scores": { + "IFEval": 0.3807, + "BBH": 0.5171, + "MATH Level 5": 0.0778, + "GPQA": 0.2735, + "MUSR": 0.4046, + "MMLU-PRO": 0.3265 + } + }, + { + "model_id": "nvidia/AceInstruct-1.5B", + "name": "AceInstruct-1.5B", + "developer": "nvidia", + "scores": { + "IFEval": 0.3948, + "BBH": 0.3932, + "MATH Level 5": 0.3127, + "GPQA": 0.2718, + "MUSR": 0.346, + "MMLU-PRO": 0.2574 + } + }, + { + "model_id": "nvidia/AceInstruct-72B", + "name": "AceInstruct-72B", + "developer": "nvidia", + "scores": { + "IFEval": 0.7119, + "BBH": 0.6139, + "MATH Level 5": 0.6261, + "GPQA": 0.3213, + "MUSR": 0.4206, + "MMLU-PRO": 0.4874 + } + }, + { + "model_id": "nvidia/AceInstruct-7B", + "name": "AceInstruct-7B", + "developer": "nvidia", + "scores": { + "IFEval": 0.5422, + "BBH": 0.5501, + "MATH Level 5": 0.5295, + "GPQA": 0.307, + "MUSR": 0.4255, + "MMLU-PRO": 0.4177 + } + }, + { + "model_id": "nvidia/AceMath-1.5B-Instruct", + "name": "AceMath-1.5B-Instruct", + "developer": "nvidia", + "scores": { + "IFEval": 0.3212, + "BBH": 0.4024, + "MATH Level 5": 0.5287, + "GPQA": 0.2743, + "MUSR": 0.3607, + "MMLU-PRO": 0.2064 + } + }, + { + "model_id": "nvidia/AceMath-72B-Instruct", + "name": "AceMath-72B-Instruct", + "developer": "nvidia", + "scores": { + "IFEval": 0.495, + "BBH": 0.6402, + "MATH Level 5": 0.7145, + "GPQA": 0.271, + "MUSR": 0.4062, + "MMLU-PRO": 0.4411 + } + }, + { + "model_id": "nvidia/AceMath-72B-RM", + "name": "AceMath-72B-RM", + "developer": "nvidia", + "scores": { + "IFEval": 0.1413, + "BBH": 0.2717, + "MATH Level 5": 0.0, + "GPQA": 0.2341, + "MUSR": 0.3351, + "MMLU-PRO": 0.1179 + } + }, + { + "model_id": "nvidia/AceMath-7B-Instruct", + "name": "AceMath-7B-Instruct", + "developer": "nvidia", + "scores": { + "IFEval": 0.4532, + "BBH": 0.4994, + "MATH Level 5": 0.6337, + "GPQA": 0.2919, + "MUSR": 0.4193, + "MMLU-PRO": 0.3383 + } + }, + { + "model_id": "nvidia/AceMath-7B-RM", + "name": "AceMath-7B-RM", + "developer": "nvidia", + "scores": { + "IFEval": 0.1494, + "BBH": 0.2423, + "MATH Level 5": 0.0, + "GPQA": 0.2458, + "MUSR": 0.358, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "nvidia/Hymba-1.5B-Base", + "name": "Hymba-1.5B-Base", + "developer": "nvidia", + "scores": { + "IFEval": 0.2295, + "BBH": 0.3256, + "MATH Level 5": 0.0136, + "GPQA": 0.2559, + "MUSR": 0.3566, + "MMLU-PRO": 0.1922 + } + }, + { + "model_id": "nvidia/Hymba-1.5B-Instruct", + "name": "Hymba-1.5B-Instruct", + "developer": "nvidia", + "scores": { + "IFEval": 0.6009, + "BBH": 0.3067, + "MATH Level 5": 0.0272, + "GPQA": 0.2886, + "MUSR": 0.3316, + "MMLU-PRO": 0.204 + } + }, + { + "model_id": "nvidia/Llama-3.1-Minitron-4B-Depth-Base", + "name": "Llama-3.1-Minitron-4B-Depth-Base", + "developer": "nvidia", + "scores": { + "IFEval": 0.1607, + "BBH": 0.4171, + "MATH Level 5": 0.0196, + "GPQA": 0.2634, + "MUSR": 0.4011, + "MMLU-PRO": 0.2798 + } + }, + { + "model_id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", + "name": "Llama-3.1-Nemotron-70B-Instruct-HF", + "developer": "nvidia", + "scores": { + "IFEval": 0.7381, + "BBH": 0.6316, + "MATH Level 5": 0.4267, + "GPQA": 0.2584, + "MUSR": 0.4328, + "MMLU-PRO": 0.4919 + } + }, + { + "model_id": "nvidia/Minitron-4B-Base", + "name": "Minitron-4B-Base", + "developer": "nvidia", + "scores": { + "IFEval": 0.2218, + "BBH": 0.4084, + "MATH Level 5": 0.0196, + "GPQA": 0.2693, + "MUSR": 0.4134, + "MMLU-PRO": 0.262 + } + }, + { + "model_id": "nvidia/Minitron-8B-Base", + "name": "Minitron-8B-Base", + "developer": "nvidia", + "scores": { + "IFEval": 0.2424, + "BBH": 0.4395, + "MATH Level 5": 0.0257, + "GPQA": 0.2735, + "MUSR": 0.4026, + "MMLU-PRO": 0.3181 + } + }, + { + "model_id": "nvidia/Mistral-NeMo-Minitron-8B-Base", + "name": "Mistral-NeMo-Minitron-8B-Base", + "developer": "nvidia", + "scores": { + "IFEval": 0.1946, + "BBH": 0.5219, + "MATH Level 5": 0.0483, + "GPQA": 0.3255, + "MUSR": 0.4092, + "MMLU-PRO": 0.3796 + } + }, + { + "model_id": "nvidia/Mistral-NeMo-Minitron-8B-Instruct", + "name": "Mistral-NeMo-Minitron-8B-Instruct", + "developer": "nvidia", + "scores": { + "IFEval": 0.5004, + "BBH": 0.5321, + "MATH Level 5": 0.1163, + "GPQA": 0.2878, + "MUSR": 0.3886, + "MMLU-PRO": 0.3991 + } + }, + { + "model_id": "nvidia/Nemotron-Mini-4B-Instruct", + "name": "Nemotron-Mini-4B-Instruct", + "developer": "nvidia", + "scores": { + "IFEval": 0.6669, + "BBH": 0.3865, + "MATH Level 5": 0.0257, + "GPQA": 0.2802, + "MUSR": 0.3767, + "MMLU-PRO": 0.2626 + } + }, + { + "model_id": "nvidia/OpenMath2-Llama3.1-8B", + "name": "OpenMath2-Llama3.1-8B", + "developer": "nvidia", + "scores": { + "IFEval": 0.2331, + "BBH": 0.4096, + "MATH Level 5": 0.2674, + "GPQA": 0.2651, + "MUSR": 0.3436, + "MMLU-PRO": 0.1553 + } + }, + { + "model_id": "nxmwxm/Beast-Soul-new", + "name": "Beast-Soul-new", + "developer": "nxmwxm", + "scores": { + "IFEval": 0.4869, + "BBH": 0.5227, + "MATH Level 5": 0.074, + "GPQA": 0.2819, + "MUSR": 0.4459, + "MMLU-PRO": 0.3102 + } + }, + { + "model_id": "occiglot/occiglot-7b-es-en-instruct", + "name": "occiglot-7b-es-en-instruct", + "developer": "occiglot", + "scores": { + "IFEval": 0.3485, + "BBH": 0.4111, + "MATH Level 5": 0.0242, + "GPQA": 0.2592, + "MUSR": 0.3738, + "MMLU-PRO": 0.2311 + } + }, + { + "model_id": "odyssey-labs/Astral-1-10B", + "name": "Astral-1-10B", + "developer": "odyssey-labs", + "scores": { + "IFEval": 0.3878, + "BBH": 0.4873, + "MATH Level 5": 0.0347, + "GPQA": 0.3054, + "MUSR": 0.428, + "MMLU-PRO": 0.2985 + } + }, + { + "model_id": "olabs-ai/reflection_model", + "name": "reflection_model", + "developer": "olabs-ai", + "scores": { + "IFEval": 0.1599, + "BBH": 0.4713, + "MATH Level 5": 0.0514, + "GPQA": 0.3003, + "MUSR": 0.3508, + "MMLU-PRO": 0.3311 + } + }, + { + "model_id": "ontocord/Llama_3.2_1b-autoredteam_helpfulness-train", + "name": "Llama_3.2_1b-autoredteam_helpfulness-train", + "developer": "ontocord", + "scores": { + "IFEval": 0.2765, + "BBH": 0.3115, + "MATH Level 5": 0.0166, + "GPQA": 0.2592, + "MUSR": 0.3459, + "MMLU-PRO": 0.1132 + } + }, + { + "model_id": "ontocord/RedPajama-3B-v1-AutoRedteam", + "name": "RedPajama-3B-v1-AutoRedteam", + "developer": "ontocord", + "scores": { + "IFEval": 0.1343, + "BBH": 0.3026, + "MATH Level 5": 0.0091, + "GPQA": 0.2424, + "MUSR": 0.3661, + "MMLU-PRO": 0.1108 + } + }, + { + "model_id": "ontocord/RedPajama-3B-v1-AutoRedteam-Harmless-only", + "name": "RedPajama-3B-v1-AutoRedteam-Harmless-only", + "developer": "ontocord", + "scores": { + "IFEval": 0.1525, + "BBH": 0.3124, + "MATH Level 5": 0.006, + "GPQA": 0.2315, + "MUSR": 0.3661, + "MMLU-PRO": 0.11 + } + }, + { + "model_id": "ontocord/RedPajama3b_v1-autoredteam_helpfulness-train", + "name": "RedPajama3b_v1-autoredteam_helpfulness-train", + "developer": "ontocord", + "scores": { + "IFEval": 0.2848, + "BBH": 0.3093, + "MATH Level 5": 0.0068, + "GPQA": 0.2458, + "MUSR": 0.358, + "MMLU-PRO": 0.1107 + } + }, + { + "model_id": "ontocord/merged_0.2_expert_0.8", + "name": "merged_0.2_expert_0.8", + "developer": "ontocord", + "scores": { + "IFEval": 0.1743, + "BBH": 0.3046, + "MATH Level 5": 0.0264, + "GPQA": 0.2617, + "MUSR": 0.3621, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "ontocord/merged_0.2_expert_0.8-stack_2x", + "name": "merged_0.2_expert_0.8-stack_2x", + "developer": "ontocord", + "scores": { + "IFEval": 0.1796, + "BBH": 0.3006, + "MATH Level 5": 0.0249, + "GPQA": 0.2626, + "MUSR": 0.3541, + "MMLU-PRO": 0.1103 + } + }, + { + "model_id": "ontocord/merged_0.5_expert_0.5", + "name": "merged_0.5_expert_0.5", + "developer": "ontocord", + "scores": { + "IFEval": 0.1787, + "BBH": 0.3017, + "MATH Level 5": 0.0196, + "GPQA": 0.2643, + "MUSR": 0.3542, + "MMLU-PRO": 0.1108 + } + }, + { + "model_id": "ontocord/ontocord_wide_3b-stage1_shuf_sample1_jsonl-pretrained-autoredteam_helpful-0.25_helpful", + "name": "ontocord_wide_3b-stage1_shuf_sample1_jsonl-pretrained-autoredteam_helpful-0.25_helpful", + "developer": "ontocord", + "scores": { + "IFEval": 0.1318, + "BBH": 0.3004, + "MATH Level 5": 0.0106, + "GPQA": 0.2676, + "MUSR": 0.3631, + "MMLU-PRO": 0.1142 + } + }, + { + "model_id": "ontocord/ontocord_wide_7b-stacked-stage1", + "name": "ontocord_wide_7b-stacked-stage1", + "developer": "ontocord", + "scores": { + "IFEval": 0.1485, + "BBH": 0.2897, + "MATH Level 5": 0.0091, + "GPQA": 0.2534, + "MUSR": 0.3604, + "MMLU-PRO": 0.1105 + } + }, + { + "model_id": "ontocord/ontocord_wide_7b-stacked-stage1-instruct", + "name": "ontocord_wide_7b-stacked-stage1-instruct", + "developer": "ontocord", + "scores": { + "IFEval": 0.153, + "BBH": 0.2854, + "MATH Level 5": 0.0068, + "GPQA": 0.2466, + "MUSR": 0.3538, + "MMLU-PRO": 0.1117 + } + }, + { + "model_id": "ontocord/starcoder2-29b-ls", + "name": "starcoder2-29b-ls", + "developer": "ontocord", + "scores": { + "IFEval": 0.2149, + "BBH": 0.3735, + "MATH Level 5": 0.0189, + "GPQA": 0.2735, + "MUSR": 0.37, + "MMLU-PRO": 0.1869 + } + }, + { + "model_id": "ontocord/starcoder2_3b-AutoRedteam", + "name": "starcoder2_3b-AutoRedteam", + "developer": "ontocord", + "scores": { + "IFEval": 0.1574, + "BBH": 0.3498, + "MATH Level 5": 0.0106, + "GPQA": 0.2517, + "MUSR": 0.3646, + "MMLU-PRO": 0.1336 + } + }, + { + "model_id": "ontocord/wide_3b-merge_test", + "name": "wide_3b-merge_test", + "developer": "ontocord", + "scores": { + "IFEval": 0.1763, + "BBH": 0.3011, + "MATH Level 5": 0.0, + "GPQA": 0.2399, + "MUSR": 0.342, + "MMLU-PRO": 0.1066 + } + }, + { + "model_id": "ontocord/wide_3b-stage1_shuf_sample1_jsonl-pretrained", + "name": "wide_3b-stage1_shuf_sample1_jsonl-pretrained", + "developer": "ontocord", + "scores": { + "IFEval": 0.1395, + "BBH": 0.3004, + "MATH Level 5": 0.0166, + "GPQA": 0.2659, + "MUSR": 0.3632, + "MMLU-PRO": 0.114 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stag1.2-lyrical_law_news_software_howto_formattedtext_math_wiki-merge", + "name": "wide_3b_sft_stag1.2-lyrical_law_news_software_howto_formattedtext_math_wiki-merge", + "developer": "ontocord", + "scores": { + "IFEval": 0.1664, + "BBH": 0.3031, + "MATH Level 5": 0.0113, + "GPQA": 0.2601, + "MUSR": 0.3845, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stag1.2-lyrical_news_software_howto_formattedtext-merge", + "name": "wide_3b_sft_stag1.2-lyrical_news_software_howto_formattedtext-merge", + "developer": "ontocord", + "scores": { + "IFEval": 0.1697, + "BBH": 0.2975, + "MATH Level 5": 0.0136, + "GPQA": 0.2601, + "MUSR": 0.3778, + "MMLU-PRO": 0.1125 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-no_redteam_skg_poem.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-no_redteam_skg_poem.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.148, + "BBH": 0.3095, + "MATH Level 5": 0.0204, + "GPQA": 0.2701, + "MUSR": 0.3579, + "MMLU-PRO": 0.1108 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_generics_intr.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_generics_intr.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.1237, + "BBH": 0.306, + "MATH Level 5": 0.0106, + "GPQA": 0.2743, + "MUSR": 0.3673, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_generics_intr_math.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_generics_intr_math.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.1192, + "BBH": 0.2956, + "MATH Level 5": 0.0068, + "GPQA": 0.2643, + "MUSR": 0.3553, + "MMLU-PRO": 0.1183 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_generics_intr_math_stories.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_generics_intr_math_stories.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.1128, + "BBH": 0.3171, + "MATH Level 5": 0.0113, + "GPQA": 0.2685, + "MUSR": 0.346, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_generics_intr_math_stories_no_orig_instr.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_generics_intr_math_stories_no_orig_instr.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.1317, + "BBH": 0.3064, + "MATH Level 5": 0.0091, + "GPQA": 0.2651, + "MUSR": 0.3446, + "MMLU-PRO": 0.1144 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_generics_intr_stories.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_generics_intr_stories.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.1182, + "BBH": 0.3037, + "MATH Level 5": 0.0083, + "GPQA": 0.2659, + "MUSR": 0.3567, + "MMLU-PRO": 0.1162 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_generics_math.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_generics_math.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.124, + "BBH": 0.3032, + "MATH Level 5": 0.0076, + "GPQA": 0.2584, + "MUSR": 0.3487, + "MMLU-PRO": 0.1128 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_math.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_math.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.1298, + "BBH": 0.3052, + "MATH Level 5": 0.0159, + "GPQA": 0.2601, + "MUSR": 0.3928, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.1-ss1-with_r1_generics_intr_math_stories.no_issue", + "name": "wide_3b_sft_stage1.1-ss1-with_r1_generics_intr_math_stories.no_issue", + "developer": "ontocord", + "scores": { + "IFEval": 0.2049, + "BBH": 0.2912, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3575, + "MMLU-PRO": 0.1167 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.2-ss1-expert_fictional_lyrical", + "name": "wide_3b_sft_stage1.2-ss1-expert_fictional_lyrical", + "developer": "ontocord", + "scores": { + "IFEval": 0.1461, + "BBH": 0.2998, + "MATH Level 5": 0.0136, + "GPQA": 0.2643, + "MUSR": 0.3926, + "MMLU-PRO": 0.1141 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.2-ss1-expert_formatted_text", + "name": "wide_3b_sft_stage1.2-ss1-expert_formatted_text", + "developer": "ontocord", + "scores": { + "IFEval": 0.1487, + "BBH": 0.3069, + "MATH Level 5": 0.0121, + "GPQA": 0.2617, + "MUSR": 0.3474, + "MMLU-PRO": 0.1146 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.2-ss1-expert_how-to", + "name": "wide_3b_sft_stage1.2-ss1-expert_how-to", + "developer": "ontocord", + "scores": { + "IFEval": 0.1245, + "BBH": 0.3047, + "MATH Level 5": 0.0144, + "GPQA": 0.2592, + "MUSR": 0.3658, + "MMLU-PRO": 0.1153 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.2-ss1-expert_math", + "name": "wide_3b_sft_stage1.2-ss1-expert_math", + "developer": "ontocord", + "scores": { + "IFEval": 0.1915, + "BBH": 0.306, + "MATH Level 5": 0.0279, + "GPQA": 0.2592, + "MUSR": 0.37, + "MMLU-PRO": 0.1092 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.2-ss1-expert_news", + "name": "wide_3b_sft_stage1.2-ss1-expert_news", + "developer": "ontocord", + "scores": { + "IFEval": 0.1658, + "BBH": 0.2926, + "MATH Level 5": 0.0166, + "GPQA": 0.2676, + "MUSR": 0.3621, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "ontocord/wide_3b_sft_stage1.2-ss1-expert_software", + "name": "wide_3b_sft_stage1.2-ss1-expert_software", + "developer": "ontocord", + "scores": { + "IFEval": 0.1734, + "BBH": 0.298, + "MATH Level 5": 0.0159, + "GPQA": 0.2584, + "MUSR": 0.3569, + "MMLU-PRO": 0.114 + } + }, + { + "model_id": "ontocord/wide_6.6b_sft_stag1.2-lyrical_law_news_software_howto_formattedtext_math_wiki-merge-stacked", + "name": "wide_6.6b_sft_stag1.2-lyrical_law_news_software_howto_formattedtext_math_wiki-merge-stacked", + "developer": "ontocord", + "scores": { + "IFEval": 0.1244, + "BBH": 0.3026, + "MATH Level 5": 0.0144, + "GPQA": 0.2659, + "MUSR": 0.3686, + "MMLU-PRO": 0.1115 + } + }, + { + "model_id": "oobabooga/CodeBooga-34B-v0.1", + "name": "CodeBooga-34B-v0.1", + "developer": "oobabooga", + "scores": { + "IFEval": 0.525, + "BBH": 0.3427, + "MATH Level 5": 0.0393, + "GPQA": 0.2567, + "MUSR": 0.431, + "MMLU-PRO": 0.236 + } + }, + { + "model_id": "oopere/Llama-FinSent-S", + "name": "Llama-FinSent-S", + "developer": "oopere", + "scores": { + "IFEval": 0.2119, + "BBH": 0.3156, + "MATH Level 5": 0.0181, + "GPQA": 0.2567, + "MUSR": 0.3832, + "MMLU-PRO": 0.113 + } + }, + { + "model_id": "oopere/pruned10-llama-3.2-3B", + "name": "pruned10-llama-3.2-3B", + "developer": "oopere", + "scores": { + "IFEval": 0.1776, + "BBH": 0.334, + "MATH Level 5": 0.0196, + "GPQA": 0.2668, + "MUSR": 0.3722, + "MMLU-PRO": 0.164 + } + }, + { + "model_id": "oopere/pruned20-llama-1b", + "name": "pruned20-llama-1b", + "developer": "oopere", + "scores": { + "IFEval": 0.1994, + "BBH": 0.3031, + "MATH Level 5": 0.0106, + "GPQA": 0.25, + "MUSR": 0.3631, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "oopere/pruned20-llama-3.2-3b", + "name": "pruned20-llama-3.2-3b", + "developer": "oopere", + "scores": { + "IFEval": 0.1789, + "BBH": 0.3248, + "MATH Level 5": 0.0159, + "GPQA": 0.2659, + "MUSR": 0.3418, + "MMLU-PRO": 0.128 + } + }, + { + "model_id": "oopere/pruned40-llama-1b", + "name": "pruned40-llama-1b", + "developer": "oopere", + "scores": { + "IFEval": 0.2284, + "BBH": 0.2969, + "MATH Level 5": 0.0076, + "GPQA": 0.2433, + "MUSR": 0.4287, + "MMLU-PRO": 0.1082 + } + }, + { + "model_id": "oopere/pruned40-llama-3.2-1B", + "name": "pruned40-llama-3.2-1B", + "developer": "oopere", + "scores": { + "IFEval": 0.2266, + "BBH": 0.2982, + "MATH Level 5": 0.0083, + "GPQA": 0.2542, + "MUSR": 0.4352, + "MMLU-PRO": 0.1115 + } + }, + { + "model_id": "oopere/pruned40-llama-3.2-3b", + "name": "pruned40-llama-3.2-3b", + "developer": "oopere", + "scores": { + "IFEval": 0.2183, + "BBH": 0.3167, + "MATH Level 5": 0.0128, + "GPQA": 0.2299, + "MUSR": 0.3539, + "MMLU-PRO": 0.1177 + } + }, + { + "model_id": "oopere/pruned60-llama-1b", + "name": "pruned60-llama-1b", + "developer": "oopere", + "scores": { + "IFEval": 0.1829, + "BBH": 0.3016, + "MATH Level 5": 0.0023, + "GPQA": 0.2492, + "MUSR": 0.4088, + "MMLU-PRO": 0.1173 + } + }, + { + "model_id": "oopere/pruned60-llama-3.2-3b", + "name": "pruned60-llama-3.2-3b", + "developer": "oopere", + "scores": { + "IFEval": 0.1825, + "BBH": 0.3166, + "MATH Level 5": 0.0038, + "GPQA": 0.2701, + "MUSR": 0.3633, + "MMLU-PRO": 0.1131 + } + }, + { + "model_id": "open-atlas/Atlas-Flash-1.5B-Preview", + "name": "Atlas-Flash-1.5B-Preview", + "developer": "open-atlas", + "scores": { + "IFEval": 0.327, + "BBH": 0.3215, + "MATH Level 5": 0.2213, + "GPQA": 0.2525, + "MUSR": 0.3488, + "MMLU-PRO": 0.1374 + } + }, + { + "model_id": "open-atlas/Atlas-Flash-7B-Preview", + "name": "Atlas-Flash-7B-Preview", + "developer": "open-atlas", + "scores": { + "IFEval": 0.3908, + "BBH": 0.3542, + "MATH Level 5": 0.2576, + "GPQA": 0.2886, + "MUSR": 0.3836, + "MMLU-PRO": 0.2784 + } + }, + { + "model_id": "open-neo/Kyro-n1-3B", + "name": "Kyro-n1-3B", + "developer": "open-neo", + "scores": { + "IFEval": 0.4595, + "BBH": 0.4685, + "MATH Level 5": 0.2855, + "GPQA": 0.2819, + "MUSR": 0.4088, + "MMLU-PRO": 0.3423 + } + }, + { + "model_id": "open-neo/Kyro-n1-7B", + "name": "Kyro-n1-7B", + "developer": "open-neo", + "scores": { + "IFEval": 0.5573, + "BBH": 0.5387, + "MATH Level 5": 0.3897, + "GPQA": 0.2609, + "MUSR": 0.3884, + "MMLU-PRO": 0.4333 + } + }, + { + "model_id": "open-thoughts/OpenThinker-7B", + "name": "OpenThinker-7B", + "developer": "open-thoughts", + "scores": { + "IFEval": 0.4089, + "BBH": 0.5343, + "MATH Level 5": 0.426, + "GPQA": 0.2567, + "MUSR": 0.382, + "MMLU-PRO": 0.4165 + } + }, + { + "model_id": "openai-community/gpt2", + "name": "gpt2", + "developer": "openai-community", + "scores": { + "IFEval": 0.1793, + "BBH": 0.3036, + "MATH Level 5": 0.0023, + "GPQA": 0.2584, + "MUSR": 0.4471, + "MMLU-PRO": 0.1159 + } + }, + { + "model_id": "openai-community/gpt2-large", + "name": "gpt2-large", + "developer": "openai-community", + "scores": { + "IFEval": 0.2048, + "BBH": 0.3069, + "MATH Level 5": 0.0121, + "GPQA": 0.2592, + "MUSR": 0.3789, + "MMLU-PRO": 0.1142 + } + }, + { + "model_id": "openai-community/gpt2-medium", + "name": "gpt2-medium", + "developer": "openai-community", + "scores": { + "IFEval": 0.2208, + "BBH": 0.305, + "MATH Level 5": 0.0076, + "GPQA": 0.2626, + "MUSR": 0.3884, + "MMLU-PRO": 0.1182 + } + }, + { + "model_id": "openai-community/gpt2-xl", + "name": "gpt2-xl", + "developer": "openai-community", + "scores": { + "IFEval": 0.2039, + "BBH": 0.3009, + "MATH Level 5": 0.0098, + "GPQA": 0.2584, + "MUSR": 0.371, + "MMLU-PRO": 0.1131 + } + }, + { + "model_id": "openbmb/MiniCPM-S-1B-sft-llama-format", + "name": "MiniCPM-S-1B-sft-llama-format", + "developer": "openbmb", + "scores": { + "IFEval": 0.3329, + "BBH": 0.3049, + "MATH Level 5": 0.031, + "GPQA": 0.271, + "MUSR": 0.3317, + "MMLU-PRO": 0.1858 + } + }, + { + "model_id": "openchat/openchat-3.5-0106", + "name": "openchat-3.5-0106", + "developer": "openchat", + "scores": { + "IFEval": 0.5967, + "BBH": 0.4617, + "MATH Level 5": 0.0763, + "GPQA": 0.3079, + "MUSR": 0.4254, + "MMLU-PRO": 0.3291 + } + }, + { + "model_id": "openchat/openchat-3.5-1210", + "name": "openchat-3.5-1210", + "developer": "openchat", + "scores": { + "IFEval": 0.6037, + "BBH": 0.4535, + "MATH Level 5": 0.0785, + "GPQA": 0.3012, + "MUSR": 0.4414, + "MMLU-PRO": 0.3142 + } + }, + { + "model_id": "openchat/openchat-3.6-8b-20240522", + "name": "openchat-3.6-8b-20240522", + "developer": "openchat", + "scores": { + "IFEval": 0.5343, + "BBH": 0.5338, + "MATH Level 5": 0.0997, + "GPQA": 0.318, + "MUSR": 0.3999, + "MMLU-PRO": 0.3229 + } + }, + { + "model_id": "openchat/openchat_3.5", + "name": "openchat_3.5", + "developer": "openchat", + "scores": { + "IFEval": 0.5931, + "BBH": 0.4426, + "MATH Level 5": 0.0725, + "GPQA": 0.2987, + "MUSR": 0.4229, + "MMLU-PRO": 0.3153 + } + }, + { + "model_id": "openchat/openchat_v3.2", + "name": "openchat_v3.2", + "developer": "openchat", + "scores": { + "IFEval": 0.2981, + "BBH": 0.4331, + "MATH Level 5": 0.0128, + "GPQA": 0.2701, + "MUSR": 0.4336, + "MMLU-PRO": 0.2422 + } + }, + { + "model_id": "openchat/openchat_v3.2_super", + "name": "openchat_v3.2_super", + "developer": "openchat", + "scores": { + "IFEval": 0.2862, + "BBH": 0.4221, + "MATH Level 5": 0.0211, + "GPQA": 0.2643, + "MUSR": 0.4161, + "MMLU-PRO": 0.2425 + } + }, + { + "model_id": "orai-nlp/Llama-eus-8B", + "name": "Llama-eus-8B", + "developer": "orai-nlp", + "scores": { + "IFEval": 0.2161, + "BBH": 0.4418, + "MATH Level 5": 0.0468, + "GPQA": 0.2894, + "MUSR": 0.3919, + "MMLU-PRO": 0.3058 + } + }, + { + "model_id": "oxyapi/oxy-1-small", + "name": "oxy-1-small", + "developer": "oxyapi", + "scores": { + "IFEval": 0.6245, + "BBH": 0.5885, + "MATH Level 5": 0.3603, + "GPQA": 0.3716, + "MUSR": 0.4487, + "MMLU-PRO": 0.5001 + } + }, + { + "model_id": "ozone-ai/0x-lite", + "name": "0x-lite", + "developer": "ozone-ai", + "scores": { + "IFEval": 0.774, + "BBH": 0.6341, + "MATH Level 5": 0.5045, + "GPQA": 0.3196, + "MUSR": 0.4221, + "MMLU-PRO": 0.5184 + } + }, + { + "model_id": "ozone-research/Chirp-01", + "name": "Chirp-01", + "developer": "ozone-research", + "scores": { + "IFEval": 0.6348, + "BBH": 0.465, + "MATH Level 5": 0.3467, + "GPQA": 0.2718, + "MUSR": 0.4487, + "MMLU-PRO": 0.3508 + } + }, + { + "model_id": "paloalma/ECE-TW3-JRGL-V1", + "name": "ECE-TW3-JRGL-V1", + "developer": "paloalma", + "scores": { + "IFEval": 0.5535, + "BBH": 0.6284, + "MATH Level 5": 0.1314, + "GPQA": 0.3473, + "MUSR": 0.4621, + "MMLU-PRO": 0.4221 + } + }, + { + "model_id": "paloalma/ECE-TW3-JRGL-V2", + "name": "ECE-TW3-JRGL-V2", + "developer": "paloalma", + "scores": { + "IFEval": 0.2255, + "BBH": 0.6031, + "MATH Level 5": 0.185, + "GPQA": 0.3314, + "MUSR": 0.4793, + "MMLU-PRO": 0.4588 + } + }, + { + "model_id": "paloalma/ECE-TW3-JRGL-V5", + "name": "ECE-TW3-JRGL-V5", + "developer": "paloalma", + "scores": { + "IFEval": 0.4553, + "BBH": 0.6025, + "MATH Level 5": 0.1835, + "GPQA": 0.3414, + "MUSR": 0.4621, + "MMLU-PRO": 0.4648 + } + }, + { + "model_id": "paloalma/Le_Triomphant-ECE-TW3", + "name": "Le_Triomphant-ECE-TW3", + "developer": "paloalma", + "scores": { + "IFEval": 0.5402, + "BBH": 0.6112, + "MATH Level 5": 0.1949, + "GPQA": 0.349, + "MUSR": 0.4725, + "MMLU-PRO": 0.4763 + } + }, + { + "model_id": "paloalma/TW3-JRGL-v2", + "name": "TW3-JRGL-v2", + "developer": "paloalma", + "scores": { + "IFEval": 0.5316, + "BBH": 0.6138, + "MATH Level 5": 0.179, + "GPQA": 0.3591, + "MUSR": 0.4858, + "MMLU-PRO": 0.4858 + } + }, + { + "model_id": "pankajmathur/Al_Dente_v1_8b", + "name": "Al_Dente_v1_8b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.3694, + "BBH": 0.4835, + "MATH Level 5": 0.0408, + "GPQA": 0.2995, + "MUSR": 0.3987, + "MMLU-PRO": 0.286 + } + }, + { + "model_id": "pankajmathur/model_007_13b_v2", + "name": "model_007_13b_v2", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.3056, + "BBH": 0.4702, + "MATH Level 5": 0.0211, + "GPQA": 0.2836, + "MUSR": 0.4611, + "MMLU-PRO": 0.2461 + } + }, + { + "model_id": "pankajmathur/orca_mini_3b", + "name": "orca_mini_3b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.0742, + "BBH": 0.3196, + "MATH Level 5": 0.0083, + "GPQA": 0.2458, + "MUSR": 0.3349, + "MMLU-PRO": 0.1145 + } + }, + { + "model_id": "pankajmathur/orca_mini_7b", + "name": "orca_mini_7b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.0412, + "BBH": 0.3332, + "MATH Level 5": 0.0128, + "GPQA": 0.2542, + "MUSR": 0.3698, + "MMLU-PRO": 0.1246 + } + }, + { + "model_id": "pankajmathur/orca_mini_phi-4", + "name": "orca_mini_phi-4", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.7781, + "BBH": 0.6856, + "MATH Level 5": 0.2953, + "GPQA": 0.3742, + "MUSR": 0.4703, + "MMLU-PRO": 0.5255 + } + }, + { + "model_id": "pankajmathur/orca_mini_v2_7b", + "name": "orca_mini_v2_7b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.1358, + "BBH": 0.3536, + "MATH Level 5": 0.0113, + "GPQA": 0.2492, + "MUSR": 0.3593, + "MMLU-PRO": 0.1542 + } + }, + { + "model_id": "pankajmathur/orca_mini_v3_13b", + "name": "orca_mini_v3_13b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.2897, + "BBH": 0.4711, + "MATH Level 5": 0.0211, + "GPQA": 0.2651, + "MUSR": 0.4598, + "MMLU-PRO": 0.2305 + } + }, + { + "model_id": "pankajmathur/orca_mini_v3_70b", + "name": "orca_mini_v3_70b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.4015, + "BBH": 0.5949, + "MATH Level 5": 0.0385, + "GPQA": 0.318, + "MUSR": 0.5079, + "MMLU-PRO": 0.3757 + } + }, + { + "model_id": "pankajmathur/orca_mini_v3_7b", + "name": "orca_mini_v3_7b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.2821, + "BBH": 0.4095, + "MATH Level 5": 0.0106, + "GPQA": 0.2466, + "MUSR": 0.4982, + "MMLU-PRO": 0.2084 + } + }, + { + "model_id": "pankajmathur/orca_mini_v5_8b", + "name": "orca_mini_v5_8b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.4806, + "BBH": 0.5064, + "MATH Level 5": 0.0989, + "GPQA": 0.2869, + "MUSR": 0.4, + "MMLU-PRO": 0.3076 + } + }, + { + "model_id": "pankajmathur/orca_mini_v5_8b_dpo", + "name": "orca_mini_v5_8b_dpo", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.4896, + "BBH": 0.5075, + "MATH Level 5": 0.0974, + "GPQA": 0.2743, + "MUSR": 0.3894, + "MMLU-PRO": 0.3116 + } + }, + { + "model_id": "pankajmathur/orca_mini_v5_8b_orpo", + "name": "orca_mini_v5_8b_orpo", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.0824, + "BBH": 0.4964, + "MATH Level 5": 0.0665, + "GPQA": 0.2844, + "MUSR": 0.4131, + "MMLU-PRO": 0.2947 + } + }, + { + "model_id": "pankajmathur/orca_mini_v6_8b", + "name": "orca_mini_v6_8b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.0111, + "BBH": 0.3029, + "MATH Level 5": 0.0038, + "GPQA": 0.2383, + "MUSR": 0.3555, + "MMLU-PRO": 0.1125 + } + }, + { + "model_id": "pankajmathur/orca_mini_v6_8b_dpo", + "name": "orca_mini_v6_8b_dpo", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.3883, + "BBH": 0.5203, + "MATH Level 5": 0.0612, + "GPQA": 0.3012, + "MUSR": 0.409, + "MMLU-PRO": 0.3596 + } + }, + { + "model_id": "pankajmathur/orca_mini_v7_72b", + "name": "orca_mini_v7_72b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.593, + "BBH": 0.6842, + "MATH Level 5": 0.0937, + "GPQA": 0.3851, + "MUSR": 0.507, + "MMLU-PRO": 0.5622 + } + }, + { + "model_id": "pankajmathur/orca_mini_v7_7b", + "name": "orca_mini_v7_7b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.4388, + "BBH": 0.5275, + "MATH Level 5": 0.1208, + "GPQA": 0.2961, + "MUSR": 0.436, + "MMLU-PRO": 0.4167 + } + }, + { + "model_id": "pankajmathur/orca_mini_v8_1_70b", + "name": "orca_mini_v8_1_70b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.8571, + "BBH": 0.6781, + "MATH Level 5": 0.3527, + "GPQA": 0.4329, + "MUSR": 0.4437, + "MMLU-PRO": 0.4983 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_0_3B-Instruct", + "name": "orca_mini_v9_0_3B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.5754, + "BBH": 0.4413, + "MATH Level 5": 0.1465, + "GPQA": 0.3012, + "MUSR": 0.3659, + "MMLU-PRO": 0.2603 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_1_1B-Instruct", + "name": "orca_mini_v9_1_1B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.3629, + "BBH": 0.3205, + "MATH Level 5": 0.0461, + "GPQA": 0.2567, + "MUSR": 0.3381, + "MMLU-PRO": 0.1374 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_2_14B", + "name": "orca_mini_v9_2_14B", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.7781, + "BBH": 0.6856, + "MATH Level 5": 0.2953, + "GPQA": 0.3742, + "MUSR": 0.4703, + "MMLU-PRO": 0.5255 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_2_70b", + "name": "orca_mini_v9_2_70b", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.8383, + "BBH": 0.6745, + "MATH Level 5": 0.2938, + "GPQA": 0.3733, + "MUSR": 0.471, + "MMLU-PRO": 0.4821 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_4_70B", + "name": "orca_mini_v9_4_70B", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.8015, + "BBH": 0.6419, + "MATH Level 5": 0.3263, + "GPQA": 0.3658, + "MUSR": 0.4647, + "MMLU-PRO": 0.4536 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_5_1B-Instruct", + "name": "orca_mini_v9_5_1B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.4638, + "BBH": 0.3337, + "MATH Level 5": 0.0302, + "GPQA": 0.2701, + "MUSR": 0.3182, + "MMLU-PRO": 0.137 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_5_1B-Instruct_preview", + "name": "orca_mini_v9_5_1B-Instruct_preview", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.3936, + "BBH": 0.3277, + "MATH Level 5": 0.0385, + "GPQA": 0.2634, + "MUSR": 0.3395, + "MMLU-PRO": 0.1327 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_5_3B-Instruct", + "name": "orca_mini_v9_5_3B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.7207, + "BBH": 0.4496, + "MATH Level 5": 0.1322, + "GPQA": 0.2869, + "MUSR": 0.427, + "MMLU-PRO": 0.2882 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_6_1B-Instruct", + "name": "orca_mini_v9_6_1B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.6086, + "BBH": 0.3561, + "MATH Level 5": 0.077, + "GPQA": 0.2685, + "MUSR": 0.3396, + "MMLU-PRO": 0.1809 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_6_3B-Instruct", + "name": "orca_mini_v9_6_3B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.7316, + "BBH": 0.4568, + "MATH Level 5": 0.1329, + "GPQA": 0.2936, + "MUSR": 0.4068, + "MMLU-PRO": 0.2851 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_7_1B-Instruct", + "name": "orca_mini_v9_7_1B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.561, + "BBH": 0.3182, + "MATH Level 5": 0.0446, + "GPQA": 0.2727, + "MUSR": 0.3527, + "MMLU-PRO": 0.1345 + } + }, + { + "model_id": "pankajmathur/orca_mini_v9_7_3B-Instruct", + "name": "orca_mini_v9_7_3B-Instruct", + "developer": "pankajmathur", + "scores": { + "IFEval": 0.5618, + "BBH": 0.3297, + "MATH Level 5": 0.0619, + "GPQA": 0.2617, + "MUSR": 0.3619, + "MMLU-PRO": 0.1375 + } + }, + { + "model_id": "paulml/ECE-ILAB-Q1", + "name": "ECE-ILAB-Q1", + "developer": "paulml", + "scores": { + "IFEval": 0.7865, + "BBH": 0.6718, + "MATH Level 5": 0.3557, + "GPQA": 0.3867, + "MUSR": 0.4614, + "MMLU-PRO": 0.5505 + } + }, + { + "model_id": "pints-ai/1.5-Pints-16K-v0.1", + "name": "1.5-Pints-16K-v0.1", + "developer": "pints-ai", + "scores": { + "IFEval": 0.1636, + "BBH": 0.3133, + "MATH Level 5": 0.0144, + "GPQA": 0.2357, + "MUSR": 0.3579, + "MMLU-PRO": 0.1119 + } + }, + { + "model_id": "pints-ai/1.5-Pints-2K-v0.1", + "name": "1.5-Pints-2K-v0.1", + "developer": "pints-ai", + "scores": { + "IFEval": 0.1762, + "BBH": 0.298, + "MATH Level 5": 0.0128, + "GPQA": 0.2483, + "MUSR": 0.3502, + "MMLU-PRO": 0.1104 + } + }, + { + "model_id": "piotr25691/thea-3b-25r", + "name": "thea-3b-25r", + "developer": "piotr25691", + "scores": { + "IFEval": 0.7344, + "BBH": 0.4484, + "MATH Level 5": 0.1782, + "GPQA": 0.2676, + "MUSR": 0.3315, + "MMLU-PRO": 0.3182 + } + }, + { + "model_id": "piotr25691/thea-c-3b-25r", + "name": "thea-c-3b-25r", + "developer": "piotr25691", + "scores": { + "IFEval": 0.7402, + "BBH": 0.4532, + "MATH Level 5": 0.1526, + "GPQA": 0.2651, + "MUSR": 0.3315, + "MMLU-PRO": 0.3178 + } + }, + { + "model_id": "piotr25691/thea-rp-3b-25r", + "name": "thea-rp-3b-25r", + "developer": "piotr25691", + "scores": { + "IFEval": 0.6578, + "BBH": 0.439, + "MATH Level 5": 0.1322, + "GPQA": 0.2743, + "MUSR": 0.3819, + "MMLU-PRO": 0.306 + } + }, + { + "model_id": "postbot/gpt2-medium-emailgen", + "name": "gpt2-medium-emailgen", + "developer": "postbot", + "scores": { + "IFEval": 0.1492, + "BBH": 0.313, + "MATH Level 5": 0.0, + "GPQA": 0.2601, + "MUSR": 0.3911, + "MMLU-PRO": 0.1147 + } + }, + { + "model_id": "prince-canuma/Ministral-8B-Instruct-2410-HF", + "name": "Ministral-8B-Instruct-2410-HF", + "developer": "prince-canuma", + "scores": { + "IFEval": 0.5912, + "BBH": 0.4586, + "MATH Level 5": 0.1918, + "GPQA": 0.281, + "MUSR": 0.4138, + "MMLU-PRO": 0.3298 + } + }, + { + "model_id": "princeton-nlp/Llama-3-8B-ProLong-512k-Base", + "name": "Llama-3-8B-ProLong-512k-Base", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.5322, + "BBH": 0.5033, + "MATH Level 5": 0.0687, + "GPQA": 0.2617, + "MUSR": 0.4223, + "MMLU-PRO": 0.3329 + } + }, + { + "model_id": "princeton-nlp/Llama-3-8B-ProLong-512k-Instruct", + "name": "Llama-3-8B-ProLong-512k-Instruct", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.3978, + "BBH": 0.4983, + "MATH Level 5": 0.0582, + "GPQA": 0.281, + "MUSR": 0.425, + "MMLU-PRO": 0.3246 + } + }, + { + "model_id": "princeton-nlp/Llama-3-8B-ProLong-64k-Base", + "name": "Llama-3-8B-ProLong-64k-Base", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.5201, + "BBH": 0.4927, + "MATH Level 5": 0.065, + "GPQA": 0.2651, + "MUSR": 0.4341, + "MMLU-PRO": 0.3348 + } + }, + { + "model_id": "princeton-nlp/Llama-3-8B-ProLong-64k-Instruct", + "name": "Llama-3-8B-ProLong-64k-Instruct", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.5563, + "BBH": 0.5083, + "MATH Level 5": 0.065, + "GPQA": 0.2953, + "MUSR": 0.4397, + "MMLU-PRO": 0.3275 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT", + "name": "Llama-3-Base-8B-SFT", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.2796, + "BBH": 0.4643, + "MATH Level 5": 0.04, + "GPQA": 0.2978, + "MUSR": 0.4118, + "MMLU-PRO": 0.3093 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-CPO", + "name": "Llama-3-Base-8B-SFT-CPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.3703, + "BBH": 0.4595, + "MATH Level 5": 0.0544, + "GPQA": 0.2743, + "MUSR": 0.3609, + "MMLU-PRO": 0.2976 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-DPO", + "name": "Llama-3-Base-8B-SFT-DPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4111, + "BBH": 0.4666, + "MATH Level 5": 0.0415, + "GPQA": 0.3104, + "MUSR": 0.3867, + "MMLU-PRO": 0.3078 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-IPO", + "name": "Llama-3-Base-8B-SFT-IPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4487, + "BBH": 0.469, + "MATH Level 5": 0.0393, + "GPQA": 0.2978, + "MUSR": 0.3919, + "MMLU-PRO": 0.3115 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-KTO", + "name": "Llama-3-Base-8B-SFT-KTO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4523, + "BBH": 0.4693, + "MATH Level 5": 0.0529, + "GPQA": 0.3054, + "MUSR": 0.3842, + "MMLU-PRO": 0.3054 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-ORPO", + "name": "Llama-3-Base-8B-SFT-ORPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4517, + "BBH": 0.4734, + "MATH Level 5": 0.0468, + "GPQA": 0.3138, + "MUSR": 0.3707, + "MMLU-PRO": 0.3083 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-RDPO", + "name": "Llama-3-Base-8B-SFT-RDPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.448, + "BBH": 0.4662, + "MATH Level 5": 0.0574, + "GPQA": 0.3062, + "MUSR": 0.4027, + "MMLU-PRO": 0.3014 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-RRHF", + "name": "Llama-3-Base-8B-SFT-RRHF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.3357, + "BBH": 0.452, + "MATH Level 5": 0.0453, + "GPQA": 0.3054, + "MUSR": 0.3722, + "MMLU-PRO": 0.2889 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-SLiC-HF", + "name": "Llama-3-Base-8B-SFT-SLiC-HF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.489, + "BBH": 0.4704, + "MATH Level 5": 0.0506, + "GPQA": 0.2869, + "MUSR": 0.4091, + "MMLU-PRO": 0.3063 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Base-8B-SFT-SimPO", + "name": "Llama-3-Base-8B-SFT-SimPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4685, + "BBH": 0.4741, + "MATH Level 5": 0.0551, + "GPQA": 0.2886, + "MUSR": 0.4127, + "MMLU-PRO": 0.3105 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-CPO", + "name": "Llama-3-Instruct-8B-CPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7293, + "BBH": 0.4999, + "MATH Level 5": 0.0989, + "GPQA": 0.2601, + "MUSR": 0.3514, + "MMLU-PRO": 0.3652 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-CPO-v0.2", + "name": "Llama-3-Instruct-8B-CPO-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7506, + "BBH": 0.5027, + "MATH Level 5": 0.108, + "GPQA": 0.2609, + "MUSR": 0.3619, + "MMLU-PRO": 0.3706 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-DPO", + "name": "Llama-3-Instruct-8B-DPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.6757, + "BBH": 0.4991, + "MATH Level 5": 0.0846, + "GPQA": 0.2718, + "MUSR": 0.3738, + "MMLU-PRO": 0.3665 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-DPO-v0.2", + "name": "Llama-3-Instruct-8B-DPO-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7208, + "BBH": 0.5056, + "MATH Level 5": 0.0899, + "GPQA": 0.2869, + "MUSR": 0.3844, + "MMLU-PRO": 0.3769 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-KTO", + "name": "Llama-3-Instruct-8B-KTO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.6864, + "BBH": 0.4982, + "MATH Level 5": 0.0725, + "GPQA": 0.276, + "MUSR": 0.3698, + "MMLU-PRO": 0.3599 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-KTO-v0.2", + "name": "Llama-3-Instruct-8B-KTO-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.729, + "BBH": 0.508, + "MATH Level 5": 0.0997, + "GPQA": 0.2601, + "MUSR": 0.3777, + "MMLU-PRO": 0.3668 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-ORPO", + "name": "Llama-3-Instruct-8B-ORPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7128, + "BBH": 0.5001, + "MATH Level 5": 0.0785, + "GPQA": 0.2584, + "MUSR": 0.3502, + "MMLU-PRO": 0.3646 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-ORPO-v0.2", + "name": "Llama-3-Instruct-8B-ORPO-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7633, + "BBH": 0.5078, + "MATH Level 5": 0.102, + "GPQA": 0.2836, + "MUSR": 0.378, + "MMLU-PRO": 0.3731 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-RDPO", + "name": "Llama-3-Instruct-8B-RDPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.666, + "BBH": 0.5034, + "MATH Level 5": 0.0846, + "GPQA": 0.2827, + "MUSR": 0.3752, + "MMLU-PRO": 0.3607 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-RDPO-v0.2", + "name": "Llama-3-Instruct-8B-RDPO-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7077, + "BBH": 0.5049, + "MATH Level 5": 0.0869, + "GPQA": 0.2928, + "MUSR": 0.3804, + "MMLU-PRO": 0.3774 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-RRHF", + "name": "Llama-3-Instruct-8B-RRHF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7275, + "BBH": 0.4911, + "MATH Level 5": 0.0967, + "GPQA": 0.2802, + "MUSR": 0.3476, + "MMLU-PRO": 0.3644 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-RRHF-v0.2", + "name": "Llama-3-Instruct-8B-RRHF-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.7125, + "BBH": 0.4984, + "MATH Level 5": 0.0876, + "GPQA": 0.2601, + "MUSR": 0.3738, + "MMLU-PRO": 0.3482 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-SLiC-HF", + "name": "Llama-3-Instruct-8B-SLiC-HF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.74, + "BBH": 0.5029, + "MATH Level 5": 0.0974, + "GPQA": 0.2861, + "MUSR": 0.3723, + "MMLU-PRO": 0.3585 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-SLiC-HF-v0.2", + "name": "Llama-3-Instruct-8B-SLiC-HF-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.711, + "BBH": 0.4984, + "MATH Level 5": 0.0876, + "GPQA": 0.2601, + "MUSR": 0.3738, + "MMLU-PRO": 0.3482 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-SimPO", + "name": "Llama-3-Instruct-8B-SimPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.6504, + "BBH": 0.4845, + "MATH Level 5": 0.0861, + "GPQA": 0.2936, + "MUSR": 0.3948, + "MMLU-PRO": 0.3489 + } + }, + { + "model_id": "princeton-nlp/Llama-3-Instruct-8B-SimPO-v0.2", + "name": "Llama-3-Instruct-8B-SimPO-v0.2", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.6809, + "BBH": 0.5038, + "MATH Level 5": 0.074, + "GPQA": 0.3012, + "MUSR": 0.3988, + "MMLU-PRO": 0.3622 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-CPO", + "name": "Mistral-7B-Base-SFT-CPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4655, + "BBH": 0.4382, + "MATH Level 5": 0.0279, + "GPQA": 0.2919, + "MUSR": 0.4071, + "MMLU-PRO": 0.2651 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-DPO", + "name": "Mistral-7B-Base-SFT-DPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4403, + "BBH": 0.435, + "MATH Level 5": 0.0211, + "GPQA": 0.2727, + "MUSR": 0.4122, + "MMLU-PRO": 0.2645 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-IPO", + "name": "Mistral-7B-Base-SFT-IPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.483, + "BBH": 0.4458, + "MATH Level 5": 0.0287, + "GPQA": 0.2802, + "MUSR": 0.3776, + "MMLU-PRO": 0.2792 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-KTO", + "name": "Mistral-7B-Base-SFT-KTO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4785, + "BBH": 0.4476, + "MATH Level 5": 0.0393, + "GPQA": 0.2903, + "MUSR": 0.4368, + "MMLU-PRO": 0.2872 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-RDPO", + "name": "Mistral-7B-Base-SFT-RDPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4606, + "BBH": 0.444, + "MATH Level 5": 0.0219, + "GPQA": 0.2777, + "MUSR": 0.3579, + "MMLU-PRO": 0.2777 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-RRHF", + "name": "Mistral-7B-Base-SFT-RRHF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4407, + "BBH": 0.4281, + "MATH Level 5": 0.0249, + "GPQA": 0.2903, + "MUSR": 0.4187, + "MMLU-PRO": 0.2398 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-SLiC-HF", + "name": "Mistral-7B-Base-SFT-SLiC-HF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.5127, + "BBH": 0.4422, + "MATH Level 5": 0.0355, + "GPQA": 0.2919, + "MUSR": 0.4261, + "MMLU-PRO": 0.2781 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Base-SFT-SimPO", + "name": "Mistral-7B-Base-SFT-SimPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4701, + "BBH": 0.4398, + "MATH Level 5": 0.0144, + "GPQA": 0.2836, + "MUSR": 0.3971, + "MMLU-PRO": 0.2702 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-CPO", + "name": "Mistral-7B-Instruct-CPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4203, + "BBH": 0.4069, + "MATH Level 5": 0.0204, + "GPQA": 0.2659, + "MUSR": 0.4178, + "MMLU-PRO": 0.2701 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-DPO", + "name": "Mistral-7B-Instruct-DPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.5176, + "BBH": 0.406, + "MATH Level 5": 0.031, + "GPQA": 0.2685, + "MUSR": 0.3833, + "MMLU-PRO": 0.2749 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-IPO", + "name": "Mistral-7B-Instruct-IPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4929, + "BBH": 0.4322, + "MATH Level 5": 0.0204, + "GPQA": 0.2735, + "MUSR": 0.4324, + "MMLU-PRO": 0.2708 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-KTO", + "name": "Mistral-7B-Instruct-KTO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4908, + "BBH": 0.414, + "MATH Level 5": 0.0264, + "GPQA": 0.2735, + "MUSR": 0.3953, + "MMLU-PRO": 0.2812 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-ORPO", + "name": "Mistral-7B-Instruct-ORPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.472, + "BBH": 0.4104, + "MATH Level 5": 0.0295, + "GPQA": 0.2743, + "MUSR": 0.3912, + "MMLU-PRO": 0.2662 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-RDPO", + "name": "Mistral-7B-Instruct-RDPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4887, + "BBH": 0.405, + "MATH Level 5": 0.0249, + "GPQA": 0.2802, + "MUSR": 0.3873, + "MMLU-PRO": 0.2777 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-RRHF", + "name": "Mistral-7B-Instruct-RRHF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.496, + "BBH": 0.419, + "MATH Level 5": 0.0279, + "GPQA": 0.276, + "MUSR": 0.3979, + "MMLU-PRO": 0.2651 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-SLiC-HF", + "name": "Mistral-7B-Instruct-SLiC-HF", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.5115, + "BBH": 0.404, + "MATH Level 5": 0.0174, + "GPQA": 0.2727, + "MUSR": 0.3913, + "MMLU-PRO": 0.2715 + } + }, + { + "model_id": "princeton-nlp/Mistral-7B-Instruct-SimPO", + "name": "Mistral-7B-Instruct-SimPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.4687, + "BBH": 0.4507, + "MATH Level 5": 0.0287, + "GPQA": 0.2785, + "MUSR": 0.4098, + "MMLU-PRO": 0.2797 + } + }, + { + "model_id": "princeton-nlp/Sheared-LLaMA-1.3B", + "name": "Sheared-LLaMA-1.3B", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.2198, + "BBH": 0.3197, + "MATH Level 5": 0.0128, + "GPQA": 0.2399, + "MUSR": 0.3713, + "MMLU-PRO": 0.1171 + } + }, + { + "model_id": "princeton-nlp/Sheared-LLaMA-2.7B", + "name": "Sheared-LLaMA-2.7B", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.2417, + "BBH": 0.3259, + "MATH Level 5": 0.0128, + "GPQA": 0.2752, + "MUSR": 0.3567, + "MMLU-PRO": 0.1187 + } + }, + { + "model_id": "princeton-nlp/gemma-2-9b-it-DPO", + "name": "gemma-2-9b-it-DPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.2769, + "BBH": 0.5941, + "MATH Level 5": 0.0831, + "GPQA": 0.3356, + "MUSR": 0.382, + "MMLU-PRO": 0.3723 + } + }, + { + "model_id": "princeton-nlp/gemma-2-9b-it-SimPO", + "name": "gemma-2-9b-it-SimPO", + "developer": "princeton-nlp", + "scores": { + "IFEval": 0.3207, + "BBH": 0.5839, + "MATH Level 5": 0.071, + "GPQA": 0.3356, + "MUSR": 0.4123, + "MMLU-PRO": 0.3975 + } + }, + { + "model_id": "prithivMLmods/Bellatrix-1.5B-xElite", + "name": "Bellatrix-1.5B-xElite", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.1964, + "BBH": 0.3501, + "MATH Level 5": 0.287, + "GPQA": 0.2785, + "MUSR": 0.3619, + "MMLU-PRO": 0.1657 + } + }, + { + "model_id": "prithivMLmods/Bellatrix-Tiny-1.5B-R1", + "name": "Bellatrix-Tiny-1.5B-R1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3352, + "BBH": 0.4022, + "MATH Level 5": 0.0604, + "GPQA": 0.2987, + "MUSR": 0.3683, + "MMLU-PRO": 0.2751 + } + }, + { + "model_id": "prithivMLmods/Bellatrix-Tiny-1B-v2", + "name": "Bellatrix-Tiny-1B-v2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.151, + "BBH": 0.3268, + "MATH Level 5": 0.0287, + "GPQA": 0.2727, + "MUSR": 0.343, + "MMLU-PRO": 0.1493 + } + }, + { + "model_id": "prithivMLmods/Blaze-14B-xElite", + "name": "Blaze-14B-xElite", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0363, + "BBH": 0.6628, + "MATH Level 5": 0.3693, + "GPQA": 0.3943, + "MUSR": 0.4625, + "MMLU-PRO": 0.5111 + } + }, + { + "model_id": "prithivMLmods/COCO-7B-Instruct-1M", + "name": "COCO-7B-Instruct-1M", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4743, + "BBH": 0.541, + "MATH Level 5": 0.3497, + "GPQA": 0.3079, + "MUSR": 0.4382, + "MMLU-PRO": 0.4186 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Elite", + "name": "Calcium-Opus-14B-Elite", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6052, + "BBH": 0.6317, + "MATH Level 5": 0.4789, + "GPQA": 0.3742, + "MUSR": 0.486, + "MMLU-PRO": 0.5302 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Elite-1M", + "name": "Calcium-Opus-14B-Elite-1M", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5613, + "BBH": 0.6329, + "MATH Level 5": 0.4456, + "GPQA": 0.3523, + "MUSR": 0.4676, + "MMLU-PRO": 0.5152 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Elite-Stock", + "name": "Calcium-Opus-14B-Elite-Stock", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6143, + "BBH": 0.6329, + "MATH Level 5": 0.4668, + "GPQA": 0.3683, + "MUSR": 0.4808, + "MMLU-PRO": 0.5284 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Elite2", + "name": "Calcium-Opus-14B-Elite2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6176, + "BBH": 0.6318, + "MATH Level 5": 0.469, + "GPQA": 0.37, + "MUSR": 0.494, + "MMLU-PRO": 0.5301 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Elite2-R1", + "name": "Calcium-Opus-14B-Elite2-R1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6326, + "BBH": 0.6362, + "MATH Level 5": 0.3338, + "GPQA": 0.3909, + "MUSR": 0.49, + "MMLU-PRO": 0.5248 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Elite3", + "name": "Calcium-Opus-14B-Elite3", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5428, + "BBH": 0.635, + "MATH Level 5": 0.4705, + "GPQA": 0.3708, + "MUSR": 0.4795, + "MMLU-PRO": 0.5335 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Elite4", + "name": "Calcium-Opus-14B-Elite4", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6112, + "BBH": 0.6195, + "MATH Level 5": 0.3625, + "GPQA": 0.3557, + "MUSR": 0.4687, + "MMLU-PRO": 0.5149 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-14B-Merge", + "name": "Calcium-Opus-14B-Merge", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4949, + "BBH": 0.6319, + "MATH Level 5": 0.4637, + "GPQA": 0.3708, + "MUSR": 0.4861, + "MMLU-PRO": 0.5356 + } + }, + { + "model_id": "prithivMLmods/Calcium-Opus-20B-v1", + "name": "Calcium-Opus-20B-v1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3093, + "BBH": 0.599, + "MATH Level 5": 0.3618, + "GPQA": 0.3532, + "MUSR": 0.4943, + "MMLU-PRO": 0.4734 + } + }, + { + "model_id": "prithivMLmods/Codepy-Deepthink-3B", + "name": "Codepy-Deepthink-3B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4327, + "BBH": 0.4259, + "MATH Level 5": 0.1156, + "GPQA": 0.2794, + "MUSR": 0.331, + "MMLU-PRO": 0.309 + } + }, + { + "model_id": "prithivMLmods/Coma-II-14B", + "name": "Coma-II-14B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4168, + "BBH": 0.6321, + "MATH Level 5": 0.5514, + "GPQA": 0.4002, + "MUSR": 0.5351, + "MMLU-PRO": 0.504 + } + }, + { + "model_id": "prithivMLmods/Condor-Opus-14B-Exp", + "name": "Condor-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4043, + "BBH": 0.6154, + "MATH Level 5": 0.5227, + "GPQA": 0.3918, + "MUSR": 0.5194, + "MMLU-PRO": 0.5014 + } + }, + { + "model_id": "prithivMLmods/Cygnus-II-14B", + "name": "Cygnus-II-14B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6184, + "BBH": 0.6661, + "MATH Level 5": 0.4396, + "GPQA": 0.3876, + "MUSR": 0.4688, + "MMLU-PRO": 0.5391 + } + }, + { + "model_id": "prithivMLmods/Deepthink-Llama-3-8B-Preview", + "name": "Deepthink-Llama-3-8B-Preview", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.2955, + "BBH": 0.4665, + "MATH Level 5": 0.355, + "GPQA": 0.3163, + "MUSR": 0.3707, + "MMLU-PRO": 0.2739 + } + }, + { + "model_id": "prithivMLmods/Deepthink-Reasoning-14B", + "name": "Deepthink-Reasoning-14B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5424, + "BBH": 0.6334, + "MATH Level 5": 0.423, + "GPQA": 0.3666, + "MUSR": 0.4732, + "MMLU-PRO": 0.5296 + } + }, + { + "model_id": "prithivMLmods/Deepthink-Reasoning-7B", + "name": "Deepthink-Reasoning-7B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.484, + "BBH": 0.5505, + "MATH Level 5": 0.3346, + "GPQA": 0.2995, + "MUSR": 0.4432, + "MMLU-PRO": 0.4349 + } + }, + { + "model_id": "prithivMLmods/Dinobot-Opus-14B-Exp", + "name": "Dinobot-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.824, + "BBH": 0.637, + "MATH Level 5": 0.5317, + "GPQA": 0.3247, + "MUSR": 0.426, + "MMLU-PRO": 0.4979 + } + }, + { + "model_id": "prithivMLmods/Elita-0.1-Distilled-R1-abliterated", + "name": "Elita-0.1-Distilled-R1-abliterated", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3542, + "BBH": 0.3828, + "MATH Level 5": 0.3066, + "GPQA": 0.2659, + "MUSR": 0.366, + "MMLU-PRO": 0.2758 + } + }, + { + "model_id": "prithivMLmods/Elita-1", + "name": "Elita-1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4906, + "BBH": 0.652, + "MATH Level 5": 0.3429, + "GPQA": 0.3758, + "MUSR": 0.4834, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "prithivMLmods/Epimetheus-14B-Axo", + "name": "Epimetheus-14B-Axo", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5546, + "BBH": 0.6613, + "MATH Level 5": 0.4101, + "GPQA": 0.3926, + "MUSR": 0.482, + "MMLU-PRO": 0.5304 + } + }, + { + "model_id": "prithivMLmods/Equuleus-Opus-14B-Exp", + "name": "Equuleus-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.7001, + "BBH": 0.6434, + "MATH Level 5": 0.4585, + "GPQA": 0.3867, + "MUSR": 0.4952, + "MMLU-PRO": 0.5374 + } + }, + { + "model_id": "prithivMLmods/Eridanus-Opus-14B-r999", + "name": "Eridanus-Opus-14B-r999", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6386, + "BBH": 0.6584, + "MATH Level 5": 0.386, + "GPQA": 0.3943, + "MUSR": 0.4769, + "MMLU-PRO": 0.5362 + } + }, + { + "model_id": "prithivMLmods/Evac-Opus-14B-Exp", + "name": "Evac-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5916, + "BBH": 0.6475, + "MATH Level 5": 0.4215, + "GPQA": 0.3884, + "MUSR": 0.4728, + "MMLU-PRO": 0.5317 + } + }, + { + "model_id": "prithivMLmods/FastThink-0.5B-Tiny", + "name": "FastThink-0.5B-Tiny", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.258, + "BBH": 0.3206, + "MATH Level 5": 0.0204, + "GPQA": 0.2609, + "MUSR": 0.3566, + "MMLU-PRO": 0.1649 + } + }, + { + "model_id": "prithivMLmods/GWQ-9B-Preview", + "name": "GWQ-9B-Preview", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5066, + "BBH": 0.5806, + "MATH Level 5": 0.2266, + "GPQA": 0.3398, + "MUSR": 0.4951, + "MMLU-PRO": 0.3984 + } + }, + { + "model_id": "prithivMLmods/GWQ-9B-Preview2", + "name": "GWQ-9B-Preview2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5209, + "BBH": 0.5797, + "MATH Level 5": 0.2372, + "GPQA": 0.3263, + "MUSR": 0.486, + "MMLU-PRO": 0.3997 + } + }, + { + "model_id": "prithivMLmods/GWQ2b", + "name": "GWQ2b", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4115, + "BBH": 0.4143, + "MATH Level 5": 0.0627, + "GPQA": 0.2827, + "MUSR": 0.4311, + "MMLU-PRO": 0.2473 + } + }, + { + "model_id": "prithivMLmods/Gaea-Opus-14B-Exp", + "name": "Gaea-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5956, + "BBH": 0.656, + "MATH Level 5": 0.4275, + "GPQA": 0.3909, + "MUSR": 0.4859, + "MMLU-PRO": 0.5401 + } + }, + { + "model_id": "prithivMLmods/Galactic-Qwen-14B-Exp1", + "name": "Galactic-Qwen-14B-Exp1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5832, + "BBH": 0.6582, + "MATH Level 5": 0.4018, + "GPQA": 0.3935, + "MUSR": 0.4781, + "MMLU-PRO": 0.5396 + } + }, + { + "model_id": "prithivMLmods/Galactic-Qwen-14B-Exp2", + "name": "Galactic-Qwen-14B-Exp2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.662, + "BBH": 0.7203, + "MATH Level 5": 0.3474, + "GPQA": 0.3993, + "MUSR": 0.5354, + "MMLU-PRO": 0.5691 + } + }, + { + "model_id": "prithivMLmods/Gauss-Opus-14B-R999", + "name": "Gauss-Opus-14B-R999", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3907, + "BBH": 0.6228, + "MATH Level 5": 0.5755, + "GPQA": 0.3918, + "MUSR": 0.5338, + "MMLU-PRO": 0.5007 + } + }, + { + "model_id": "prithivMLmods/Jolt-v0.1", + "name": "Jolt-v0.1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5092, + "BBH": 0.6521, + "MATH Level 5": 0.3565, + "GPQA": 0.38, + "MUSR": 0.4847, + "MMLU-PRO": 0.5386 + } + }, + { + "model_id": "prithivMLmods/Lacerta-Opus-14B-Elite8", + "name": "Lacerta-Opus-14B-Elite8", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6141, + "BBH": 0.6401, + "MATH Level 5": 0.3648, + "GPQA": 0.3784, + "MUSR": 0.4635, + "MMLU-PRO": 0.5322 + } + }, + { + "model_id": "prithivMLmods/Llama-3.1-5B-Instruct", + "name": "Llama-3.1-5B-Instruct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.1407, + "BBH": 0.3051, + "MATH Level 5": 0.0151, + "GPQA": 0.2643, + "MUSR": 0.354, + "MMLU-PRO": 0.1184 + } + }, + { + "model_id": "prithivMLmods/Llama-3.1-8B-Open-SFT", + "name": "Llama-3.1-8B-Open-SFT", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4123, + "BBH": 0.4968, + "MATH Level 5": 0.1216, + "GPQA": 0.3096, + "MUSR": 0.3904, + "MMLU-PRO": 0.3522 + } + }, + { + "model_id": "prithivMLmods/Llama-3.2-3B-Math-Oct", + "name": "Llama-3.2-3B-Math-Oct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4585, + "BBH": 0.4372, + "MATH Level 5": 0.1156, + "GPQA": 0.2584, + "MUSR": 0.347, + "MMLU-PRO": 0.2911 + } + }, + { + "model_id": "prithivMLmods/Llama-3.2-6B-AlgoCode", + "name": "Llama-3.2-6B-AlgoCode", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.2136, + "BBH": 0.3748, + "MATH Level 5": 0.0136, + "GPQA": 0.2869, + "MUSR": 0.4013, + "MMLU-PRO": 0.1798 + } + }, + { + "model_id": "prithivMLmods/Llama-8B-Distill-CoT", + "name": "Llama-8B-Distill-CoT", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3342, + "BBH": 0.4298, + "MATH Level 5": 0.4003, + "GPQA": 0.2894, + "MUSR": 0.372, + "MMLU-PRO": 0.2732 + } + }, + { + "model_id": "prithivMLmods/Llama-Deepsync-1B", + "name": "Llama-Deepsync-1B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.357, + "BBH": 0.3386, + "MATH Level 5": 0.0438, + "GPQA": 0.2601, + "MUSR": 0.3565, + "MMLU-PRO": 0.1738 + } + }, + { + "model_id": "prithivMLmods/Llama-Deepsync-3B", + "name": "Llama-Deepsync-3B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4302, + "BBH": 0.4292, + "MATH Level 5": 0.1178, + "GPQA": 0.2718, + "MUSR": 0.3324, + "MMLU-PRO": 0.3031 + } + }, + { + "model_id": "prithivMLmods/Llama-Express.1-Math", + "name": "Llama-Express.1-Math", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5084, + "BBH": 0.3364, + "MATH Level 5": 0.0559, + "GPQA": 0.2634, + "MUSR": 0.3143, + "MMLU-PRO": 0.161 + } + }, + { + "model_id": "prithivMLmods/LwQ-10B-Instruct", + "name": "LwQ-10B-Instruct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3935, + "BBH": 0.5122, + "MATH Level 5": 0.04, + "GPQA": 0.3121, + "MUSR": 0.4544, + "MMLU-PRO": 0.3318 + } + }, + { + "model_id": "prithivMLmods/LwQ-Reasoner-10B", + "name": "LwQ-Reasoner-10B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.2941, + "BBH": 0.5866, + "MATH Level 5": 0.358, + "GPQA": 0.3465, + "MUSR": 0.4079, + "MMLU-PRO": 0.4147 + } + }, + { + "model_id": "prithivMLmods/Magellanic-Opus-14B-Exp", + "name": "Magellanic-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6866, + "BBH": 0.6383, + "MATH Level 5": 0.3799, + "GPQA": 0.3742, + "MUSR": 0.4926, + "MMLU-PRO": 0.5273 + } + }, + { + "model_id": "prithivMLmods/Magellanic-Qwen-25B-R999", + "name": "Magellanic-Qwen-25B-R999", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.1873, + "BBH": 0.2608, + "MATH Level 5": 0.0053, + "GPQA": 0.2508, + "MUSR": 0.3831, + "MMLU-PRO": 0.13 + } + }, + { + "model_id": "prithivMLmods/Megatron-Corpus-14B-Exp", + "name": "Megatron-Corpus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4983, + "BBH": 0.6355, + "MATH Level 5": 0.3429, + "GPQA": 0.3633, + "MUSR": 0.4767, + "MMLU-PRO": 0.526 + } + }, + { + "model_id": "prithivMLmods/Megatron-Corpus-14B-Exp.v2", + "name": "Megatron-Corpus-14B-Exp.v2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.487, + "BBH": 0.6321, + "MATH Level 5": 0.2591, + "GPQA": 0.3423, + "MUSR": 0.449, + "MMLU-PRO": 0.481 + } + }, + { + "model_id": "prithivMLmods/Megatron-Opus-14B-2.0", + "name": "Megatron-Opus-14B-2.0", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6694, + "BBH": 0.6871, + "MATH Level 5": 0.2779, + "GPQA": 0.3591, + "MUSR": 0.414, + "MMLU-PRO": 0.517 + } + }, + { + "model_id": "prithivMLmods/Megatron-Opus-14B-2.1", + "name": "Megatron-Opus-14B-2.1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0246, + "BBH": 0.6727, + "MATH Level 5": 0.2998, + "GPQA": 0.3834, + "MUSR": 0.4928, + "MMLU-PRO": 0.5174 + } + }, + { + "model_id": "prithivMLmods/Megatron-Opus-14B-Exp", + "name": "Megatron-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4979, + "BBH": 0.6516, + "MATH Level 5": 0.3535, + "GPQA": 0.375, + "MUSR": 0.4887, + "MMLU-PRO": 0.5401 + } + }, + { + "model_id": "prithivMLmods/Megatron-Opus-14B-Stock", + "name": "Megatron-Opus-14B-Stock", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5174, + "BBH": 0.6412, + "MATH Level 5": 0.3346, + "GPQA": 0.375, + "MUSR": 0.482, + "MMLU-PRO": 0.5293 + } + }, + { + "model_id": "prithivMLmods/Megatron-Opus-7B-Exp", + "name": "Megatron-Opus-7B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6017, + "BBH": 0.5367, + "MATH Level 5": 0.1971, + "GPQA": 0.3112, + "MUSR": 0.4186, + "MMLU-PRO": 0.39 + } + }, + { + "model_id": "prithivMLmods/Messier-Opus-14B-Elite7", + "name": "Messier-Opus-14B-Elite7", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.7113, + "BBH": 0.6499, + "MATH Level 5": 0.4071, + "GPQA": 0.3909, + "MUSR": 0.4886, + "MMLU-PRO": 0.5404 + } + }, + { + "model_id": "prithivMLmods/Omni-Reasoner-Merged", + "name": "Omni-Reasoner-Merged", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4599, + "BBH": 0.5508, + "MATH Level 5": 0.3331, + "GPQA": 0.3037, + "MUSR": 0.4616, + "MMLU-PRO": 0.4364 + } + }, + { + "model_id": "prithivMLmods/Omni-Reasoner3-Merged", + "name": "Omni-Reasoner3-Merged", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4935, + "BBH": 0.4388, + "MATH Level 5": 0.1088, + "GPQA": 0.2643, + "MUSR": 0.3522, + "MMLU-PRO": 0.295 + } + }, + { + "model_id": "prithivMLmods/Pegasus-Opus-14B-Exp", + "name": "Pegasus-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6982, + "BBH": 0.6548, + "MATH Level 5": 0.4086, + "GPQA": 0.3951, + "MUSR": 0.486, + "MMLU-PRO": 0.5412 + } + }, + { + "model_id": "prithivMLmods/Phi-4-Empathetic", + "name": "Phi-4-Empathetic", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0497, + "BBH": 0.6727, + "MATH Level 5": 0.2621, + "GPQA": 0.38, + "MUSR": 0.4991, + "MMLU-PRO": 0.5066 + } + }, + { + "model_id": "prithivMLmods/Phi-4-Math-IO", + "name": "Phi-4-Math-IO", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.059, + "BBH": 0.6668, + "MATH Level 5": 0.4577, + "GPQA": 0.3985, + "MUSR": 0.4873, + "MMLU-PRO": 0.5205 + } + }, + { + "model_id": "prithivMLmods/Phi-4-QwQ", + "name": "Phi-4-QwQ", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0559, + "BBH": 0.6696, + "MATH Level 5": 0.4577, + "GPQA": 0.3909, + "MUSR": 0.4651, + "MMLU-PRO": 0.5275 + } + }, + { + "model_id": "prithivMLmods/Phi-4-Super", + "name": "Phi-4-Super", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0481, + "BBH": 0.672, + "MATH Level 5": 0.3489, + "GPQA": 0.3943, + "MUSR": 0.5044, + "MMLU-PRO": 0.5266 + } + }, + { + "model_id": "prithivMLmods/Phi-4-Super-1", + "name": "Phi-4-Super-1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0418, + "BBH": 0.6729, + "MATH Level 5": 0.352, + "GPQA": 0.3935, + "MUSR": 0.5017, + "MMLU-PRO": 0.5235 + } + }, + { + "model_id": "prithivMLmods/Phi-4-Super-o1", + "name": "Phi-4-Super-o1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0418, + "BBH": 0.6729, + "MATH Level 5": 0.352, + "GPQA": 0.3935, + "MUSR": 0.5017, + "MMLU-PRO": 0.5235 + } + }, + { + "model_id": "prithivMLmods/Phi-4-o1", + "name": "Phi-4-o1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.029, + "BBH": 0.6689, + "MATH Level 5": 0.3995, + "GPQA": 0.3826, + "MUSR": 0.4978, + "MMLU-PRO": 0.5174 + } + }, + { + "model_id": "prithivMLmods/Phi4-Super", + "name": "Phi4-Super", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.0481, + "BBH": 0.672, + "MATH Level 5": 0.3489, + "GPQA": 0.3943, + "MUSR": 0.5044, + "MMLU-PRO": 0.5266 + } + }, + { + "model_id": "prithivMLmods/Porpoise-Opus-14B-Exp", + "name": "Porpoise-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.7098, + "BBH": 0.6519, + "MATH Level 5": 0.4041, + "GPQA": 0.3935, + "MUSR": 0.4926, + "MMLU-PRO": 0.5396 + } + }, + { + "model_id": "prithivMLmods/Primal-Opus-14B-Optimus-v1", + "name": "Primal-Opus-14B-Optimus-v1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5013, + "BBH": 0.6419, + "MATH Level 5": 0.3384, + "GPQA": 0.3725, + "MUSR": 0.4847, + "MMLU-PRO": 0.5259 + } + }, + { + "model_id": "prithivMLmods/Primal-Opus-14B-Optimus-v2", + "name": "Primal-Opus-14B-Optimus-v2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6404, + "BBH": 0.6544, + "MATH Level 5": 0.4207, + "GPQA": 0.3918, + "MUSR": 0.49, + "MMLU-PRO": 0.5422 + } + }, + { + "model_id": "prithivMLmods/QwQ-LCoT-14B-Conversational", + "name": "QwQ-LCoT-14B-Conversational", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4047, + "BBH": 0.624, + "MATH Level 5": 0.4653, + "GPQA": 0.3498, + "MUSR": 0.4847, + "MMLU-PRO": 0.5278 + } + }, + { + "model_id": "prithivMLmods/QwQ-LCoT-3B-Instruct", + "name": "QwQ-LCoT-3B-Instruct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4354, + "BBH": 0.4763, + "MATH Level 5": 0.2825, + "GPQA": 0.2819, + "MUSR": 0.4358, + "MMLU-PRO": 0.3582 + } + }, + { + "model_id": "prithivMLmods/QwQ-LCoT-7B-Instruct", + "name": "QwQ-LCoT-7B-Instruct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4987, + "BBH": 0.5466, + "MATH Level 5": 0.3716, + "GPQA": 0.302, + "MUSR": 0.4802, + "MMLU-PRO": 0.4334 + } + }, + { + "model_id": "prithivMLmods/QwQ-LCoT1-Merged", + "name": "QwQ-LCoT1-Merged", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4751, + "BBH": 0.5481, + "MATH Level 5": 0.3731, + "GPQA": 0.307, + "MUSR": 0.4696, + "MMLU-PRO": 0.4358 + } + }, + { + "model_id": "prithivMLmods/QwQ-LCoT2-7B-Instruct", + "name": "QwQ-LCoT2-7B-Instruct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5561, + "BBH": 0.5425, + "MATH Level 5": 0.327, + "GPQA": 0.2978, + "MUSR": 0.4564, + "MMLU-PRO": 0.4342 + } + }, + { + "model_id": "prithivMLmods/QwQ-MathOct-7B", + "name": "QwQ-MathOct-7B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4684, + "BBH": 0.5486, + "MATH Level 5": 0.2953, + "GPQA": 0.3029, + "MUSR": 0.4601, + "MMLU-PRO": 0.433 + } + }, + { + "model_id": "prithivMLmods/QwQ-R1-Distill-1.5B-CoT", + "name": "QwQ-R1-Distill-1.5B-CoT", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.2194, + "BBH": 0.3666, + "MATH Level 5": 0.3346, + "GPQA": 0.2861, + "MUSR": 0.3434, + "MMLU-PRO": 0.1913 + } + }, + { + "model_id": "prithivMLmods/QwQ-R1-Distill-7B-CoT", + "name": "QwQ-R1-Distill-7B-CoT", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.35, + "BBH": 0.4388, + "MATH Level 5": 0.4683, + "GPQA": 0.2936, + "MUSR": 0.3779, + "MMLU-PRO": 0.2804 + } + }, + { + "model_id": "prithivMLmods/Qwen-7B-Distill-Reasoner", + "name": "Qwen-7B-Distill-Reasoner", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3396, + "BBH": 0.4409, + "MATH Level 5": 0.395, + "GPQA": 0.3272, + "MUSR": 0.366, + "MMLU-PRO": 0.2818 + } + }, + { + "model_id": "prithivMLmods/Qwen2.5-1.5B-DeepSeek-R1-Instruct", + "name": "Qwen2.5-1.5B-DeepSeek-R1-Instruct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.1397, + "BBH": 0.2824, + "MATH Level 5": 0.0, + "GPQA": 0.276, + "MUSR": 0.3724, + "MMLU-PRO": 0.1123 + } + }, + { + "model_id": "prithivMLmods/Qwen2.5-14B-DeepSeek-R1-1M", + "name": "Qwen2.5-14B-DeepSeek-R1-1M", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4193, + "BBH": 0.5935, + "MATH Level 5": 0.5128, + "GPQA": 0.3322, + "MUSR": 0.4606, + "MMLU-PRO": 0.4899 + } + }, + { + "model_id": "prithivMLmods/Qwen2.5-7B-DeepSeek-R1-1M", + "name": "Qwen2.5-7B-DeepSeek-R1-1M", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.1861, + "BBH": 0.3126, + "MATH Level 5": 0.0151, + "GPQA": 0.2617, + "MUSR": 0.3417, + "MMLU-PRO": 0.1201 + } + }, + { + "model_id": "prithivMLmods/SmolLM2-CoT-360M", + "name": "SmolLM2-CoT-360M", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.2216, + "BBH": 0.3135, + "MATH Level 5": 0.0204, + "GPQA": 0.2366, + "MUSR": 0.3794, + "MMLU-PRO": 0.1085 + } + }, + { + "model_id": "prithivMLmods/Sombrero-Opus-14B-Elite5", + "name": "Sombrero-Opus-14B-Elite5", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.7881, + "BBH": 0.6502, + "MATH Level 5": 0.5355, + "GPQA": 0.3364, + "MUSR": 0.4287, + "MMLU-PRO": 0.52 + } + }, + { + "model_id": "prithivMLmods/Sombrero-Opus-14B-Elite6", + "name": "Sombrero-Opus-14B-Elite6", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.7226, + "BBH": 0.6488, + "MATH Level 5": 0.4079, + "GPQA": 0.3935, + "MUSR": 0.4886, + "MMLU-PRO": 0.539 + } + }, + { + "model_id": "prithivMLmods/Sombrero-Opus-14B-Sm1", + "name": "Sombrero-Opus-14B-Sm1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3813, + "BBH": 0.6355, + "MATH Level 5": 0.5665, + "GPQA": 0.4035, + "MUSR": 0.5299, + "MMLU-PRO": 0.5125 + } + }, + { + "model_id": "prithivMLmods/Sombrero-Opus-14B-Sm2", + "name": "Sombrero-Opus-14B-Sm2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4272, + "BBH": 0.6609, + "MATH Level 5": 0.4864, + "GPQA": 0.3884, + "MUSR": 0.5088, + "MMLU-PRO": 0.5345 + } + }, + { + "model_id": "prithivMLmods/Sombrero-Opus-14B-Sm4", + "name": "Sombrero-Opus-14B-Sm4", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4347, + "BBH": 0.6613, + "MATH Level 5": 0.4879, + "GPQA": 0.3951, + "MUSR": 0.5192, + "MMLU-PRO": 0.53 + } + }, + { + "model_id": "prithivMLmods/Sombrero-Opus-14B-Sm5", + "name": "Sombrero-Opus-14B-Sm5", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6852, + "BBH": 0.6564, + "MATH Level 5": 0.4094, + "GPQA": 0.3867, + "MUSR": 0.4806, + "MMLU-PRO": 0.54 + } + }, + { + "model_id": "prithivMLmods/Sqweeks-7B-Instruct", + "name": "Sqweeks-7B-Instruct", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.2158, + "BBH": 0.4667, + "MATH Level 5": 0.5144, + "GPQA": 0.307, + "MUSR": 0.4476, + "MMLU-PRO": 0.3133 + } + }, + { + "model_id": "prithivMLmods/Tadpole-Opus-14B-Exp", + "name": "Tadpole-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.575, + "BBH": 0.6369, + "MATH Level 5": 0.3134, + "GPQA": 0.3859, + "MUSR": 0.4728, + "MMLU-PRO": 0.5322 + } + }, + { + "model_id": "prithivMLmods/Taurus-Opus-7B", + "name": "Taurus-Opus-7B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4223, + "BBH": 0.5367, + "MATH Level 5": 0.2168, + "GPQA": 0.3263, + "MUSR": 0.4399, + "MMLU-PRO": 0.3951 + } + }, + { + "model_id": "prithivMLmods/Triangulum-10B", + "name": "Triangulum-10B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.3229, + "BBH": 0.5968, + "MATH Level 5": 0.355, + "GPQA": 0.354, + "MUSR": 0.4172, + "MMLU-PRO": 0.4178 + } + }, + { + "model_id": "prithivMLmods/Triangulum-5B", + "name": "Triangulum-5B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.1283, + "BBH": 0.3124, + "MATH Level 5": 0.0106, + "GPQA": 0.255, + "MUSR": 0.3445, + "MMLU-PRO": 0.1223 + } + }, + { + "model_id": "prithivMLmods/Triangulum-v2-10B", + "name": "Triangulum-v2-10B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6705, + "BBH": 0.6065, + "MATH Level 5": 0.2447, + "GPQA": 0.3372, + "MUSR": 0.4281, + "MMLU-PRO": 0.4466 + } + }, + { + "model_id": "prithivMLmods/Tucana-Opus-14B-r999", + "name": "Tucana-Opus-14B-r999", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6067, + "BBH": 0.6557, + "MATH Level 5": 0.4063, + "GPQA": 0.3918, + "MUSR": 0.473, + "MMLU-PRO": 0.5384 + } + }, + { + "model_id": "prithivMLmods/Tulu-MathLingo-8B", + "name": "Tulu-MathLingo-8B", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5589, + "BBH": 0.4659, + "MATH Level 5": 0.145, + "GPQA": 0.2903, + "MUSR": 0.3864, + "MMLU-PRO": 0.3044 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-7B-Elite14", + "name": "Viper-Coder-7B-Elite14", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.1488, + "BBH": 0.2829, + "MATH Level 5": 0.0106, + "GPQA": 0.255, + "MUSR": 0.3422, + "MMLU-PRO": 0.1089 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-Hybrid-v1.2", + "name": "Viper-Coder-Hybrid-v1.2", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6736, + "BBH": 0.6391, + "MATH Level 5": 0.3331, + "GPQA": 0.3742, + "MUSR": 0.4822, + "MMLU-PRO": 0.5243 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-Hybrid-v1.3", + "name": "Viper-Coder-Hybrid-v1.3", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.7555, + "BBH": 0.6471, + "MATH Level 5": 0.4517, + "GPQA": 0.3381, + "MUSR": 0.4403, + "MMLU-PRO": 0.5097 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-HybridMini-v1.3", + "name": "Viper-Coder-HybridMini-v1.3", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.6104, + "BBH": 0.5365, + "MATH Level 5": 0.463, + "GPQA": 0.3171, + "MUSR": 0.4505, + "MMLU-PRO": 0.4352 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-v0.1", + "name": "Viper-Coder-v0.1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5521, + "BBH": 0.6143, + "MATH Level 5": 0.327, + "GPQA": 0.354, + "MUSR": 0.4394, + "MMLU-PRO": 0.3928 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-v1.1", + "name": "Viper-Coder-v1.1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4432, + "BBH": 0.6492, + "MATH Level 5": 0.5461, + "GPQA": 0.401, + "MUSR": 0.5219, + "MMLU-PRO": 0.5232 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-v1.6-r999", + "name": "Viper-Coder-v1.6-r999", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4433, + "BBH": 0.6492, + "MATH Level 5": 0.5657, + "GPQA": 0.401, + "MUSR": 0.5219, + "MMLU-PRO": 0.5232 + } + }, + { + "model_id": "prithivMLmods/Viper-Coder-v1.7-Vsm6", + "name": "Viper-Coder-v1.7-Vsm6", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5004, + "BBH": 0.6502, + "MATH Level 5": 0.4645, + "GPQA": 0.3968, + "MUSR": 0.4768, + "MMLU-PRO": 0.5288 + } + }, + { + "model_id": "prithivMLmods/Viper-OneCoder-UIGEN", + "name": "Viper-OneCoder-UIGEN", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.4692, + "BBH": 0.6047, + "MATH Level 5": 0.3867, + "GPQA": 0.3423, + "MUSR": 0.4514, + "MMLU-PRO": 0.3904 + } + }, + { + "model_id": "prithivMLmods/Volans-Opus-14B-Exp", + "name": "Volans-Opus-14B-Exp", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5868, + "BBH": 0.6521, + "MATH Level 5": 0.4252, + "GPQA": 0.3851, + "MUSR": 0.4872, + "MMLU-PRO": 0.5385 + } + }, + { + "model_id": "prithivMLmods/WebMind-7B-v0.1", + "name": "WebMind-7B-v0.1", + "developer": "prithivMLmods", + "scores": { + "IFEval": 0.5278, + "BBH": 0.5434, + "MATH Level 5": 0.3648, + "GPQA": 0.3171, + "MUSR": 0.4537, + "MMLU-PRO": 0.4279 + } + }, + { + "model_id": "pszemraj/Llama-3-6.3b-v0.1", + "name": "Llama-3-6.3b-v0.1", + "developer": "pszemraj", + "scores": { + "IFEval": 0.1044, + "BBH": 0.4197, + "MATH Level 5": 0.0211, + "GPQA": 0.2836, + "MUSR": 0.3908, + "MMLU-PRO": 0.284 + } + }, + { + "model_id": "pszemraj/Mistral-v0.3-6B", + "name": "Mistral-v0.3-6B", + "developer": "pszemraj", + "scores": { + "IFEval": 0.2454, + "BBH": 0.3774, + "MATH Level 5": 0.0136, + "GPQA": 0.2651, + "MUSR": 0.3908, + "MMLU-PRO": 0.2143 + } + }, + { + "model_id": "qingy2019/LLaMa_3.2_3B_Catalysts", + "name": "LLaMa_3.2_3B_Catalysts", + "developer": "qingy2019", + "scores": { + "IFEval": 0.4992, + "BBH": 0.4468, + "MATH Level 5": 0.1292, + "GPQA": 0.2886, + "MUSR": 0.3788, + "MMLU-PRO": 0.3008 + } + }, + { + "model_id": "qingy2019/OpenMath2-Llama3.1-8B", + "name": "OpenMath2-Llama3.1-8B", + "developer": "qingy2019", + "scores": { + "IFEval": 0.2331, + "BBH": 0.4096, + "MATH Level 5": 0.2674, + "GPQA": 0.2651, + "MUSR": 0.3436, + "MMLU-PRO": 0.1553 + } + }, + { + "model_id": "qingy2019/Oracle-14B", + "name": "Oracle-14B", + "developer": "qingy2019", + "scores": { + "IFEval": 0.2358, + "BBH": 0.4612, + "MATH Level 5": 0.0642, + "GPQA": 0.2576, + "MUSR": 0.3717, + "MMLU-PRO": 0.2382 + } + }, + { + "model_id": "qingy2019/Qwen2.5-Math-14B-Instruct", + "name": "Qwen2.5-Math-14B-Instruct", + "developer": "qingy2019", + "scores": { + "IFEval": 0.6066, + "BBH": 0.635, + "MATH Level 5": 0.3716, + "GPQA": 0.3725, + "MUSR": 0.4757, + "MMLU-PRO": 0.5331 + } + }, + { + "model_id": "qingy2019/Qwen2.5-Math-14B-Instruct-Alpha", + "name": "Qwen2.5-Math-14B-Instruct-Alpha", + "developer": "qingy2019", + "scores": { + "IFEval": 0.5981, + "BBH": 0.6375, + "MATH Level 5": 0.3142, + "GPQA": 0.37, + "MUSR": 0.4649, + "MMLU-PRO": 0.5331 + } + }, + { + "model_id": "qingy2019/Qwen2.5-Math-14B-Instruct-Pro", + "name": "Qwen2.5-Math-14B-Instruct-Pro", + "developer": "qingy2019", + "scores": { + "IFEval": 0.1922, + "BBH": 0.5319, + "MATH Level 5": 0.284, + "GPQA": 0.3112, + "MUSR": 0.374, + "MMLU-PRO": 0.3558 + } + }, + { + "model_id": "qingy2019/Qwen2.5-Ultimate-14B-Instruct", + "name": "Qwen2.5-Ultimate-14B-Instruct", + "developer": "qingy2019", + "scores": { + "IFEval": 0.3938, + "BBH": 0.5842, + "MATH Level 5": 0.2893, + "GPQA": 0.3565, + "MUSR": 0.4135, + "MMLU-PRO": 0.4929 + } + }, + { + "model_id": "qingy2024/Benchmaxx-Llama-3.2-1B-Instruct", + "name": "Benchmaxx-Llama-3.2-1B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.2014, + "BBH": 0.8269, + "MATH Level 5": 0.4804, + "GPQA": 0.2836, + "MUSR": 0.3446, + "MMLU-PRO": 0.1113 + } + }, + { + "model_id": "qingy2024/Eyas-17B-Instruct", + "name": "Eyas-17B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.6575, + "BBH": 0.6085, + "MATH Level 5": 0.247, + "GPQA": 0.3146, + "MUSR": 0.4522, + "MMLU-PRO": 0.4343 + } + }, + { + "model_id": "qingy2024/Falcon3-2x10B-MoE-Instruct", + "name": "Falcon3-2x10B-MoE-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.785, + "BBH": 0.6185, + "MATH Level 5": 0.2795, + "GPQA": 0.3305, + "MUSR": 0.4284, + "MMLU-PRO": 0.4423 + } + }, + { + "model_id": "qingy2024/Fusion-14B-Instruct", + "name": "Fusion-14B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.726, + "BBH": 0.6396, + "MATH Level 5": 0.3369, + "GPQA": 0.3549, + "MUSR": 0.44, + "MMLU-PRO": 0.5044 + } + }, + { + "model_id": "qingy2024/Fusion2-14B-Instruct", + "name": "Fusion2-14B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.6064, + "BBH": 0.6119, + "MATH Level 5": 0.3127, + "GPQA": 0.3448, + "MUSR": 0.4634, + "MMLU-PRO": 0.5051 + } + }, + { + "model_id": "qingy2024/Fusion4-14B-Instruct", + "name": "Fusion4-14B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.7649, + "BBH": 0.6543, + "MATH Level 5": 0.3882, + "GPQA": 0.3305, + "MUSR": 0.4326, + "MMLU-PRO": 0.5194 + } + }, + { + "model_id": "qingy2024/OwO-14B-Instruct", + "name": "OwO-14B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.1383, + "BBH": 0.6165, + "MATH Level 5": 0.4162, + "GPQA": 0.3641, + "MUSR": 0.4407, + "MMLU-PRO": 0.5181 + } + }, + { + "model_id": "qingy2024/QwEnlarge-16B-Instruct", + "name": "QwEnlarge-16B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.7802, + "BBH": 0.5949, + "MATH Level 5": 0.46, + "GPQA": 0.3331, + "MUSR": 0.4101, + "MMLU-PRO": 0.4476 + } + }, + { + "model_id": "qingy2024/QwQ-14B-Math-v0.2", + "name": "QwQ-14B-Math-v0.2", + "developer": "qingy2024", + "scores": { + "IFEval": 0.3391, + "BBH": 0.5731, + "MATH Level 5": 0.4811, + "GPQA": 0.2626, + "MUSR": 0.4021, + "MMLU-PRO": 0.48 + } + }, + { + "model_id": "qingy2024/Qwarkstar-4B", + "name": "Qwarkstar-4B", + "developer": "qingy2024", + "scores": { + "IFEval": 0.1994, + "BBH": 0.4015, + "MATH Level 5": 0.0861, + "GPQA": 0.3247, + "MUSR": 0.4428, + "MMLU-PRO": 0.2425 + } + }, + { + "model_id": "qingy2024/Qwarkstar-4B-Instruct-Preview", + "name": "Qwarkstar-4B-Instruct-Preview", + "developer": "qingy2024", + "scores": { + "IFEval": 0.5324, + "BBH": 0.4358, + "MATH Level 5": 0.1284, + "GPQA": 0.2802, + "MUSR": 0.3896, + "MMLU-PRO": 0.2502 + } + }, + { + "model_id": "qingy2024/Qwen2.5-4B", + "name": "Qwen2.5-4B", + "developer": "qingy2024", + "scores": { + "IFEval": 0.2158, + "BBH": 0.4269, + "MATH Level 5": 0.0514, + "GPQA": 0.2911, + "MUSR": 0.461, + "MMLU-PRO": 0.2525 + } + }, + { + "model_id": "qingy2024/Qwen2.5-Coder-Draft-1.5B-Instruct", + "name": "Qwen2.5-Coder-Draft-1.5B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.4125, + "BBH": 0.3837, + "MATH Level 5": 0.1579, + "GPQA": 0.2601, + "MUSR": 0.358, + "MMLU-PRO": 0.2244 + } + }, + { + "model_id": "qingy2024/Qwen2.5-Math-14B-Instruct-Alpha", + "name": "Qwen2.5-Math-14B-Instruct-Alpha", + "developer": "qingy2024", + "scores": { + "IFEval": 0.7704, + "BBH": 0.6465, + "MATH Level 5": 0.429, + "GPQA": 0.349, + "MUSR": 0.4021, + "MMLU-PRO": 0.4966 + } + }, + { + "model_id": "qingy2024/Qwen2.5-Math-14B-Instruct-Preview", + "name": "Qwen2.5-Math-14B-Instruct-Preview", + "developer": "qingy2024", + "scores": { + "IFEval": 0.7826, + "BBH": 0.6294, + "MATH Level 5": 0.4758, + "GPQA": 0.3406, + "MUSR": 0.4115, + "MMLU-PRO": 0.4993 + } + }, + { + "model_id": "qingy2024/Qwen2.6-14B-Instruct", + "name": "Qwen2.6-14B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.5811, + "BBH": 0.6394, + "MATH Level 5": 0.3051, + "GPQA": 0.3792, + "MUSR": 0.4569, + "MMLU-PRO": 0.5285 + } + }, + { + "model_id": "qingy2024/Qwen2.6-Math-14B-Instruct", + "name": "Qwen2.6-Math-14B-Instruct", + "developer": "qingy2024", + "scores": { + "IFEval": 0.3862, + "BBH": 0.6324, + "MATH Level 5": 0.429, + "GPQA": 0.37, + "MUSR": 0.4759, + "MMLU-PRO": 0.5241 + } + }, + { + "model_id": "qq8933/OpenLongCoT-Base-Gemma2-2B", + "name": "OpenLongCoT-Base-Gemma2-2B", + "developer": "qq8933", + "scores": { + "IFEval": 0.1965, + "BBH": 0.3106, + "MATH Level 5": 0.0234, + "GPQA": 0.2626, + "MUSR": 0.3222, + "MMLU-PRO": 0.1316 + } + }, + { + "model_id": "raphgg/test-2.5-72B", + "name": "test-2.5-72B", + "developer": "raphgg", + "scores": { + "IFEval": 0.8437, + "BBH": 0.7266, + "MATH Level 5": 0.4109, + "GPQA": 0.3893, + "MUSR": 0.4812, + "MMLU-PRO": 0.5837 + } + }, + { + "model_id": "rasyosef/Mistral-NeMo-Minitron-8B-Chat", + "name": "Mistral-NeMo-Minitron-8B-Chat", + "developer": "rasyosef", + "scores": { + "IFEval": 0.4452, + "BBH": 0.4759, + "MATH Level 5": 0.0272, + "GPQA": 0.276, + "MUSR": 0.4304, + "MMLU-PRO": 0.2404 + } + }, + { + "model_id": "rasyosef/Phi-1_5-Instruct-v0.1", + "name": "Phi-1_5-Instruct-v0.1", + "developer": "rasyosef", + "scores": { + "IFEval": 0.2402, + "BBH": 0.3118, + "MATH Level 5": 0.0136, + "GPQA": 0.2601, + "MUSR": 0.3422, + "MMLU-PRO": 0.1562 + } + }, + { + "model_id": "rasyosef/phi-2-instruct-apo", + "name": "phi-2-instruct-apo", + "developer": "rasyosef", + "scores": { + "IFEval": 0.3146, + "BBH": 0.4445, + "MATH Level 5": 0.0302, + "GPQA": 0.2701, + "MUSR": 0.3342, + "MMLU-PRO": 0.2155 + } + }, + { + "model_id": "rasyosef/phi-2-instruct-v0.1", + "name": "phi-2-instruct-v0.1", + "developer": "rasyosef", + "scores": { + "IFEval": 0.3681, + "BBH": 0.4726, + "MATH Level 5": 0.0, + "GPQA": 0.2743, + "MUSR": 0.3524, + "MMLU-PRO": 0.2247 + } + }, + { + "model_id": "realtreetune/rho-1b-sft-MATH", + "name": "rho-1b-sft-MATH", + "developer": "realtreetune", + "scores": { + "IFEval": 0.2121, + "BBH": 0.3144, + "MATH Level 5": 0.0347, + "GPQA": 0.2525, + "MUSR": 0.3458, + "MMLU-PRO": 0.1117 + } + }, + { + "model_id": "recoilme/Gemma-2-Ataraxy-Gemmasutra-9B-slerp", + "name": "Gemma-2-Ataraxy-Gemmasutra-9B-slerp", + "developer": "recoilme", + "scores": { + "IFEval": 0.7649, + "BBH": 0.5974, + "MATH Level 5": 0.0174, + "GPQA": 0.3305, + "MUSR": 0.4245, + "MMLU-PRO": 0.4207 + } + }, + { + "model_id": "recoilme/recoilme-gemma-2-9B-v0.1", + "name": "recoilme-gemma-2-9B-v0.1", + "developer": "recoilme", + "scores": { + "IFEval": 0.7515, + "BBH": 0.5995, + "MATH Level 5": 0.2039, + "GPQA": 0.3389, + "MUSR": 0.4191, + "MMLU-PRO": 0.4159 + } + }, + { + "model_id": "recoilme/recoilme-gemma-2-9B-v0.2", + "name": "recoilme-gemma-2-9B-v0.2", + "developer": "recoilme", + "scores": { + "IFEval": 0.2747, + "BBH": 0.6031, + "MATH Level 5": 0.0831, + "GPQA": 0.3305, + "MUSR": 0.4686, + "MMLU-PRO": 0.4122 + } + }, + { + "model_id": "recoilme/recoilme-gemma-2-9B-v0.3", + "name": "recoilme-gemma-2-9B-v0.3", + "developer": "recoilme", + "scores": { + "IFEval": 0.7439, + "BBH": 0.5993, + "MATH Level 5": 0.0876, + "GPQA": 0.3238, + "MUSR": 0.4204, + "MMLU-PRO": 0.4072 + } + }, + { + "model_id": "recoilme/recoilme-gemma-2-9B-v0.4", + "name": "recoilme-gemma-2-9B-v0.4", + "developer": "recoilme", + "scores": { + "IFEval": 0.2562, + "BBH": 0.5967, + "MATH Level 5": 0.0846, + "GPQA": 0.3406, + "MUSR": 0.4727, + "MMLU-PRO": 0.4406 + } + }, + { + "model_id": "recoilme/recoilme-gemma-2-9B-v0.5", + "name": "recoilme-gemma-2-9B-v0.5", + "developer": "recoilme", + "scores": { + "IFEval": 0.7664, + "BBH": 0.5981, + "MATH Level 5": 0.2115, + "GPQA": 0.3364, + "MUSR": 0.4232, + "MMLU-PRO": 0.42 + } + }, + { + "model_id": "redrix/AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS", + "name": "AngelSlayer-12B-Unslop-Mell-RPMax-DARKNESS", + "developer": "redrix", + "scores": { + "IFEval": 0.536, + "BBH": 0.5129, + "MATH Level 5": 0.1133, + "GPQA": 0.3154, + "MUSR": 0.3818, + "MMLU-PRO": 0.318 + } + }, + { + "model_id": "redrix/patricide-12B-Unslop-Mell", + "name": "patricide-12B-Unslop-Mell", + "developer": "redrix", + "scores": { + "IFEval": 0.4074, + "BBH": 0.5399, + "MATH Level 5": 0.1314, + "GPQA": 0.3238, + "MUSR": 0.4026, + "MMLU-PRO": 0.357 + } + }, + { + "model_id": "refuelai/Llama-3-Refueled", + "name": "Llama-3-Refueled", + "developer": "refuelai", + "scores": { + "IFEval": 0.462, + "BBH": 0.5871, + "MATH Level 5": 0.0665, + "GPQA": 0.2995, + "MUSR": 0.4454, + "MMLU-PRO": 0.3095 + } + }, + { + "model_id": "rhplus0831/maid-yuzu-v7", + "name": "maid-yuzu-v7", + "developer": "rhplus0831", + "scores": { + "IFEval": 0.6462, + "BBH": 0.4805, + "MATH Level 5": 0.102, + "GPQA": 0.3096, + "MUSR": 0.4136, + "MMLU-PRO": 0.354 + } + }, + { + "model_id": "rhymes-ai/Aria", + "name": "Aria", + "developer": "rhymes-ai", + "scores": { + "IFEval": 0.4773, + "BBH": 0.5695, + "MATH Level 5": 0.1934, + "GPQA": 0.3624, + "MUSR": 0.4338, + "MMLU-PRO": 0.4405 + } + }, + { + "model_id": "rhysjones/phi-2-orange-v2", + "name": "phi-2-orange-v2", + "developer": "rhysjones", + "scores": { + "IFEval": 0.367, + "BBH": 0.477, + "MATH Level 5": 0.0408, + "GPQA": 0.2617, + "MUSR": 0.363, + "MMLU-PRO": 0.2532 + } + }, + { + "model_id": "riaz/FineLlama-3.1-8B", + "name": "FineLlama-3.1-8B", + "developer": "riaz", + "scores": { + "IFEval": 0.4373, + "BBH": 0.4586, + "MATH Level 5": 0.0514, + "GPQA": 0.2752, + "MUSR": 0.3763, + "MMLU-PRO": 0.2964 + } + }, + { + "model_id": "rmdhirr/Gluon-8B", + "name": "Gluon-8B", + "developer": "rmdhirr", + "scores": { + "IFEval": 0.5053, + "BBH": 0.5153, + "MATH Level 5": 0.1443, + "GPQA": 0.3121, + "MUSR": 0.4039, + "MMLU-PRO": 0.3808 + } + }, + { + "model_id": "rombodawg/Rombos-Coder-V2.5-Qwen-14b", + "name": "Rombos-Coder-V2.5-Qwen-14b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.7047, + "BBH": 0.6165, + "MATH Level 5": 0.3301, + "GPQA": 0.3029, + "MUSR": 0.3915, + "MMLU-PRO": 0.3939 + } + }, + { + "model_id": "rombodawg/Rombos-Coder-V2.5-Qwen-7b", + "name": "Rombos-Coder-V2.5-Qwen-7b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.621, + "BBH": 0.5077, + "MATH Level 5": 0.3338, + "GPQA": 0.2836, + "MUSR": 0.3979, + "MMLU-PRO": 0.3398 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5-Qwen-0.5b", + "name": "Rombos-LLM-V2.5-Qwen-0.5b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.2847, + "BBH": 0.3294, + "MATH Level 5": 0.068, + "GPQA": 0.2668, + "MUSR": 0.3236, + "MMLU-PRO": 0.1866 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5-Qwen-1.5b", + "name": "Rombos-LLM-V2.5-Qwen-1.5b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.3402, + "BBH": 0.4257, + "MATH Level 5": 0.0853, + "GPQA": 0.2886, + "MUSR": 0.4186, + "MMLU-PRO": 0.2922 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5-Qwen-14b", + "name": "Rombos-LLM-V2.5-Qwen-14b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.584, + "BBH": 0.6481, + "MATH Level 5": 0.4554, + "GPQA": 0.3716, + "MUSR": 0.4717, + "MMLU-PRO": 0.5376 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5-Qwen-32b", + "name": "Rombos-LLM-V2.5-Qwen-32b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.6827, + "BBH": 0.7046, + "MATH Level 5": 0.4955, + "GPQA": 0.3968, + "MUSR": 0.5034, + "MMLU-PRO": 0.5916 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5-Qwen-3b", + "name": "Rombos-LLM-V2.5-Qwen-3b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.5342, + "BBH": 0.4809, + "MATH Level 5": 0.2795, + "GPQA": 0.3079, + "MUSR": 0.4042, + "MMLU-PRO": 0.3761 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5-Qwen-72b", + "name": "Rombos-LLM-V2.5-Qwen-72b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.7155, + "BBH": 0.723, + "MATH Level 5": 0.5423, + "GPQA": 0.3985, + "MUSR": 0.4599, + "MMLU-PRO": 0.5935 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5-Qwen-7b", + "name": "Rombos-LLM-V2.5-Qwen-7b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.6237, + "BBH": 0.5544, + "MATH Level 5": 0.3814, + "GPQA": 0.318, + "MUSR": 0.4291, + "MMLU-PRO": 0.4469 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.5.1-Qwen-3b", + "name": "Rombos-LLM-V2.5.1-Qwen-3b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.2595, + "BBH": 0.3884, + "MATH Level 5": 0.0914, + "GPQA": 0.2743, + "MUSR": 0.3991, + "MMLU-PRO": 0.2719 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.6-Nemotron-70b", + "name": "Rombos-LLM-V2.6-Nemotron-70b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.7527, + "BBH": 0.6938, + "MATH Level 5": 0.3331, + "GPQA": 0.406, + "MUSR": 0.4669, + "MMLU-PRO": 0.5329 + } + }, + { + "model_id": "rombodawg/Rombos-LLM-V2.6-Qwen-14b", + "name": "Rombos-LLM-V2.6-Qwen-14b", + "developer": "rombodawg", + "scores": { + "IFEval": 0.8432, + "BBH": 0.6442, + "MATH Level 5": 0.5211, + "GPQA": 0.3339, + "MUSR": 0.4221, + "MMLU-PRO": 0.4961 + } + }, + { + "model_id": "rombodawg/rombos_Replete-Coder-Instruct-8b-Merged", + "name": "rombos_Replete-Coder-Instruct-8b-Merged", + "developer": "rombodawg", + "scores": { + "IFEval": 0.5388, + "BBH": 0.4462, + "MATH Level 5": 0.0778, + "GPQA": 0.2693, + "MUSR": 0.366, + "MMLU-PRO": 0.1809 + } + }, + { + "model_id": "rombodawg/rombos_Replete-Coder-Llama3-8B", + "name": "rombos_Replete-Coder-Llama3-8B", + "developer": "rombodawg", + "scores": { + "IFEval": 0.4714, + "BBH": 0.3276, + "MATH Level 5": 0.0393, + "GPQA": 0.2668, + "MUSR": 0.3966, + "MMLU-PRO": 0.1335 + } + }, + { + "model_id": "rootxhacker/Apollo-70B", + "name": "Apollo-70B", + "developer": "rootxhacker", + "scores": { + "IFEval": 0.5099, + "BBH": 0.6804, + "MATH Level 5": 0.5612, + "GPQA": 0.4572, + "MUSR": 0.4948, + "MMLU-PRO": 0.5279 + } + }, + { + "model_id": "rootxhacker/Apollo_v2-32B", + "name": "Apollo_v2-32B", + "developer": "rootxhacker", + "scores": { + "IFEval": 0.428, + "BBH": 0.7072, + "MATH Level 5": 0.4275, + "GPQA": 0.3784, + "MUSR": 0.4994, + "MMLU-PRO": 0.5869 + } + }, + { + "model_id": "rootxhacker/apollo-7B", + "name": "apollo-7B", + "developer": "rootxhacker", + "scores": { + "IFEval": 0.2953, + "BBH": 0.3636, + "MATH Level 5": 0.0257, + "GPQA": 0.2785, + "MUSR": 0.4131, + "MMLU-PRO": 0.1748 + } + }, + { + "model_id": "rsh345/mistral-ft-optimized-1218-NeuralHermes-2.5-Mistral-7B", + "name": "mistral-ft-optimized-1218-NeuralHermes-2.5-Mistral-7B", + "developer": "rsh345", + "scores": { + "IFEval": 0.3892, + "BBH": 0.5188, + "MATH Level 5": 0.0733, + "GPQA": 0.3029, + "MUSR": 0.4672, + "MMLU-PRO": 0.3054 + } + }, + { + "model_id": "rubenroy/Geneva-12B-GCv2-5m", + "name": "Geneva-12B-GCv2-5m", + "developer": "rubenroy", + "scores": { + "IFEval": 0.2586, + "BBH": 0.5278, + "MATH Level 5": 0.0801, + "GPQA": 0.2878, + "MUSR": 0.3525, + "MMLU-PRO": 0.325 + } + }, + { + "model_id": "rubenroy/Gilgamesh-72B", + "name": "Gilgamesh-72B", + "developer": "rubenroy", + "scores": { + "IFEval": 0.8486, + "BBH": 0.7253, + "MATH Level 5": 0.4381, + "GPQA": 0.3943, + "MUSR": 0.4626, + "MMLU-PRO": 0.5802 + } + }, + { + "model_id": "rubenroy/Zurich-14B-GCv2-5m", + "name": "Zurich-14B-GCv2-5m", + "developer": "rubenroy", + "scores": { + "IFEval": 0.6164, + "BBH": 0.6308, + "MATH Level 5": 0.3074, + "GPQA": 0.3616, + "MUSR": 0.4874, + "MMLU-PRO": 0.5233 + } + }, + { + "model_id": "ruizhe1217/sft-s1-qwen-0.5b", + "name": "sft-s1-qwen-0.5b", + "developer": "ruizhe1217", + "scores": { + "IFEval": 0.2749, + "BBH": 0.3301, + "MATH Level 5": 0.0619, + "GPQA": 0.271, + "MUSR": 0.3196, + "MMLU-PRO": 0.1892 + } + }, + { + "model_id": "rwitz/go-bruins-v2", + "name": "go-bruins-v2", + "developer": "rwitz", + "scores": { + "IFEval": 0.4096, + "BBH": 0.3799, + "MATH Level 5": 0.0672, + "GPQA": 0.2626, + "MUSR": 0.4138, + "MMLU-PRO": 0.2761 + } + }, + { + "model_id": "sabersaleh/Llama2-7B-CPO", + "name": "Llama2-7B-CPO", + "developer": "sabersaleh", + "scores": { + "IFEval": 0.1545, + "BBH": 0.3458, + "MATH Level 5": 0.0136, + "GPQA": 0.2676, + "MUSR": 0.4048, + "MMLU-PRO": 0.1606 + } + }, + { + "model_id": "sabersaleh/Llama2-7B-DPO", + "name": "Llama2-7B-DPO", + "developer": "sabersaleh", + "scores": { + "IFEval": 0.1453, + "BBH": 0.3512, + "MATH Level 5": 0.0159, + "GPQA": 0.2685, + "MUSR": 0.4114, + "MMLU-PRO": 0.1626 + } + }, + { + "model_id": "sabersaleh/Llama2-7B-IPO", + "name": "Llama2-7B-IPO", + "developer": "sabersaleh", + "scores": { + "IFEval": 0.1769, + "BBH": 0.3475, + "MATH Level 5": 0.0159, + "GPQA": 0.2676, + "MUSR": 0.4048, + "MMLU-PRO": 0.1617 + } + }, + { + "model_id": "sabersaleh/Llama2-7B-KTO", + "name": "Llama2-7B-KTO", + "developer": "sabersaleh", + "scores": { + "IFEval": 0.1528, + "BBH": 0.3501, + "MATH Level 5": 0.0189, + "GPQA": 0.2676, + "MUSR": 0.4167, + "MMLU-PRO": 0.1636 + } + }, + { + "model_id": "sabersaleh/Llama2-7B-SPO", + "name": "Llama2-7B-SPO", + "developer": "sabersaleh", + "scores": { + "IFEval": 0.1567, + "BBH": 0.3383, + "MATH Level 5": 0.0196, + "GPQA": 0.2768, + "MUSR": 0.3874, + "MMLU-PRO": 0.1757 + } + }, + { + "model_id": "sabersaleh/Llama2-7B-SimPO", + "name": "Llama2-7B-SimPO", + "developer": "sabersaleh", + "scores": { + "IFEval": 0.1659, + "BBH": 0.3489, + "MATH Level 5": 0.0159, + "GPQA": 0.271, + "MUSR": 0.4007, + "MMLU-PRO": 0.1641 + } + }, + { + "model_id": "sabersaleh/Llama3", + "name": "Llama3", + "developer": "sabersaleh", + "scores": { + "IFEval": 0.3321, + "BBH": 0.4782, + "MATH Level 5": 0.0566, + "GPQA": 0.3104, + "MUSR": 0.3933, + "MMLU-PRO": 0.3162 + } + }, + { + "model_id": "sabersalehk/Llama3-001-300", + "name": "Llama3-001-300", + "developer": "sabersalehk", + "scores": { + "IFEval": 0.3179, + "BBH": 0.4745, + "MATH Level 5": 0.0529, + "GPQA": 0.2995, + "MUSR": 0.4064, + "MMLU-PRO": 0.3158 + } + }, + { + "model_id": "sabersalehk/Llama3-SimPO", + "name": "Llama3-SimPO", + "developer": "sabersalehk", + "scores": { + "IFEval": 0.3642, + "BBH": 0.4874, + "MATH Level 5": 0.0574, + "GPQA": 0.3079, + "MUSR": 0.4046, + "MMLU-PRO": 0.3157 + } + }, + { + "model_id": "sabersalehk/Llama3_001_200", + "name": "Llama3_001_200", + "developer": "sabersalehk", + "scores": { + "IFEval": 0.3218, + "BBH": 0.4728, + "MATH Level 5": 0.0514, + "GPQA": 0.3037, + "MUSR": 0.4037, + "MMLU-PRO": 0.3183 + } + }, + { + "model_id": "sabersalehk/Llama3_01_300", + "name": "Llama3_01_300", + "developer": "sabersalehk", + "scores": { + "IFEval": 0.2959, + "BBH": 0.4691, + "MATH Level 5": 0.0498, + "GPQA": 0.3079, + "MUSR": 0.4065, + "MMLU-PRO": 0.3124 + } + }, + { + "model_id": "saishf/Fimbulvetr-Kuro-Lotus-10.7B", + "name": "Fimbulvetr-Kuro-Lotus-10.7B", + "developer": "saishf", + "scores": { + "IFEval": 0.4939, + "BBH": 0.4342, + "MATH Level 5": 0.0536, + "GPQA": 0.3012, + "MUSR": 0.4445, + "MMLU-PRO": 0.3389 + } + }, + { + "model_id": "saishf/Neural-SOVLish-Devil-8B-L3", + "name": "Neural-SOVLish-Devil-8B-L3", + "developer": "saishf", + "scores": { + "IFEval": 0.4199, + "BBH": 0.5142, + "MATH Level 5": 0.0891, + "GPQA": 0.3079, + "MUSR": 0.411, + "MMLU-PRO": 0.3807 + } + }, + { + "model_id": "saishshinde15/TethysAI_Base_Reasoning", + "name": "TethysAI_Base_Reasoning", + "developer": "saishshinde15", + "scores": { + "IFEval": 0.6369, + "BBH": 0.4519, + "MATH Level 5": 0.3142, + "GPQA": 0.2861, + "MUSR": 0.4075, + "MMLU-PRO": 0.3236 + } + }, + { + "model_id": "saishshinde15/TethysAI_Vortex", + "name": "TethysAI_Vortex", + "developer": "saishshinde15", + "scores": { + "IFEval": 0.4298, + "BBH": 0.4749, + "MATH Level 5": 0.315, + "GPQA": 0.3054, + "MUSR": 0.4458, + "MMLU-PRO": 0.3241 + } + }, + { + "model_id": "saishshinde15/TethysAI_Vortex_Reasoning", + "name": "TethysAI_Vortex_Reasoning", + "developer": "saishshinde15", + "scores": { + "IFEval": 0.4021, + "BBH": 0.4694, + "MATH Level 5": 0.2145, + "GPQA": 0.3045, + "MUSR": 0.4084, + "MMLU-PRO": 0.3381 + } + }, + { + "model_id": "sakaltcommunity/novablast-preview", + "name": "novablast-preview", + "developer": "sakaltcommunity", + "scores": { + "IFEval": 0.453, + "BBH": 0.7043, + "MATH Level 5": 0.4894, + "GPQA": 0.3817, + "MUSR": 0.5021, + "MMLU-PRO": 0.5915 + } + }, + { + "model_id": "sakaltcommunity/sakaltum-7b", + "name": "sakaltum-7b", + "developer": "sakaltcommunity", + "scores": { + "IFEval": 0.2604, + "BBH": 0.4575, + "MATH Level 5": 0.0295, + "GPQA": 0.2727, + "MUSR": 0.3775, + "MMLU-PRO": 0.2769 + } + }, + { + "model_id": "sakhan10/quantized_open_llama_3b_v2", + "name": "quantized_open_llama_3b_v2", + "developer": "sakhan10", + "scores": { + "IFEval": 0.1872, + "BBH": 0.302, + "MATH Level 5": 0.0, + "GPQA": 0.2768, + "MUSR": 0.3682, + "MMLU-PRO": 0.1095 + } + }, + { + "model_id": "saltlux/luxia-21.4b-alignment-v1.0", + "name": "luxia-21.4b-alignment-v1.0", + "developer": "saltlux", + "scores": { + "IFEval": 0.3693, + "BBH": 0.6373, + "MATH Level 5": 0.0974, + "GPQA": 0.3012, + "MUSR": 0.4328, + "MMLU-PRO": 0.3403 + } + }, + { + "model_id": "saltlux/luxia-21.4b-alignment-v1.2", + "name": "luxia-21.4b-alignment-v1.2", + "developer": "saltlux", + "scores": { + "IFEval": 0.4115, + "BBH": 0.6371, + "MATH Level 5": 0.0846, + "GPQA": 0.3079, + "MUSR": 0.4459, + "MMLU-PRO": 0.3473 + } + }, + { + "model_id": "sam-paech/Darkest-muse-v1", + "name": "Darkest-muse-v1", + "developer": "sam-paech", + "scores": { + "IFEval": 0.7344, + "BBH": 0.5968, + "MATH Level 5": 0.2145, + "GPQA": 0.344, + "MUSR": 0.4502, + "MMLU-PRO": 0.4184 + } + }, + { + "model_id": "sam-paech/Delirium-v1", + "name": "Delirium-v1", + "developer": "sam-paech", + "scores": { + "IFEval": 0.7208, + "BBH": 0.5962, + "MATH Level 5": 0.2107, + "GPQA": 0.3431, + "MUSR": 0.4514, + "MMLU-PRO": 0.419 + } + }, + { + "model_id": "sam-paech/Quill-v1", + "name": "Quill-v1", + "developer": "sam-paech", + "scores": { + "IFEval": 0.7122, + "BBH": 0.5969, + "MATH Level 5": 0.2122, + "GPQA": 0.3398, + "MUSR": 0.4555, + "MMLU-PRO": 0.4171 + } + }, + { + "model_id": "sarvamai/OpenHathi-7B-Hi-v0.1-Base", + "name": "OpenHathi-7B-Hi-v0.1-Base", + "developer": "sarvamai", + "scores": { + "IFEval": 0.1804, + "BBH": 0.3354, + "MATH Level 5": 0.0083, + "GPQA": 0.2534, + "MUSR": 0.3658, + "MMLU-PRO": 0.1543 + } + }, + { + "model_id": "schnapss/testmerge-7b", + "name": "testmerge-7b", + "developer": "schnapss", + "scores": { + "IFEval": 0.3922, + "BBH": 0.5187, + "MATH Level 5": 0.0687, + "GPQA": 0.2961, + "MUSR": 0.4686, + "MMLU-PRO": 0.306 + } + }, + { + "model_id": "sci-m-wang/Mistral-7B-Instruct-sa-v0.1", + "name": "Mistral-7B-Instruct-sa-v0.1", + "developer": "sci-m-wang", + "scores": { + "IFEval": 0.4335, + "BBH": 0.3273, + "MATH Level 5": 0.0144, + "GPQA": 0.2592, + "MUSR": 0.39, + "MMLU-PRO": 0.2362 + } + }, + { + "model_id": "sci-m-wang/Phi-3-mini-4k-instruct-sa-v0.1", + "name": "Phi-3-mini-4k-instruct-sa-v0.1", + "developer": "sci-m-wang", + "scores": { + "IFEval": 0.5021, + "BBH": 0.5502, + "MATH Level 5": 0.148, + "GPQA": 0.3289, + "MUSR": 0.4073, + "MMLU-PRO": 0.3985 + } + }, + { + "model_id": "sci-m-wang/deepseek-llm-7b-chat-sa-v0.1", + "name": "deepseek-llm-7b-chat-sa-v0.1", + "developer": "sci-m-wang", + "scores": { + "IFEval": 0.4036, + "BBH": 0.3718, + "MATH Level 5": 0.0264, + "GPQA": 0.2567, + "MUSR": 0.4173, + "MMLU-PRO": 0.2209 + } + }, + { + "model_id": "securin/Securin-LLM-V2.5-Qwen-1.5B", + "name": "Securin-LLM-V2.5-Qwen-1.5B", + "developer": "securin", + "scores": { + "IFEval": 0.1492, + "BBH": 0.3158, + "MATH Level 5": 0.0249, + "GPQA": 0.25, + "MUSR": 0.3606, + "MMLU-PRO": 0.1615 + } + }, + { + "model_id": "senseable/WestLake-7B-v2", + "name": "WestLake-7B-v2", + "developer": "senseable", + "scores": { + "IFEval": 0.4419, + "BBH": 0.4073, + "MATH Level 5": 0.0483, + "GPQA": 0.2768, + "MUSR": 0.3937, + "MMLU-PRO": 0.2764 + } + }, + { + "model_id": "sequelbox/Llama3.1-70B-PlumChat", + "name": "Llama3.1-70B-PlumChat", + "developer": "sequelbox", + "scores": { + "IFEval": 0.5616, + "BBH": 0.6753, + "MATH Level 5": 0.3029, + "GPQA": 0.3909, + "MUSR": 0.4774, + "MMLU-PRO": 0.5164 + } + }, + { + "model_id": "sequelbox/Llama3.1-8B-MOTH", + "name": "Llama3.1-8B-MOTH", + "developer": "sequelbox", + "scores": { + "IFEval": 0.5245, + "BBH": 0.4902, + "MATH Level 5": 0.1216, + "GPQA": 0.2685, + "MUSR": 0.3689, + "MMLU-PRO": 0.3339 + } + }, + { + "model_id": "sequelbox/Llama3.1-8B-PlumChat", + "name": "Llama3.1-8B-PlumChat", + "developer": "sequelbox", + "scores": { + "IFEval": 0.4243, + "BBH": 0.3873, + "MATH Level 5": 0.0363, + "GPQA": 0.2651, + "MUSR": 0.3755, + "MMLU-PRO": 0.2127 + } + }, + { + "model_id": "sequelbox/Llama3.1-8B-PlumCode", + "name": "Llama3.1-8B-PlumCode", + "developer": "sequelbox", + "scores": { + "IFEval": 0.2045, + "BBH": 0.3368, + "MATH Level 5": 0.0272, + "GPQA": 0.276, + "MUSR": 0.3773, + "MMLU-PRO": 0.2335 + } + }, + { + "model_id": "sequelbox/Llama3.1-8B-PlumMath", + "name": "Llama3.1-8B-PlumMath", + "developer": "sequelbox", + "scores": { + "IFEval": 0.2242, + "BBH": 0.4032, + "MATH Level 5": 0.0476, + "GPQA": 0.318, + "MUSR": 0.3919, + "MMLU-PRO": 0.2975 + } + }, + { + "model_id": "sequelbox/gemma-2-9B-MOTH", + "name": "gemma-2-9B-MOTH", + "developer": "sequelbox", + "scores": { + "IFEval": 0.2059, + "BBH": 0.308, + "MATH Level 5": 0.0106, + "GPQA": 0.2601, + "MUSR": 0.3409, + "MMLU-PRO": 0.114 + } + }, + { + "model_id": "sethuiyer/Llama-3.1-8B-Experimental-1206-Instruct", + "name": "Llama-3.1-8B-Experimental-1206-Instruct", + "developer": "sethuiyer", + "scores": { + "IFEval": 0.6967, + "BBH": 0.5104, + "MATH Level 5": 0.1118, + "GPQA": 0.2995, + "MUSR": 0.3966, + "MMLU-PRO": 0.3529 + } + }, + { + "model_id": "sethuiyer/Llama-3.1-8B-Experimental-1208-Instruct", + "name": "Llama-3.1-8B-Experimental-1208-Instruct", + "developer": "sethuiyer", + "scores": { + "IFEval": 0.61, + "BBH": 0.4964, + "MATH Level 5": 0.0891, + "GPQA": 0.2961, + "MUSR": 0.379, + "MMLU-PRO": 0.3511 + } + }, + { + "model_id": "sethuiyer/LlamaZero-3.1-8B-Experimental-1208", + "name": "LlamaZero-3.1-8B-Experimental-1208", + "developer": "sethuiyer", + "scores": { + "IFEval": 0.6051, + "BBH": 0.4981, + "MATH Level 5": 0.108, + "GPQA": 0.2685, + "MUSR": 0.382, + "MMLU-PRO": 0.3 + } + }, + { + "model_id": "sethuiyer/Llamaverse-3.1-8B-Instruct", + "name": "Llamaverse-3.1-8B-Instruct", + "developer": "sethuiyer", + "scores": { + "IFEval": 0.6185, + "BBH": 0.5414, + "MATH Level 5": 0.1858, + "GPQA": 0.2911, + "MUSR": 0.3762, + "MMLU-PRO": 0.3523 + } + }, + { + "model_id": "sethuiyer/Llamazing-3.1-8B-Instruct", + "name": "Llamazing-3.1-8B-Instruct", + "developer": "sethuiyer", + "scores": { + "IFEval": 0.5711, + "BBH": 0.5291, + "MATH Level 5": 0.0544, + "GPQA": 0.3121, + "MUSR": 0.3976, + "MMLU-PRO": 0.3606 + } + }, + { + "model_id": "sethuiyer/Qwen2.5-7B-Anvita", + "name": "Qwen2.5-7B-Anvita", + "developer": "sethuiyer", + "scores": { + "IFEval": 0.648, + "BBH": 0.5466, + "MATH Level 5": 0.2017, + "GPQA": 0.3272, + "MUSR": 0.4337, + "MMLU-PRO": 0.4166 + } + }, + { + "model_id": "shadowml/BeagSake-7B", + "name": "BeagSake-7B", + "developer": "shadowml", + "scores": { + "IFEval": 0.5216, + "BBH": 0.4711, + "MATH Level 5": 0.0506, + "GPQA": 0.281, + "MUSR": 0.4124, + "MMLU-PRO": 0.2585 + } + }, + { + "model_id": "shadowml/Mixolar-4x7b", + "name": "Mixolar-4x7b", + "developer": "shadowml", + "scores": { + "IFEval": 0.3893, + "BBH": 0.5216, + "MATH Level 5": 0.0582, + "GPQA": 0.2928, + "MUSR": 0.4258, + "MMLU-PRO": 0.3305 + } + }, + { + "model_id": "shastraai/Shastra-LLAMA2-Math-Commonsense-SFT", + "name": "Shastra-LLAMA2-Math-Commonsense-SFT", + "developer": "shastraai", + "scores": { + "IFEval": 0.3042, + "BBH": 0.3843, + "MATH Level 5": 0.0174, + "GPQA": 0.2592, + "MUSR": 0.3604, + "MMLU-PRO": 0.1997 + } + }, + { + "model_id": "shivam9980/NEPALI-LLM", + "name": "NEPALI-LLM", + "developer": "shivam9980", + "scores": { + "IFEval": 0.0417, + "BBH": 0.3828, + "MATH Level 5": 0.0091, + "GPQA": 0.2617, + "MUSR": 0.4122, + "MMLU-PRO": 0.2064 + } + }, + { + "model_id": "shivam9980/mistral-7b-news-cnn-merged", + "name": "mistral-7b-news-cnn-merged", + "developer": "shivam9980", + "scores": { + "IFEval": 0.4634, + "BBH": 0.3635, + "MATH Level 5": 0.0189, + "GPQA": 0.3087, + "MUSR": 0.4523, + "MMLU-PRO": 0.2827 + } + }, + { + "model_id": "shivank21/mistral_dpo_self", + "name": "mistral_dpo_self", + "developer": "shivank21", + "scores": { + "IFEval": 0.3403, + "BBH": 0.3216, + "MATH Level 5": 0.0219, + "GPQA": 0.2408, + "MUSR": 0.3247, + "MMLU-PRO": 0.2214 + } + }, + { + "model_id": "shuttleai/shuttle-3", + "name": "shuttle-3", + "developer": "shuttleai", + "scores": { + "IFEval": 0.8154, + "BBH": 0.742, + "MATH Level 5": 0.46, + "GPQA": 0.4119, + "MUSR": 0.4377, + "MMLU-PRO": 0.5716 + } + }, + { + "model_id": "shyamieee/Padma-v7.0", + "name": "Padma-v7.0", + "developer": "shyamieee", + "scores": { + "IFEval": 0.3841, + "BBH": 0.5119, + "MATH Level 5": 0.0702, + "GPQA": 0.2861, + "MUSR": 0.4386, + "MMLU-PRO": 0.3029 + } + }, + { + "model_id": "silma-ai/SILMA-9B-Instruct-v1.0", + "name": "SILMA-9B-Instruct-v1.0", + "developer": "silma-ai", + "scores": { + "IFEval": 0.5842, + "BBH": 0.5219, + "MATH Level 5": 0.1163, + "GPQA": 0.3054, + "MUSR": 0.4637, + "MMLU-PRO": 0.392 + } + }, + { + "model_id": "silma-ai/SILMA-Kashif-2B-Instruct-v1.0", + "name": "SILMA-Kashif-2B-Instruct-v1.0", + "developer": "silma-ai", + "scores": { + "IFEval": 0.1181, + "BBH": 0.3793, + "MATH Level 5": 0.0113, + "GPQA": 0.2701, + "MUSR": 0.4043, + "MMLU-PRO": 0.2258 + } + }, + { + "model_id": "siqi00/Mistral-7B-DFT", + "name": "Mistral-7B-DFT", + "developer": "siqi00", + "scores": { + "IFEval": 0.5569, + "BBH": 0.4665, + "MATH Level 5": 0.0378, + "GPQA": 0.3045, + "MUSR": 0.4191, + "MMLU-PRO": 0.2963 + } + }, + { + "model_id": "siqi00/Mistral-7B-DFT2", + "name": "Mistral-7B-DFT2", + "developer": "siqi00", + "scores": { + "IFEval": 0.5804, + "BBH": 0.3968, + "MATH Level 5": 0.0453, + "GPQA": 0.2995, + "MUSR": 0.4401, + "MMLU-PRO": 0.2852 + } + }, + { + "model_id": "skumar9/Llama-medx_v2", + "name": "Llama-medx_v2", + "developer": "skumar9", + "scores": { + "IFEval": 0.4462, + "BBH": 0.4909, + "MATH Level 5": 0.0914, + "GPQA": 0.3054, + "MUSR": 0.3661, + "MMLU-PRO": 0.3463 + } + }, + { + "model_id": "skymizer/Llama2-7b-sft-chat-custom-template-dpo", + "name": "Llama2-7b-sft-chat-custom-template-dpo", + "developer": "skymizer", + "scores": { + "IFEval": 0.2353, + "BBH": 0.3688, + "MATH Level 5": 0.0144, + "GPQA": 0.2391, + "MUSR": 0.4429, + "MMLU-PRO": 0.1946 + } + }, + { + "model_id": "someon98/qwen-CoMa-0.5b", + "name": "qwen-CoMa-0.5b", + "developer": "someon98", + "scores": { + "IFEval": 0.2277, + "BBH": 0.2953, + "MATH Level 5": 0.0045, + "GPQA": 0.2399, + "MUSR": 0.4046, + "MMLU-PRO": 0.1099 + } + }, + { + "model_id": "sometimesanotion/ChocoTrio-14B-v1", + "name": "ChocoTrio-14B-v1", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7089, + "BBH": 0.6506, + "MATH Level 5": 0.3973, + "GPQA": 0.3851, + "MUSR": 0.4821, + "MMLU-PRO": 0.537 + } + }, + { + "model_id": "sometimesanotion/IF-reasoning-experiment-40", + "name": "IF-reasoning-experiment-40", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.633, + "BBH": 0.6112, + "MATH Level 5": 0.3716, + "GPQA": 0.38, + "MUSR": 0.5194, + "MMLU-PRO": 0.5025 + } + }, + { + "model_id": "sometimesanotion/IF-reasoning-experiment-80", + "name": "IF-reasoning-experiment-80", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5463, + "BBH": 0.421, + "MATH Level 5": 0.0989, + "GPQA": 0.2844, + "MUSR": 0.5025, + "MMLU-PRO": 0.3368 + } + }, + { + "model_id": "sometimesanotion/KytheraMix-7B-v0.2", + "name": "KytheraMix-7B-v0.2", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6129, + "BBH": 0.5635, + "MATH Level 5": 0.2923, + "GPQA": 0.3356, + "MUSR": 0.4594, + "MMLU-PRO": 0.4505 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.1-experimental", + "name": "Lamarck-14B-v0.1-experimental", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5354, + "BBH": 0.6583, + "MATH Level 5": 0.358, + "GPQA": 0.3817, + "MUSR": 0.4728, + "MMLU-PRO": 0.5408 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.3", + "name": "Lamarck-14B-v0.3", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5032, + "BBH": 0.6611, + "MATH Level 5": 0.3406, + "GPQA": 0.3884, + "MUSR": 0.4688, + "MMLU-PRO": 0.5411 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.4-Qwenvergence", + "name": "Lamarck-14B-v0.4-Qwenvergence", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4906, + "BBH": 0.6535, + "MATH Level 5": 0.3399, + "GPQA": 0.3784, + "MUSR": 0.4847, + "MMLU-PRO": 0.5406 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.6", + "name": "Lamarck-14B-v0.6", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6973, + "BBH": 0.646, + "MATH Level 5": 0.4041, + "GPQA": 0.3893, + "MUSR": 0.4847, + "MMLU-PRO": 0.54 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.6-002-model_stock", + "name": "Lamarck-14B-v0.6-002-model_stock", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6692, + "BBH": 0.6143, + "MATH Level 5": 0.3776, + "GPQA": 0.3742, + "MUSR": 0.518, + "MMLU-PRO": 0.5054 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.6-model_stock", + "name": "Lamarck-14B-v0.6-model_stock", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.679, + "BBH": 0.6269, + "MATH Level 5": 0.4245, + "GPQA": 0.3842, + "MUSR": 0.5007, + "MMLU-PRO": 0.5198 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.7-Fusion", + "name": "Lamarck-14B-v0.7-Fusion", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6821, + "BBH": 0.6544, + "MATH Level 5": 0.4041, + "GPQA": 0.401, + "MUSR": 0.4991, + "MMLU-PRO": 0.5391 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.7-rc1", + "name": "Lamarck-14B-v0.7-rc1", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7305, + "BBH": 0.6486, + "MATH Level 5": 0.3852, + "GPQA": 0.3893, + "MUSR": 0.4715, + "MMLU-PRO": 0.5416 + } + }, + { + "model_id": "sometimesanotion/Lamarck-14B-v0.7-rc4", + "name": "Lamarck-14B-v0.7-rc4", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7211, + "BBH": 0.651, + "MATH Level 5": 0.4026, + "GPQA": 0.3893, + "MUSR": 0.4912, + "MMLU-PRO": 0.54 + } + }, + { + "model_id": "sometimesanotion/LamarckInfusion-14B-v1", + "name": "LamarckInfusion-14B-v1", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7198, + "BBH": 0.6539, + "MATH Level 5": 0.4169, + "GPQA": 0.3909, + "MUSR": 0.4899, + "MMLU-PRO": 0.5376 + } + }, + { + "model_id": "sometimesanotion/LamarckInfusion-14B-v2", + "name": "LamarckInfusion-14B-v2", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6812, + "BBH": 0.6564, + "MATH Level 5": 0.4388, + "GPQA": 0.3876, + "MUSR": 0.4993, + "MMLU-PRO": 0.5416 + } + }, + { + "model_id": "sometimesanotion/LamarckInfusion-14B-v2-hi", + "name": "LamarckInfusion-14B-v2-hi", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6855, + "BBH": 0.6555, + "MATH Level 5": 0.423, + "GPQA": 0.3884, + "MUSR": 0.4847, + "MMLU-PRO": 0.5405 + } + }, + { + "model_id": "sometimesanotion/LamarckInfusion-14B-v2-lo", + "name": "LamarckInfusion-14B-v2-lo", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6788, + "BBH": 0.6528, + "MATH Level 5": 0.4237, + "GPQA": 0.3859, + "MUSR": 0.4991, + "MMLU-PRO": 0.5397 + } + }, + { + "model_id": "sometimesanotion/LamarckInfusion-14B-v3", + "name": "LamarckInfusion-14B-v3", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7131, + "BBH": 0.6518, + "MATH Level 5": 0.4124, + "GPQA": 0.3867, + "MUSR": 0.482, + "MMLU-PRO": 0.5407 + } + }, + { + "model_id": "sometimesanotion/Qwen-14B-ProseStock-v4", + "name": "Qwen-14B-ProseStock-v4", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4942, + "BBH": 0.6498, + "MATH Level 5": 0.364, + "GPQA": 0.3884, + "MUSR": 0.4938, + "MMLU-PRO": 0.5386 + } + }, + { + "model_id": "sometimesanotion/Qwen-2.5-14B-Virmarckeoso", + "name": "Qwen-2.5-14B-Virmarckeoso", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4813, + "BBH": 0.657, + "MATH Level 5": 0.3565, + "GPQA": 0.3792, + "MUSR": 0.4794, + "MMLU-PRO": 0.5377 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-14B-Vimarckoso", + "name": "Qwen2.5-14B-Vimarckoso", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4574, + "BBH": 0.6446, + "MATH Level 5": 0.3384, + "GPQA": 0.3926, + "MUSR": 0.4859, + "MMLU-PRO": 0.5329 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-14B-Vimarckoso-v2", + "name": "Qwen2.5-14B-Vimarckoso-v2", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4505, + "BBH": 0.655, + "MATH Level 5": 0.358, + "GPQA": 0.3826, + "MUSR": 0.4819, + "MMLU-PRO": 0.538 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-14B-Vimarckoso-v3", + "name": "Qwen2.5-14B-Vimarckoso-v3", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7257, + "BBH": 0.6415, + "MATH Level 5": 0.4003, + "GPQA": 0.38, + "MUSR": 0.4807, + "MMLU-PRO": 0.5343 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-14B-Vimarckoso-v3-IF-Variant", + "name": "Qwen2.5-14B-Vimarckoso-v3-IF-Variant", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6413, + "BBH": 0.5521, + "MATH Level 5": 0.2545, + "GPQA": 0.3473, + "MUSR": 0.5319, + "MMLU-PRO": 0.4589 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-14B-Vimarckoso-v3-Prose01", + "name": "Qwen2.5-14B-Vimarckoso-v3-Prose01", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6872, + "BBH": 0.6359, + "MATH Level 5": 0.3995, + "GPQA": 0.3867, + "MUSR": 0.4807, + "MMLU-PRO": 0.5275 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-14B-Vimarckoso-v3-model_stock", + "name": "Qwen2.5-14B-Vimarckoso-v3-model_stock", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7162, + "BBH": 0.6421, + "MATH Level 5": 0.4245, + "GPQA": 0.38, + "MUSR": 0.4781, + "MMLU-PRO": 0.5316 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-7B-Gordion-v0.1", + "name": "Qwen2.5-7B-Gordion-v0.1", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7482, + "BBH": 0.5524, + "MATH Level 5": 0.2915, + "GPQA": 0.3079, + "MUSR": 0.4016, + "MMLU-PRO": 0.43 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-7B-Gordion-v0.1-Prose", + "name": "Qwen2.5-7B-Gordion-v0.1-Prose", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5347, + "BBH": 0.5599, + "MATH Level 5": 0.2893, + "GPQA": 0.3205, + "MUSR": 0.4502, + "MMLU-PRO": 0.4525 + } + }, + { + "model_id": "sometimesanotion/Qwen2.5-7B-Gordion-v0.1-Reason", + "name": "Qwen2.5-7B-Gordion-v0.1-Reason", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4917, + "BBH": 0.5498, + "MATH Level 5": 0.2621, + "GPQA": 0.3406, + "MUSR": 0.4434, + "MMLU-PRO": 0.4307 + } + }, + { + "model_id": "sometimesanotion/Qwentessential-14B-v1", + "name": "Qwentessential-14B-v1", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6279, + "BBH": 0.6545, + "MATH Level 5": 0.4071, + "GPQA": 0.3876, + "MUSR": 0.4873, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v013", + "name": "Qwentinuum-14B-v013", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6711, + "BBH": 0.6087, + "MATH Level 5": 0.3708, + "GPQA": 0.3574, + "MUSR": 0.5154, + "MMLU-PRO": 0.4991 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v1", + "name": "Qwentinuum-14B-v1", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5032, + "BBH": 0.6573, + "MATH Level 5": 0.3603, + "GPQA": 0.3826, + "MUSR": 0.4781, + "MMLU-PRO": 0.541 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v2", + "name": "Qwentinuum-14B-v2", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5378, + "BBH": 0.6555, + "MATH Level 5": 0.3754, + "GPQA": 0.3884, + "MUSR": 0.4714, + "MMLU-PRO": 0.5409 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v3", + "name": "Qwentinuum-14B-v3", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6158, + "BBH": 0.6539, + "MATH Level 5": 0.3535, + "GPQA": 0.3876, + "MUSR": 0.486, + "MMLU-PRO": 0.5413 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v5", + "name": "Qwentinuum-14B-v5", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6286, + "BBH": 0.655, + "MATH Level 5": 0.3444, + "GPQA": 0.3876, + "MUSR": 0.4874, + "MMLU-PRO": 0.5418 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v6", + "name": "Qwentinuum-14B-v6", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6304, + "BBH": 0.6545, + "MATH Level 5": 0.3603, + "GPQA": 0.3867, + "MUSR": 0.49, + "MMLU-PRO": 0.54 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v6-Prose", + "name": "Qwentinuum-14B-v6-Prose", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5643, + "BBH": 0.6545, + "MATH Level 5": 0.3701, + "GPQA": 0.3884, + "MUSR": 0.4913, + "MMLU-PRO": 0.5392 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v7", + "name": "Qwentinuum-14B-v7", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6109, + "BBH": 0.6551, + "MATH Level 5": 0.3573, + "GPQA": 0.3909, + "MUSR": 0.482, + "MMLU-PRO": 0.541 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v8", + "name": "Qwentinuum-14B-v8", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5412, + "BBH": 0.6534, + "MATH Level 5": 0.3912, + "GPQA": 0.3834, + "MUSR": 0.4873, + "MMLU-PRO": 0.5412 + } + }, + { + "model_id": "sometimesanotion/Qwentinuum-14B-v9", + "name": "Qwentinuum-14B-v9", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5107, + "BBH": 0.658, + "MATH Level 5": 0.3482, + "GPQA": 0.3859, + "MUSR": 0.4781, + "MMLU-PRO": 0.5421 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-qv256", + "name": "Qwenvergence-14B-qv256", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7006, + "BBH": 0.6312, + "MATH Level 5": 0.3897, + "GPQA": 0.3784, + "MUSR": 0.4926, + "MMLU-PRO": 0.5178 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v0.6-004-model_stock", + "name": "Qwenvergence-14B-v0.6-004-model_stock", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.686, + "BBH": 0.6249, + "MATH Level 5": 0.4094, + "GPQA": 0.3834, + "MUSR": 0.5033, + "MMLU-PRO": 0.5193 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v10", + "name": "Qwenvergence-14B-v10", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6757, + "BBH": 0.6316, + "MATH Level 5": 0.4789, + "GPQA": 0.3792, + "MUSR": 0.4991, + "MMLU-PRO": 0.5239 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v11", + "name": "Qwenvergence-14B-v11", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7192, + "BBH": 0.6368, + "MATH Level 5": 0.4645, + "GPQA": 0.3725, + "MUSR": 0.4754, + "MMLU-PRO": 0.5327 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v12-Prose", + "name": "Qwenvergence-14B-v12-Prose", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5412, + "BBH": 0.6504, + "MATH Level 5": 0.3535, + "GPQA": 0.3867, + "MUSR": 0.4991, + "MMLU-PRO": 0.5381 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v12-Prose-DS", + "name": "Qwenvergence-14B-v12-Prose-DS", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6173, + "BBH": 0.6507, + "MATH Level 5": 0.4305, + "GPQA": 0.3943, + "MUSR": 0.5151, + "MMLU-PRO": 0.5369 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v13-Prose-DS", + "name": "Qwenvergence-14B-v13-Prose-DS", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.7178, + "BBH": 0.6405, + "MATH Level 5": 0.386, + "GPQA": 0.3834, + "MUSR": 0.4927, + "MMLU-PRO": 0.5349 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v15-Prose-MS", + "name": "Qwenvergence-14B-v15-Prose-MS", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5032, + "BBH": 0.655, + "MATH Level 5": 0.3633, + "GPQA": 0.3951, + "MUSR": 0.4913, + "MMLU-PRO": 0.5393 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v2-Prose", + "name": "Qwenvergence-14B-v2-Prose", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4705, + "BBH": 0.6519, + "MATH Level 5": 0.3557, + "GPQA": 0.3935, + "MUSR": 0.4926, + "MMLU-PRO": 0.5372 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v3", + "name": "Qwenvergence-14B-v3", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5044, + "BBH": 0.6548, + "MATH Level 5": 0.3693, + "GPQA": 0.3842, + "MUSR": 0.4886, + "MMLU-PRO": 0.5386 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v3-Prose", + "name": "Qwenvergence-14B-v3-Prose", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4918, + "BBH": 0.6513, + "MATH Level 5": 0.3648, + "GPQA": 0.3951, + "MUSR": 0.4939, + "MMLU-PRO": 0.537 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v3-Reason", + "name": "Qwenvergence-14B-v3-Reason", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5367, + "BBH": 0.6561, + "MATH Level 5": 0.358, + "GPQA": 0.3867, + "MUSR": 0.474, + "MMLU-PRO": 0.5395 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v6-Prose", + "name": "Qwenvergence-14B-v6-Prose", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.599, + "BBH": 0.6544, + "MATH Level 5": 0.3565, + "GPQA": 0.3884, + "MUSR": 0.4887, + "MMLU-PRO": 0.5371 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v6-Prose-model_stock", + "name": "Qwenvergence-14B-v6-Prose-model_stock", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4811, + "BBH": 0.653, + "MATH Level 5": 0.3603, + "GPQA": 0.3935, + "MUSR": 0.4899, + "MMLU-PRO": 0.5387 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v8", + "name": "Qwenvergence-14B-v8", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.5913, + "BBH": 0.6522, + "MATH Level 5": 0.4048, + "GPQA": 0.3809, + "MUSR": 0.4768, + "MMLU-PRO": 0.5435 + } + }, + { + "model_id": "sometimesanotion/Qwenvergence-14B-v9", + "name": "Qwenvergence-14B-v9", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.6598, + "BBH": 0.6166, + "MATH Level 5": 0.4139, + "GPQA": 0.3683, + "MUSR": 0.5141, + "MMLU-PRO": 0.5111 + } + }, + { + "model_id": "sometimesanotion/lamarck-14b-prose-model_stock", + "name": "lamarck-14b-prose-model_stock", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4276, + "BBH": 0.6488, + "MATH Level 5": 0.3414, + "GPQA": 0.3935, + "MUSR": 0.4846, + "MMLU-PRO": 0.5354 + } + }, + { + "model_id": "sometimesanotion/lamarck-14b-reason-model_stock", + "name": "lamarck-14b-reason-model_stock", + "developer": "sometimesanotion", + "scores": { + "IFEval": 0.4965, + "BBH": 0.6569, + "MATH Level 5": 0.358, + "GPQA": 0.3842, + "MUSR": 0.4741, + "MMLU-PRO": 0.5402 + } + }, + { + "model_id": "sonthenguyen/ft-unsloth-zephyr-sft-bnb-4bit-20241014-161415", + "name": "ft-unsloth-zephyr-sft-bnb-4bit-20241014-161415", + "developer": "sonthenguyen", + "scores": { + "IFEval": 0.2893, + "BBH": 0.3804, + "MATH Level 5": 0.0113, + "GPQA": 0.2466, + "MUSR": 0.3861, + "MMLU-PRO": 0.1401 + } + }, + { + "model_id": "sonthenguyen/ft-unsloth-zephyr-sft-bnb-4bit-20241014-164205", + "name": "ft-unsloth-zephyr-sft-bnb-4bit-20241014-164205", + "developer": "sonthenguyen", + "scores": { + "IFEval": 0.3199, + "BBH": 0.3959, + "MATH Level 5": 0.0083, + "GPQA": 0.276, + "MUSR": 0.4272, + "MMLU-PRO": 0.2124 + } + }, + { + "model_id": "sonthenguyen/ft-unsloth-zephyr-sft-bnb-4bit-20241014-170522", + "name": "ft-unsloth-zephyr-sft-bnb-4bit-20241014-170522", + "developer": "sonthenguyen", + "scores": { + "IFEval": 0.3764, + "BBH": 0.3828, + "MATH Level 5": 0.0091, + "GPQA": 0.2651, + "MUSR": 0.4404, + "MMLU-PRO": 0.2055 + } + }, + { + "model_id": "sonthenguyen/zephyr-sft-bnb-4bit-DPO-mtbc-213steps", + "name": "zephyr-sft-bnb-4bit-DPO-mtbc-213steps", + "developer": "sonthenguyen", + "scores": { + "IFEval": 0.4275, + "BBH": 0.4197, + "MATH Level 5": 0.0257, + "GPQA": 0.2617, + "MUSR": 0.4086, + "MMLU-PRO": 0.2709 + } + }, + { + "model_id": "sonthenguyen/zephyr-sft-bnb-4bit-DPO-mtbo-180steps", + "name": "zephyr-sft-bnb-4bit-DPO-mtbo-180steps", + "developer": "sonthenguyen", + "scores": { + "IFEval": 0.4087, + "BBH": 0.4323, + "MATH Level 5": 0.0234, + "GPQA": 0.276, + "MUSR": 0.3885, + "MMLU-PRO": 0.2748 + } + }, + { + "model_id": "sonthenguyen/zephyr-sft-bnb-4bit-DPO-mtbr-180steps", + "name": "zephyr-sft-bnb-4bit-DPO-mtbr-180steps", + "developer": "sonthenguyen", + "scores": { + "IFEval": 0.4032, + "BBH": 0.4305, + "MATH Level 5": 0.0249, + "GPQA": 0.2802, + "MUSR": 0.4258, + "MMLU-PRO": 0.2711 + } + }, + { + "model_id": "sophosympatheia/Midnight-Miqu-70B-v1.5", + "name": "Midnight-Miqu-70B-v1.5", + "developer": "sophosympatheia", + "scores": { + "IFEval": 0.6118, + "BBH": 0.5606, + "MATH Level 5": 0.0702, + "GPQA": 0.2961, + "MUSR": 0.4244, + "MMLU-PRO": 0.3825 + } + }, + { + "model_id": "speakleash/Bielik-11B-v2", + "name": "Bielik-11B-v2", + "developer": "speakleash", + "scores": { + "IFEval": 0.2381, + "BBH": 0.4931, + "MATH Level 5": 0.0785, + "GPQA": 0.2886, + "MUSR": 0.3924, + "MMLU-PRO": 0.3137 + } + }, + { + "model_id": "speakleash/Bielik-11B-v2.0-Instruct", + "name": "Bielik-11B-v2.0-Instruct", + "developer": "speakleash", + "scores": { + "IFEval": 0.5252, + "BBH": 0.5362, + "MATH Level 5": 0.1186, + "GPQA": 0.3171, + "MUSR": 0.4467, + "MMLU-PRO": 0.3351 + } + }, + { + "model_id": "speakleash/Bielik-11B-v2.1-Instruct", + "name": "Bielik-11B-v2.1-Instruct", + "developer": "speakleash", + "scores": { + "IFEval": 0.509, + "BBH": 0.553, + "MATH Level 5": 0.2666, + "GPQA": 0.3372, + "MUSR": 0.4185, + "MMLU-PRO": 0.3447 + } + }, + { + "model_id": "speakleash/Bielik-11B-v2.2-Instruct", + "name": "Bielik-11B-v2.2-Instruct", + "developer": "speakleash", + "scores": { + "IFEval": 0.5552, + "BBH": 0.5597, + "MATH Level 5": 0.2681, + "GPQA": 0.3314, + "MUSR": 0.4171, + "MMLU-PRO": 0.3487 + } + }, + { + "model_id": "speakleash/Bielik-11B-v2.3-Instruct", + "name": "Bielik-11B-v2.3-Instruct", + "developer": "speakleash", + "scores": { + "IFEval": 0.5583, + "BBH": 0.5663, + "MATH Level 5": 0.2085, + "GPQA": 0.3406, + "MUSR": 0.4518, + "MMLU-PRO": 0.3444 + } + }, + { + "model_id": "spmurrayzzz/Mistral-Syndicate-7B", + "name": "Mistral-Syndicate-7B", + "developer": "spmurrayzzz", + "scores": { + "IFEval": 0.2496, + "BBH": 0.4245, + "MATH Level 5": 0.034, + "GPQA": 0.276, + "MUSR": 0.4386, + "MMLU-PRO": 0.2631 + } + }, + { + "model_id": "spow12/ChatWaifu_12B_v2.0", + "name": "ChatWaifu_12B_v2.0", + "developer": "spow12", + "scores": { + "IFEval": 0.4768, + "BBH": 0.5208, + "MATH Level 5": 0.071, + "GPQA": 0.2768, + "MUSR": 0.4432, + "MMLU-PRO": 0.3388 + } + }, + { + "model_id": "spow12/ChatWaifu_22B_v2.0_preview", + "name": "ChatWaifu_22B_v2.0_preview", + "developer": "spow12", + "scores": { + "IFEval": 0.6745, + "BBH": 0.617, + "MATH Level 5": 0.1888, + "GPQA": 0.3154, + "MUSR": 0.3685, + "MMLU-PRO": 0.3988 + } + }, + { + "model_id": "spow12/ChatWaifu_v1.4", + "name": "ChatWaifu_v1.4", + "developer": "spow12", + "scores": { + "IFEval": 0.5691, + "BBH": 0.5176, + "MATH Level 5": 0.1057, + "GPQA": 0.307, + "MUSR": 0.4743, + "MMLU-PRO": 0.3475 + } + }, + { + "model_id": "spow12/ChatWaifu_v2.0_22B", + "name": "ChatWaifu_v2.0_22B", + "developer": "spow12", + "scores": { + "IFEval": 0.6517, + "BBH": 0.5908, + "MATH Level 5": 0.2032, + "GPQA": 0.3238, + "MUSR": 0.3842, + "MMLU-PRO": 0.3812 + } + }, + { + "model_id": "ssmits/Qwen2.5-95B-Instruct", + "name": "Qwen2.5-95B-Instruct", + "developer": "ssmits", + "scores": { + "IFEval": 0.8431, + "BBH": 0.7038, + "MATH Level 5": 0.5302, + "GPQA": 0.3641, + "MUSR": 0.4284, + "MMLU-PRO": 0.5217 + } + }, + { + "model_id": "stabilityai/StableBeluga2", + "name": "StableBeluga2", + "developer": "stabilityai", + "scores": { + "IFEval": 0.3787, + "BBH": 0.5824, + "MATH Level 5": 0.0438, + "GPQA": 0.3163, + "MUSR": 0.473, + "MMLU-PRO": 0.3326 + } + }, + { + "model_id": "stabilityai/stablelm-2-12b", + "name": "stablelm-2-12b", + "developer": "stabilityai", + "scores": { + "IFEval": 0.1569, + "BBH": 0.4509, + "MATH Level 5": 0.0431, + "GPQA": 0.2785, + "MUSR": 0.4479, + "MMLU-PRO": 0.3072 + } + }, + { + "model_id": "stabilityai/stablelm-2-12b-chat", + "name": "stablelm-2-12b-chat", + "developer": "stabilityai", + "scores": { + "IFEval": 0.4082, + "BBH": 0.4672, + "MATH Level 5": 0.0536, + "GPQA": 0.2668, + "MUSR": 0.3914, + "MMLU-PRO": 0.2734 + } + }, + { + "model_id": "stabilityai/stablelm-2-1_6b", + "name": "stablelm-2-1_6b", + "developer": "stabilityai", + "scores": { + "IFEval": 0.1157, + "BBH": 0.3385, + "MATH Level 5": 0.0076, + "GPQA": 0.2483, + "MUSR": 0.3882, + "MMLU-PRO": 0.1464 + } + }, + { + "model_id": "stabilityai/stablelm-2-1_6b-chat", + "name": "stablelm-2-1_6b-chat", + "developer": "stabilityai", + "scores": { + "IFEval": 0.306, + "BBH": 0.339, + "MATH Level 5": 0.0249, + "GPQA": 0.2475, + "MUSR": 0.358, + "MMLU-PRO": 0.1622 + } + }, + { + "model_id": "stabilityai/stablelm-2-zephyr-1_6b", + "name": "stablelm-2-zephyr-1_6b", + "developer": "stabilityai", + "scores": { + "IFEval": 0.3279, + "BBH": 0.3352, + "MATH Level 5": 0.0332, + "GPQA": 0.2433, + "MUSR": 0.3511, + "MMLU-PRO": 0.1714 + } + }, + { + "model_id": "stabilityai/stablelm-3b-4e1t", + "name": "stablelm-3b-4e1t", + "developer": "stabilityai", + "scores": { + "IFEval": 0.2203, + "BBH": 0.3504, + "MATH Level 5": 0.0106, + "GPQA": 0.2374, + "MUSR": 0.3778, + "MMLU-PRO": 0.1669 + } + }, + { + "model_id": "stabilityai/stablelm-zephyr-3b", + "name": "stablelm-zephyr-3b", + "developer": "stabilityai", + "scores": { + "IFEval": 0.3683, + "BBH": 0.3866, + "MATH Level 5": 0.0431, + "GPQA": 0.2391, + "MUSR": 0.4183, + "MMLU-PRO": 0.1768 + } + }, + { + "model_id": "sthenno-com/miscii-14b-0130", + "name": "miscii-14b-0130", + "developer": "sthenno-com", + "scores": { + "IFEval": 0.6647, + "BBH": 0.6505, + "MATH Level 5": 0.432, + "GPQA": 0.3817, + "MUSR": 0.4912, + "MMLU-PRO": 0.5363 + } + }, + { + "model_id": "sthenno-com/miscii-14b-0218", + "name": "miscii-14b-0218", + "developer": "sthenno-com", + "scores": { + "IFEval": 0.7656, + "BBH": 0.6559, + "MATH Level 5": 0.5144, + "GPQA": 0.3834, + "MUSR": 0.4273, + "MMLU-PRO": 0.5298 + } + }, + { + "model_id": "sthenno-com/miscii-14b-1028", + "name": "miscii-14b-1028", + "developer": "sthenno-com", + "scores": { + "IFEval": 0.8237, + "BBH": 0.6448, + "MATH Level 5": 0.503, + "GPQA": 0.3565, + "MUSR": 0.4182, + "MMLU-PRO": 0.5153 + } + }, + { + "model_id": "sthenno-com/miscii-14b-1225", + "name": "miscii-14b-1225", + "developer": "sthenno-com", + "scores": { + "IFEval": 0.7878, + "BBH": 0.6572, + "MATH Level 5": 0.4517, + "GPQA": 0.3775, + "MUSR": 0.4366, + "MMLU-PRO": 0.5272 + } + }, + { + "model_id": "sthenno/tempesthenno-0120", + "name": "tempesthenno-0120", + "developer": "sthenno", + "scores": { + "IFEval": 0.539, + "BBH": 0.6373, + "MATH Level 5": 0.3353, + "GPQA": 0.3943, + "MUSR": 0.4633, + "MMLU-PRO": 0.529 + } + }, + { + "model_id": "sthenno/tempesthenno-fusion-0309", + "name": "tempesthenno-fusion-0309", + "developer": "sthenno", + "scores": { + "IFEval": 0.7692, + "BBH": 0.6581, + "MATH Level 5": 0.4766, + "GPQA": 0.37, + "MUSR": 0.4325, + "MMLU-PRO": 0.5258 + } + }, + { + "model_id": "sthenno/tempesthenno-kto-0205-ckpt80", + "name": "tempesthenno-kto-0205-ckpt80", + "developer": "sthenno", + "scores": { + "IFEval": 0.8054, + "BBH": 0.6543, + "MATH Level 5": 0.4592, + "GPQA": 0.3482, + "MUSR": 0.4248, + "MMLU-PRO": 0.5286 + } + }, + { + "model_id": "sthenno/tempesthenno-nuslerp-001", + "name": "tempesthenno-nuslerp-001", + "developer": "sthenno", + "scores": { + "IFEval": 0.7926, + "BBH": 0.6578, + "MATH Level 5": 0.4758, + "GPQA": 0.3733, + "MUSR": 0.43, + "MMLU-PRO": 0.5257 + } + }, + { + "model_id": "sthenno/tempesthenno-nuslerp-0124", + "name": "tempesthenno-nuslerp-0124", + "developer": "sthenno", + "scores": { + "IFEval": 0.7004, + "BBH": 0.6469, + "MATH Level 5": 0.4116, + "GPQA": 0.3901, + "MUSR": 0.4859, + "MMLU-PRO": 0.5352 + } + }, + { + "model_id": "sthenno/tempesthenno-ppo-ckpt40", + "name": "tempesthenno-ppo-ckpt40", + "developer": "sthenno", + "scores": { + "IFEval": 0.7923, + "BBH": 0.655, + "MATH Level 5": 0.4736, + "GPQA": 0.3775, + "MUSR": 0.4352, + "MMLU-PRO": 0.5292 + } + }, + { + "model_id": "sthenno/tempesthenno-sft-0309-ckpt10", + "name": "tempesthenno-sft-0309-ckpt10", + "developer": "sthenno", + "scores": { + "IFEval": 0.7744, + "BBH": 0.6552, + "MATH Level 5": 0.4721, + "GPQA": 0.3716, + "MUSR": 0.4364, + "MMLU-PRO": 0.5258 + } + }, + { + "model_id": "sthenno/tempesthenno-sft-0314-stage1-ckpt50", + "name": "tempesthenno-sft-0314-stage1-ckpt50", + "developer": "sthenno", + "scores": { + "IFEval": 0.7394, + "BBH": 0.6601, + "MATH Level 5": 0.4683, + "GPQA": 0.3733, + "MUSR": 0.4429, + "MMLU-PRO": 0.5302 + } + }, + { + "model_id": "sthenno/tempestissimo-14b-0309", + "name": "tempestissimo-14b-0309", + "developer": "sthenno", + "scores": { + "IFEval": 0.7549, + "BBH": 0.6587, + "MATH Level 5": 0.4796, + "GPQA": 0.3666, + "MUSR": 0.4312, + "MMLU-PRO": 0.5281 + } + }, + { + "model_id": "streamerbtw1002/Nexuim-R1-7B-Instruct", + "name": "Nexuim-R1-7B-Instruct", + "developer": "streamerbtw1002", + "scores": { + "IFEval": 0.6934, + "BBH": 0.5175, + "MATH Level 5": 0.4456, + "GPQA": 0.2592, + "MUSR": 0.3356, + "MMLU-PRO": 0.4138 + } + }, + { + "model_id": "stupidity-ai/Llama-3-8B-Instruct-MultiMoose", + "name": "Llama-3-8B-Instruct-MultiMoose", + "developer": "stupidity-ai", + "scores": { + "IFEval": 0.2318, + "BBH": 0.2823, + "MATH Level 5": 0.0, + "GPQA": 0.2534, + "MUSR": 0.3485, + "MMLU-PRO": 0.1094 + } + }, + { + "model_id": "suayptalha/Clarus-7B-v0.1", + "name": "Clarus-7B-v0.1", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7454, + "BBH": 0.5497, + "MATH Level 5": 0.4924, + "GPQA": 0.307, + "MUSR": 0.443, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "suayptalha/Clarus-7B-v0.2", + "name": "Clarus-7B-v0.2", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7679, + "BBH": 0.549, + "MATH Level 5": 0.4856, + "GPQA": 0.302, + "MUSR": 0.4417, + "MMLU-PRO": 0.44 + } + }, + { + "model_id": "suayptalha/Clarus-7B-v0.3", + "name": "Clarus-7B-v0.3", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7509, + "BBH": 0.5526, + "MATH Level 5": 0.4879, + "GPQA": 0.3121, + "MUSR": 0.4402, + "MMLU-PRO": 0.4385 + } + }, + { + "model_id": "suayptalha/DeepSeek-R1-Distill-Llama-3B", + "name": "DeepSeek-R1-Distill-Llama-3B", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7093, + "BBH": 0.4452, + "MATH Level 5": 0.2092, + "GPQA": 0.2609, + "MUSR": 0.3396, + "MMLU-PRO": 0.2978 + } + }, + { + "model_id": "suayptalha/Falcon3-Jessi-v0.4-7B-Slerp", + "name": "Falcon3-Jessi-v0.4-7B-Slerp", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7676, + "BBH": 0.5591, + "MATH Level 5": 0.3965, + "GPQA": 0.3121, + "MUSR": 0.4812, + "MMLU-PRO": 0.406 + } + }, + { + "model_id": "suayptalha/HomerCreativeAnvita-Mix-Qw7B", + "name": "HomerCreativeAnvita-Mix-Qw7B", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7808, + "BBH": 0.5565, + "MATH Level 5": 0.361, + "GPQA": 0.3146, + "MUSR": 0.4416, + "MMLU-PRO": 0.4445 + } + }, + { + "model_id": "suayptalha/Komodo-Llama-3.2-3B-v2-fp16", + "name": "Komodo-Llama-3.2-3B-v2-fp16", + "developer": "suayptalha", + "scores": { + "IFEval": 0.6341, + "BBH": 0.4355, + "MATH Level 5": 0.1065, + "GPQA": 0.2777, + "MUSR": 0.3406, + "MMLU-PRO": 0.2852 + } + }, + { + "model_id": "suayptalha/Lamarckvergence-14B", + "name": "Lamarckvergence-14B", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7656, + "BBH": 0.6517, + "MATH Level 5": 0.54, + "GPQA": 0.3633, + "MUSR": 0.4422, + "MMLU-PRO": 0.5283 + } + }, + { + "model_id": "suayptalha/Lix-14B-v0.1", + "name": "Lix-14B-v0.1", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7813, + "BBH": 0.6608, + "MATH Level 5": 0.5295, + "GPQA": 0.37, + "MUSR": 0.4338, + "MMLU-PRO": 0.5314 + } + }, + { + "model_id": "suayptalha/Luminis-phi-4", + "name": "Luminis-phi-4", + "developer": "suayptalha", + "scores": { + "IFEval": 0.69, + "BBH": 0.692, + "MATH Level 5": 0.4637, + "GPQA": 0.3515, + "MUSR": 0.4572, + "MMLU-PRO": 0.5424 + } + }, + { + "model_id": "suayptalha/Maestro-10B", + "name": "Maestro-10B", + "developer": "suayptalha", + "scores": { + "IFEval": 0.7768, + "BBH": 0.5746, + "MATH Level 5": 0.1911, + "GPQA": 0.3331, + "MUSR": 0.4397, + "MMLU-PRO": 0.4218 + } + }, + { + "model_id": "suayptalha/Rombos-2.5-T.E-8.1", + "name": "Rombos-2.5-T.E-8.1", + "developer": "suayptalha", + "scores": { + "IFEval": 0.6925, + "BBH": 0.5515, + "MATH Level 5": 0.4924, + "GPQA": 0.3112, + "MUSR": 0.4166, + "MMLU-PRO": 0.4446 + } + }, + { + "model_id": "sumink/Qmerft", + "name": "Qmerft", + "developer": "sumink", + "scores": { + "IFEval": 0.1564, + "BBH": 0.2939, + "MATH Level 5": 0.0023, + "GPQA": 0.2525, + "MUSR": 0.3688, + "MMLU-PRO": 0.1157 + } + }, + { + "model_id": "sumink/Qwenftmodel", + "name": "Qwenftmodel", + "developer": "sumink", + "scores": { + "IFEval": 0.1729, + "BBH": 0.3823, + "MATH Level 5": 0.0891, + "GPQA": 0.2567, + "MUSR": 0.3617, + "MMLU-PRO": 0.2339 + } + }, + { + "model_id": "sumink/Qwenmplus", + "name": "Qwenmplus", + "developer": "sumink", + "scores": { + "IFEval": 0.204, + "BBH": 0.3676, + "MATH Level 5": 0.0249, + "GPQA": 0.2852, + "MUSR": 0.3828, + "MMLU-PRO": 0.1992 + } + }, + { + "model_id": "sumink/Qwensci", + "name": "Qwensci", + "developer": "sumink", + "scores": { + "IFEval": 0.174, + "BBH": 0.3282, + "MATH Level 5": 0.0204, + "GPQA": 0.2584, + "MUSR": 0.3609, + "MMLU-PRO": 0.126 + } + }, + { + "model_id": "sumink/bbhqwen", + "name": "bbhqwen", + "developer": "sumink", + "scores": { + "IFEval": 0.1809, + "BBH": 0.3388, + "MATH Level 5": 0.0106, + "GPQA": 0.2576, + "MUSR": 0.4352, + "MMLU-PRO": 0.1617 + } + }, + { + "model_id": "sumink/bbhqwen2", + "name": "bbhqwen2", + "developer": "sumink", + "scores": { + "IFEval": 0.1533, + "BBH": 0.3066, + "MATH Level 5": 0.006, + "GPQA": 0.2626, + "MUSR": 0.4431, + "MMLU-PRO": 0.1149 + } + }, + { + "model_id": "sumink/bbhqwen3", + "name": "bbhqwen3", + "developer": "sumink", + "scores": { + "IFEval": 0.1943, + "BBH": 0.2951, + "MATH Level 5": 0.0, + "GPQA": 0.2576, + "MUSR": 0.3796, + "MMLU-PRO": 0.1166 + } + }, + { + "model_id": "sumink/bbhqwen4", + "name": "bbhqwen4", + "developer": "sumink", + "scores": { + "IFEval": 0.1449, + "BBH": 0.3199, + "MATH Level 5": 0.006, + "GPQA": 0.2441, + "MUSR": 0.4029, + "MMLU-PRO": 0.1509 + } + }, + { + "model_id": "sumink/bbhqwen5", + "name": "bbhqwen5", + "developer": "sumink", + "scores": { + "IFEval": 0.1522, + "BBH": 0.2913, + "MATH Level 5": 0.0023, + "GPQA": 0.2601, + "MUSR": 0.4019, + "MMLU-PRO": 0.1131 + } + }, + { + "model_id": "sumink/bbhqwen6", + "name": "bbhqwen6", + "developer": "sumink", + "scores": { + "IFEval": 0.1893, + "BBH": 0.2782, + "MATH Level 5": 0.0008, + "GPQA": 0.2584, + "MUSR": 0.358, + "MMLU-PRO": 0.1153 + } + }, + { + "model_id": "sumink/flflmillama", + "name": "flflmillama", + "developer": "sumink", + "scores": { + "IFEval": 0.1676, + "BBH": 0.3851, + "MATH Level 5": 0.0196, + "GPQA": 0.2919, + "MUSR": 0.3591, + "MMLU-PRO": 0.2096 + } + }, + { + "model_id": "sumink/ftgpt", + "name": "ftgpt", + "developer": "sumink", + "scores": { + "IFEval": 0.0787, + "BBH": 0.2919, + "MATH Level 5": 0.0, + "GPQA": 0.2643, + "MUSR": 0.4138, + "MMLU-PRO": 0.1172 + } + }, + { + "model_id": "sumink/llamaft", + "name": "llamaft", + "developer": "sumink", + "scores": { + "IFEval": 0.1609, + "BBH": 0.3763, + "MATH Level 5": 0.0166, + "GPQA": 0.271, + "MUSR": 0.3498, + "MMLU-PRO": 0.2114 + } + }, + { + "model_id": "sumink/llamamerge", + "name": "llamamerge", + "developer": "sumink", + "scores": { + "IFEval": 0.2672, + "BBH": 0.4632, + "MATH Level 5": 0.0151, + "GPQA": 0.2987, + "MUSR": 0.424, + "MMLU-PRO": 0.259 + } + }, + { + "model_id": "sumink/llftfl7", + "name": "llftfl7", + "developer": "sumink", + "scores": { + "IFEval": 0.1714, + "BBH": 0.3786, + "MATH Level 5": 0.0106, + "GPQA": 0.281, + "MUSR": 0.3632, + "MMLU-PRO": 0.1743 + } + }, + { + "model_id": "sumink/llmer", + "name": "llmer", + "developer": "sumink", + "scores": { + "IFEval": 0.3191, + "BBH": 0.4885, + "MATH Level 5": 0.065, + "GPQA": 0.2978, + "MUSR": 0.4039, + "MMLU-PRO": 0.3529 + } + }, + { + "model_id": "sumink/qwft", + "name": "qwft", + "developer": "sumink", + "scores": { + "IFEval": 0.1197, + "BBH": 0.3002, + "MATH Level 5": 0.0, + "GPQA": 0.2525, + "MUSR": 0.3581, + "MMLU-PRO": 0.1129 + } + }, + { + "model_id": "sumink/qwmer", + "name": "qwmer", + "developer": "sumink", + "scores": { + "IFEval": 0.2212, + "BBH": 0.4299, + "MATH Level 5": 0.0008, + "GPQA": 0.2869, + "MUSR": 0.4032, + "MMLU-PRO": 0.2215 + } + }, + { + "model_id": "sumink/solarmer3", + "name": "solarmer3", + "developer": "sumink", + "scores": { + "IFEval": 0.3741, + "BBH": 0.5266, + "MATH Level 5": 0.0582, + "GPQA": 0.2911, + "MUSR": 0.4401, + "MMLU-PRO": 0.3323 + } + }, + { + "model_id": "sumink/somer", + "name": "somer", + "developer": "sumink", + "scores": { + "IFEval": 0.299, + "BBH": 0.5194, + "MATH Level 5": 0.0415, + "GPQA": 0.2987, + "MUSR": 0.465, + "MMLU-PRO": 0.3447 + } + }, + { + "model_id": "sumink/somer2", + "name": "somer2", + "developer": "sumink", + "scores": { + "IFEval": 0.3132, + "BBH": 0.5167, + "MATH Level 5": 0.0468, + "GPQA": 0.3037, + "MUSR": 0.4663, + "MMLU-PRO": 0.3433 + } + }, + { + "model_id": "sumink/somerft", + "name": "somerft", + "developer": "sumink", + "scores": { + "IFEval": 0.1431, + "BBH": 0.3093, + "MATH Level 5": 0.0144, + "GPQA": 0.2483, + "MUSR": 0.4045, + "MMLU-PRO": 0.1117 + } + }, + { + "model_id": "sunbaby/BrainCog-8B-0.1-Instruct", + "name": "BrainCog-8B-0.1-Instruct", + "developer": "sunbaby", + "scores": { + "IFEval": 0.4253, + "BBH": 0.4618, + "MATH Level 5": 0.0967, + "GPQA": 0.3012, + "MUSR": 0.3656, + "MMLU-PRO": 0.2858 + } + }, + { + "model_id": "swap-uniba/LLaMAntino-3-ANITA-8B-Inst-DPO-ITA", + "name": "LLaMAntino-3-ANITA-8B-Inst-DPO-ITA", + "developer": "swap-uniba", + "scores": { + "IFEval": 0.4815, + "BBH": 0.4936, + "MATH Level 5": 0.0483, + "GPQA": 0.2987, + "MUSR": 0.4387, + "MMLU-PRO": 0.3723 + } + }, + { + "model_id": "synergetic/FrankenQwen2.5-14B", + "name": "FrankenQwen2.5-14B", + "developer": "synergetic", + "scores": { + "IFEval": 0.1869, + "BBH": 0.6048, + "MATH Level 5": 0.0, + "GPQA": 0.2701, + "MUSR": 0.3843, + "MMLU-PRO": 0.4382 + } + }, + { + "model_id": "talha2001/Beast-Soul-new", + "name": "Beast-Soul-new", + "developer": "talha2001", + "scores": { + "IFEval": 0.4854, + "BBH": 0.5227, + "MATH Level 5": 0.074, + "GPQA": 0.2819, + "MUSR": 0.4459, + "MMLU-PRO": 0.3102 + } + }, + { + "model_id": "tangledgroup/tangled-llama-pints-1.5b-v0.1-instruct", + "name": "tangled-llama-pints-1.5b-v0.1-instruct", + "developer": "tangledgroup", + "scores": { + "IFEval": 0.1509, + "BBH": 0.3143, + "MATH Level 5": 0.0121, + "GPQA": 0.2399, + "MUSR": 0.3761, + "MMLU-PRO": 0.1109 + } + }, + { + "model_id": "tangledgroup/tangled-llama-pints-1.5b-v0.2-instruct", + "name": "tangled-llama-pints-1.5b-v0.2-instruct", + "developer": "tangledgroup", + "scores": { + "IFEval": 0.1724, + "BBH": 0.3158, + "MATH Level 5": 0.0128, + "GPQA": 0.2416, + "MUSR": 0.3643, + "MMLU-PRO": 0.1117 + } + }, + { + "model_id": "tanliboy/lambda-gemma-2-9b-dpo", + "name": "lambda-gemma-2-9b-dpo", + "developer": "tanliboy", + "scores": { + "IFEval": 0.1829, + "BBH": 0.5488, + "MATH Level 5": 0.0, + "GPQA": 0.3104, + "MUSR": 0.4056, + "MMLU-PRO": 0.3805 + } + }, + { + "model_id": "tanliboy/lambda-qwen2.5-14b-dpo-test", + "name": "lambda-qwen2.5-14b-dpo-test", + "developer": "tanliboy", + "scores": { + "IFEval": 0.8231, + "BBH": 0.6394, + "MATH Level 5": 0.5461, + "GPQA": 0.3624, + "MUSR": 0.426, + "MMLU-PRO": 0.4848 + } + }, + { + "model_id": "tanliboy/lambda-qwen2.5-32b-dpo-test", + "name": "lambda-qwen2.5-32b-dpo-test", + "developer": "tanliboy", + "scores": { + "IFEval": 0.8084, + "BBH": 0.6764, + "MATH Level 5": 0.6103, + "GPQA": 0.3565, + "MUSR": 0.4274, + "MMLU-PRO": 0.5657 + } + }, + { + "model_id": "tannedbum/Ellaria-9B", + "name": "Ellaria-9B", + "developer": "tannedbum", + "scores": { + "IFEval": 0.7826, + "BBH": 0.5942, + "MATH Level 5": 0.2077, + "GPQA": 0.3331, + "MUSR": 0.4151, + "MMLU-PRO": 0.4205 + } + }, + { + "model_id": "tannedbum/L3-Nymeria-Maid-8B", + "name": "L3-Nymeria-Maid-8B", + "developer": "tannedbum", + "scores": { + "IFEval": 0.725, + "BBH": 0.5146, + "MATH Level 5": 0.0937, + "GPQA": 0.2961, + "MUSR": 0.3751, + "MMLU-PRO": 0.3747 + } + }, + { + "model_id": "tannedbum/L3-Nymeria-v2-8B", + "name": "L3-Nymeria-v2-8B", + "developer": "tannedbum", + "scores": { + "IFEval": 0.7168, + "BBH": 0.5224, + "MATH Level 5": 0.0921, + "GPQA": 0.2903, + "MUSR": 0.3699, + "MMLU-PRO": 0.3753 + } + }, + { + "model_id": "tannedbum/L3-Rhaenys-8B", + "name": "L3-Rhaenys-8B", + "developer": "tannedbum", + "scores": { + "IFEval": 0.7363, + "BBH": 0.5299, + "MATH Level 5": 0.0876, + "GPQA": 0.2978, + "MUSR": 0.3725, + "MMLU-PRO": 0.3799 + } + }, + { + "model_id": "teknium/CollectiveCognition-v1.1-Mistral-7B", + "name": "CollectiveCognition-v1.1-Mistral-7B", + "developer": "teknium", + "scores": { + "IFEval": 0.279, + "BBH": 0.4493, + "MATH Level 5": 0.031, + "GPQA": 0.2869, + "MUSR": 0.3869, + "MMLU-PRO": 0.2837 + } + }, + { + "model_id": "teknium/OpenHermes-13B", + "name": "OpenHermes-13B", + "developer": "teknium", + "scores": { + "IFEval": 0.2668, + "BBH": 0.4206, + "MATH Level 5": 0.0121, + "GPQA": 0.2727, + "MUSR": 0.4043, + "MMLU-PRO": 0.2389 + } + }, + { + "model_id": "teknium/OpenHermes-2-Mistral-7B", + "name": "OpenHermes-2-Mistral-7B", + "developer": "teknium", + "scores": { + "IFEval": 0.5286, + "BBH": 0.4948, + "MATH Level 5": 0.0453, + "GPQA": 0.2836, + "MUSR": 0.452, + "MMLU-PRO": 0.2931 + } + }, + { + "model_id": "teknium/OpenHermes-2.5-Mistral-7B", + "name": "OpenHermes-2.5-Mistral-7B", + "developer": "teknium", + "scores": { + "IFEval": 0.5571, + "BBH": 0.487, + "MATH Level 5": 0.0506, + "GPQA": 0.2836, + "MUSR": 0.4242, + "MMLU-PRO": 0.3054 + } + }, + { + "model_id": "teknium/OpenHermes-7B", + "name": "OpenHermes-7B", + "developer": "teknium", + "scores": { + "IFEval": 0.1813, + "BBH": 0.362, + "MATH Level 5": 0.0159, + "GPQA": 0.2693, + "MUSR": 0.4324, + "MMLU-PRO": 0.1933 + } + }, + { + "model_id": "tensopolis/falcon3-10b-tensopolis-v1", + "name": "falcon3-10b-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.7817, + "BBH": 0.6182, + "MATH Level 5": 0.2749, + "GPQA": 0.3297, + "MUSR": 0.4375, + "MMLU-PRO": 0.442 + } + }, + { + "model_id": "tensopolis/falcon3-10b-tensopolis-v2", + "name": "falcon3-10b-tensopolis-v2", + "developer": "tensopolis", + "scores": { + "IFEval": 0.7792, + "BBH": 0.6182, + "MATH Level 5": 0.2666, + "GPQA": 0.3272, + "MUSR": 0.4297, + "MMLU-PRO": 0.4424 + } + }, + { + "model_id": "tensopolis/lamarckvergence-14b-tensopolis-v1", + "name": "lamarckvergence-14b-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.7604, + "BBH": 0.6561, + "MATH Level 5": 0.5166, + "GPQA": 0.3607, + "MUSR": 0.4475, + "MMLU-PRO": 0.525 + } + }, + { + "model_id": "tensopolis/mistral-small-2501-tensopolis-v1", + "name": "mistral-small-2501-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.7762, + "BBH": 0.6475, + "MATH Level 5": 0.4441, + "GPQA": 0.3574, + "MUSR": 0.428, + "MMLU-PRO": 0.4465 + } + }, + { + "model_id": "tensopolis/mistral-small-r1-tensopolis", + "name": "mistral-small-r1-tensopolis", + "developer": "tensopolis", + "scores": { + "IFEval": 0.4622, + "BBH": 0.5436, + "MATH Level 5": 0.2908, + "GPQA": 0.2819, + "MUSR": 0.3738, + "MMLU-PRO": 0.4035 + } + }, + { + "model_id": "tensopolis/phi-4-tensopolis-v1", + "name": "phi-4-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.6767, + "BBH": 0.6872, + "MATH Level 5": 0.494, + "GPQA": 0.3347, + "MUSR": 0.4141, + "MMLU-PRO": 0.5384 + } + }, + { + "model_id": "tensopolis/qwen2.5-14b-tensopolis-v1", + "name": "qwen2.5-14b-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.799, + "BBH": 0.6364, + "MATH Level 5": 0.5295, + "GPQA": 0.3347, + "MUSR": 0.4193, + "MMLU-PRO": 0.4911 + } + }, + { + "model_id": "tensopolis/qwen2.5-3b-or1-tensopolis", + "name": "qwen2.5-3b-or1-tensopolis", + "developer": "tensopolis", + "scores": { + "IFEval": 0.354, + "BBH": 0.4421, + "MATH Level 5": 0.173, + "GPQA": 0.2945, + "MUSR": 0.3749, + "MMLU-PRO": 0.3197 + } + }, + { + "model_id": "tensopolis/qwen2.5-7b-tensopolis-v1", + "name": "qwen2.5-7b-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.7661, + "BBH": 0.5379, + "MATH Level 5": 0.4562, + "GPQA": 0.2961, + "MUSR": 0.4339, + "MMLU-PRO": 0.4269 + } + }, + { + "model_id": "tensopolis/qwen2.5-7b-tensopolis-v2", + "name": "qwen2.5-7b-tensopolis-v2", + "developer": "tensopolis", + "scores": { + "IFEval": 0.7521, + "BBH": 0.5415, + "MATH Level 5": 0.4819, + "GPQA": 0.2903, + "MUSR": 0.4246, + "MMLU-PRO": 0.4243 + } + }, + { + "model_id": "tensopolis/virtuoso-lite-tensopolis-v1", + "name": "virtuoso-lite-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.8069, + "BBH": 0.6102, + "MATH Level 5": 0.2545, + "GPQA": 0.3448, + "MUSR": 0.4582, + "MMLU-PRO": 0.4435 + } + }, + { + "model_id": "tensopolis/virtuoso-lite-tensopolis-v2", + "name": "virtuoso-lite-tensopolis-v2", + "developer": "tensopolis", + "scores": { + "IFEval": 0.8029, + "BBH": 0.61, + "MATH Level 5": 0.25, + "GPQA": 0.3431, + "MUSR": 0.4595, + "MMLU-PRO": 0.444 + } + }, + { + "model_id": "tensopolis/virtuoso-small-tensopolis-v1", + "name": "virtuoso-small-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.7856, + "BBH": 0.6415, + "MATH Level 5": 0.3527, + "GPQA": 0.328, + "MUSR": 0.4326, + "MMLU-PRO": 0.4968 + } + }, + { + "model_id": "tensopolis/virtuoso-small-tensopolis-v2", + "name": "virtuoso-small-tensopolis-v2", + "developer": "tensopolis", + "scores": { + "IFEval": 0.802, + "BBH": 0.6516, + "MATH Level 5": 0.3875, + "GPQA": 0.3289, + "MUSR": 0.4352, + "MMLU-PRO": 0.5154 + } + }, + { + "model_id": "tensopolis/virtuoso-small-v2-tensopolis-v1", + "name": "virtuoso-small-v2-tensopolis-v1", + "developer": "tensopolis", + "scores": { + "IFEval": 0.8419, + "BBH": 0.6545, + "MATH Level 5": 0.4524, + "GPQA": 0.3465, + "MUSR": 0.4509, + "MMLU-PRO": 0.5175 + } + }, + { + "model_id": "tensoropera/Fox-1-1.6B", + "name": "Fox-1-1.6B", + "developer": "tensoropera", + "scores": { + "IFEval": 0.2766, + "BBH": 0.3307, + "MATH Level 5": 0.0174, + "GPQA": 0.2634, + "MUSR": 0.355, + "MMLU-PRO": 0.1371 + } + }, + { + "model_id": "tenyx/Llama3-TenyxChat-70B", + "name": "Llama3-TenyxChat-70B", + "developer": "tenyx", + "scores": { + "IFEval": 0.8087, + "BBH": 0.6511, + "MATH Level 5": 0.2356, + "GPQA": 0.3012, + "MUSR": 0.426, + "MMLU-PRO": 0.521 + } + }, + { + "model_id": "theo77186/Qwen2.5-Coder-7B-Instruct-20241106", + "name": "Qwen2.5-Coder-7B-Instruct-20241106", + "developer": "theo77186", + "scores": { + "IFEval": 0.6101, + "BBH": 0.5008, + "MATH Level 5": 0.3882, + "GPQA": 0.2919, + "MUSR": 0.4073, + "MMLU-PRO": 0.3353 + } + }, + { + "model_id": "theprint/Boptruth-Agatha-7B", + "name": "Boptruth-Agatha-7B", + "developer": "theprint", + "scores": { + "IFEval": 0.3124, + "BBH": 0.4984, + "MATH Level 5": 0.0551, + "GPQA": 0.2995, + "MUSR": 0.4277, + "MMLU-PRO": 0.2861 + } + }, + { + "model_id": "theprint/CleverBoi-7B-v2", + "name": "CleverBoi-7B-v2", + "developer": "theprint", + "scores": { + "IFEval": 0.217, + "BBH": 0.4532, + "MATH Level 5": 0.0264, + "GPQA": 0.2886, + "MUSR": 0.4695, + "MMLU-PRO": 0.2709 + } + }, + { + "model_id": "theprint/CleverBoi-7B-v3", + "name": "CleverBoi-7B-v3", + "developer": "theprint", + "scores": { + "IFEval": 0.2382, + "BBH": 0.4414, + "MATH Level 5": 0.04, + "GPQA": 0.2659, + "MUSR": 0.4072, + "MMLU-PRO": 0.2868 + } + }, + { + "model_id": "theprint/CleverBoi-Llama-3.1-8B-Instruct", + "name": "CleverBoi-Llama-3.1-8B-Instruct", + "developer": "theprint", + "scores": { + "IFEval": 0.1682, + "BBH": 0.456, + "MATH Level 5": 0.0491, + "GPQA": 0.3003, + "MUSR": 0.4014, + "MMLU-PRO": 0.3075 + } + }, + { + "model_id": "theprint/CleverBoi-Llama-3.1-8B-v2", + "name": "CleverBoi-Llama-3.1-8B-v2", + "developer": "theprint", + "scores": { + "IFEval": 0.1961, + "BBH": 0.4668, + "MATH Level 5": 0.0529, + "GPQA": 0.2861, + "MUSR": 0.3735, + "MMLU-PRO": 0.3188 + } + }, + { + "model_id": "theprint/CleverBoi-Nemo-12B-v2", + "name": "CleverBoi-Nemo-12B-v2", + "developer": "theprint", + "scores": { + "IFEval": 0.2046, + "BBH": 0.5241, + "MATH Level 5": 0.1035, + "GPQA": 0.3138, + "MUSR": 0.4187, + "MMLU-PRO": 0.3228 + } + }, + { + "model_id": "theprint/Code-Llama-Bagel-8B", + "name": "Code-Llama-Bagel-8B", + "developer": "theprint", + "scores": { + "IFEval": 0.253, + "BBH": 0.4697, + "MATH Level 5": 0.0612, + "GPQA": 0.276, + "MUSR": 0.368, + "MMLU-PRO": 0.2822 + } + }, + { + "model_id": "theprint/Conversely-Mistral-7B", + "name": "Conversely-Mistral-7B", + "developer": "theprint", + "scores": { + "IFEval": 0.2608, + "BBH": 0.4672, + "MATH Level 5": 0.0279, + "GPQA": 0.2852, + "MUSR": 0.4189, + "MMLU-PRO": 0.2826 + } + }, + { + "model_id": "theprint/Llama-3.2-3B-VanRossum", + "name": "Llama-3.2-3B-VanRossum", + "developer": "theprint", + "scores": { + "IFEval": 0.4783, + "BBH": 0.4279, + "MATH Level 5": 0.0974, + "GPQA": 0.2676, + "MUSR": 0.3442, + "MMLU-PRO": 0.277 + } + }, + { + "model_id": "theprint/ReWiz-7B", + "name": "ReWiz-7B", + "developer": "theprint", + "scores": { + "IFEval": 0.4048, + "BBH": 0.4564, + "MATH Level 5": 0.0408, + "GPQA": 0.2752, + "MUSR": 0.4612, + "MMLU-PRO": 0.267 + } + }, + { + "model_id": "theprint/ReWiz-Llama-3.1-8B-v2", + "name": "ReWiz-Llama-3.1-8B-v2", + "developer": "theprint", + "scores": { + "IFEval": 0.2379, + "BBH": 0.4632, + "MATH Level 5": 0.0574, + "GPQA": 0.3029, + "MUSR": 0.3814, + "MMLU-PRO": 0.331 + } + }, + { + "model_id": "theprint/ReWiz-Llama-3.2-3B", + "name": "ReWiz-Llama-3.2-3B", + "developer": "theprint", + "scores": { + "IFEval": 0.4649, + "BBH": 0.4343, + "MATH Level 5": 0.1095, + "GPQA": 0.2836, + "MUSR": 0.3614, + "MMLU-PRO": 0.2887 + } + }, + { + "model_id": "theprint/ReWiz-Nemo-12B-Instruct", + "name": "ReWiz-Nemo-12B-Instruct", + "developer": "theprint", + "scores": { + "IFEval": 0.1062, + "BBH": 0.5092, + "MATH Level 5": 0.1042, + "GPQA": 0.3238, + "MUSR": 0.4096, + "MMLU-PRO": 0.3339 + } + }, + { + "model_id": "theprint/ReWiz-Qwen-2.5-14B", + "name": "ReWiz-Qwen-2.5-14B", + "developer": "theprint", + "scores": { + "IFEval": 0.2785, + "BBH": 0.6179, + "MATH Level 5": 0.2923, + "GPQA": 0.38, + "MUSR": 0.4539, + "MMLU-PRO": 0.5092 + } + }, + { + "model_id": "theprint/ReWiz-Worldbuilder-7B", + "name": "ReWiz-Worldbuilder-7B", + "developer": "theprint", + "scores": { + "IFEval": 0.251, + "BBH": 0.4636, + "MATH Level 5": 0.037, + "GPQA": 0.2693, + "MUSR": 0.4572, + "MMLU-PRO": 0.2971 + } + }, + { + "model_id": "theprint/RuDolph-Hermes-7B", + "name": "RuDolph-Hermes-7B", + "developer": "theprint", + "scores": { + "IFEval": 0.3604, + "BBH": 0.5053, + "MATH Level 5": 0.0514, + "GPQA": 0.3121, + "MUSR": 0.4226, + "MMLU-PRO": 0.3073 + } + }, + { + "model_id": "theprint/WorldBuilder-12B", + "name": "WorldBuilder-12B", + "developer": "theprint", + "scores": { + "IFEval": 0.1374, + "BBH": 0.501, + "MATH Level 5": 0.0446, + "GPQA": 0.297, + "MUSR": 0.4066, + "MMLU-PRO": 0.3192 + } + }, + { + "model_id": "theprint/phi-3-mini-4k-python", + "name": "phi-3-mini-4k-python", + "developer": "theprint", + "scores": { + "IFEval": 0.2409, + "BBH": 0.4938, + "MATH Level 5": 0.105, + "GPQA": 0.2911, + "MUSR": 0.3922, + "MMLU-PRO": 0.3577 + } + }, + { + "model_id": "thinkcoder/llama3-8b-instruct-lora-8-sft", + "name": "llama3-8b-instruct-lora-8-sft", + "developer": "thinkcoder", + "scores": { + "IFEval": 0.648, + "BBH": 0.4865, + "MATH Level 5": 0.102, + "GPQA": 0.2668, + "MUSR": 0.3235, + "MMLU-PRO": 0.3476 + } + }, + { + "model_id": "thirdeyeai/elevate360m", + "name": "elevate360m", + "developer": "thirdeyeai", + "scores": { + "IFEval": 0.0445, + "BBH": 0.2963, + "MATH Level 5": 0.0159, + "GPQA": 0.2408, + "MUSR": 0.3462, + "MMLU-PRO": 0.1077 + } + }, + { + "model_id": "thomas-yanxin/XinYuan-Qwen2-1_5B", + "name": "XinYuan-Qwen2-1_5B", + "developer": "thomas-yanxin", + "scores": { + "IFEval": 0.2986, + "BBH": 0.3635, + "MATH Level 5": 0.0672, + "GPQA": 0.2701, + "MUSR": 0.3634, + "MMLU-PRO": 0.2357 + } + }, + { + "model_id": "thomas-yanxin/XinYuan-Qwen2-7B", + "name": "XinYuan-Qwen2-7B", + "developer": "thomas-yanxin", + "scores": { + "IFEval": 0.4438, + "BBH": 0.4937, + "MATH Level 5": 0.1458, + "GPQA": 0.2911, + "MUSR": 0.4058, + "MMLU-PRO": 0.3925 + } + }, + { + "model_id": "thomas-yanxin/XinYuan-Qwen2-7B-0917", + "name": "XinYuan-Qwen2-7B-0917", + "developer": "thomas-yanxin", + "scores": { + "IFEval": 0.3719, + "BBH": 0.5169, + "MATH Level 5": 0.1979, + "GPQA": 0.3096, + "MUSR": 0.4401, + "MMLU-PRO": 0.4245 + } + }, + { + "model_id": "thomas-yanxin/XinYuan-Qwen2.5-7B-0917", + "name": "XinYuan-Qwen2.5-7B-0917", + "developer": "thomas-yanxin", + "scores": { + "IFEval": 0.3577, + "BBH": 0.5184, + "MATH Level 5": 0.1934, + "GPQA": 0.281, + "MUSR": 0.3676, + "MMLU-PRO": 0.3882 + } + }, + { + "model_id": "tianyil1/MistralForCausalLM_Cal_DPO", + "name": "MistralForCausalLM_Cal_DPO", + "developer": "tianyil1", + "scores": { + "IFEval": 0.5328, + "BBH": 0.4381, + "MATH Level 5": 0.0287, + "GPQA": 0.276, + "MUSR": 0.3977, + "MMLU-PRO": 0.2763 + } + }, + { + "model_id": "tiiuae/Falcon3-10B-Base", + "name": "Falcon3-10B-Base", + "developer": "tiiuae", + "scores": { + "IFEval": 0.3648, + "BBH": 0.595, + "MATH Level 5": 0.2492, + "GPQA": 0.3456, + "MUSR": 0.4398, + "MMLU-PRO": 0.424 + } + }, + { + "model_id": "tiiuae/Falcon3-10B-Instruct", + "name": "Falcon3-10B-Instruct", + "developer": "tiiuae", + "scores": { + "IFEval": 0.7817, + "BBH": 0.617, + "MATH Level 5": 0.2764, + "GPQA": 0.3289, + "MUSR": 0.4323, + "MMLU-PRO": 0.4429 + } + }, + { + "model_id": "tiiuae/Falcon3-1B-Base", + "name": "Falcon3-1B-Base", + "developer": "tiiuae", + "scores": { + "IFEval": 0.2428, + "BBH": 0.3571, + "MATH Level 5": 0.0332, + "GPQA": 0.2794, + "MUSR": 0.4147, + "MMLU-PRO": 0.1608 + } + }, + { + "model_id": "tiiuae/Falcon3-1B-Instruct", + "name": "Falcon3-1B-Instruct", + "developer": "tiiuae", + "scores": { + "IFEval": 0.5557, + "BBH": 0.3745, + "MATH Level 5": 0.0634, + "GPQA": 0.2668, + "MUSR": 0.4189, + "MMLU-PRO": 0.1838 + } + }, + { + "model_id": "tiiuae/Falcon3-3B-Base", + "name": "Falcon3-3B-Base", + "developer": "tiiuae", + "scores": { + "IFEval": 0.2765, + "BBH": 0.4421, + "MATH Level 5": 0.1178, + "GPQA": 0.297, + "MUSR": 0.375, + "MMLU-PRO": 0.2879 + } + }, + { + "model_id": "tiiuae/Falcon3-3B-Instruct", + "name": "Falcon3-3B-Instruct", + "developer": "tiiuae", + "scores": { + "IFEval": 0.6977, + "BBH": 0.4754, + "MATH Level 5": 0.25, + "GPQA": 0.2886, + "MUSR": 0.4136, + "MMLU-PRO": 0.3005 + } + }, + { + "model_id": "tiiuae/Falcon3-7B-Base", + "name": "Falcon3-7B-Base", + "developer": "tiiuae", + "scores": { + "IFEval": 0.3416, + "BBH": 0.5099, + "MATH Level 5": 0.1941, + "GPQA": 0.3465, + "MUSR": 0.4702, + "MMLU-PRO": 0.391 + } + }, + { + "model_id": "tiiuae/Falcon3-7B-Instruct", + "name": "Falcon3-7B-Instruct", + "developer": "tiiuae", + "scores": { + "IFEval": 0.7612, + "BBH": 0.5632, + "MATH Level 5": 0.4086, + "GPQA": 0.3104, + "MUSR": 0.4827, + "MMLU-PRO": 0.4087 + } + }, + { + "model_id": "tiiuae/Falcon3-Mamba-7B-Base", + "name": "Falcon3-Mamba-7B-Base", + "developer": "tiiuae", + "scores": { + "IFEval": 0.2891, + "BBH": 0.4699, + "MATH Level 5": 0.1941, + "GPQA": 0.3096, + "MUSR": 0.3431, + "MMLU-PRO": 0.3038 + } + }, + { + "model_id": "tiiuae/Falcon3-Mamba-7B-Instruct", + "name": "Falcon3-Mamba-7B-Instruct", + "developer": "tiiuae", + "scores": { + "IFEval": 0.7165, + "BBH": 0.4679, + "MATH Level 5": 0.3006, + "GPQA": 0.3037, + "MUSR": 0.3869, + "MMLU-PRO": 0.3369 + } + }, + { + "model_id": "tiiuae/falcon-11B", + "name": "falcon-11B", + "developer": "tiiuae", + "scores": { + "IFEval": 0.3261, + "BBH": 0.4392, + "MATH Level 5": 0.0279, + "GPQA": 0.271, + "MUSR": 0.3986, + "MMLU-PRO": 0.2389 + } + }, + { + "model_id": "tiiuae/falcon-40b", + "name": "Falcon 40B", + "developer": "tiiuae", + "scores": { + "IFEval": 0.2496, + "BBH": 0.4019, + "MATH Level 5": 0.0181, + "GPQA": 0.2735, + "MUSR": 0.3631, + "MMLU-PRO": 0.2505 + } + }, + { + "model_id": "tiiuae/falcon-40b-instruct", + "name": "falcon-40b-instruct", + "developer": "tiiuae", + "scores": { + "IFEval": 0.2454, + "BBH": 0.4054, + "MATH Level 5": 0.0196, + "GPQA": 0.25, + "MUSR": 0.3762, + "MMLU-PRO": 0.2261 + } + }, + { + "model_id": "tiiuae/falcon-7b", + "name": "Falcon 7B", + "developer": "tiiuae", + "scores": { + "IFEval": 0.1821, + "BBH": 0.3285, + "MATH Level 5": 0.0098, + "GPQA": 0.245, + "MUSR": 0.3778, + "MMLU-PRO": 0.1125 + } + }, + { + "model_id": "tiiuae/falcon-7b-instruct", + "name": "falcon-7b-instruct", + "developer": "tiiuae", + "scores": { + "IFEval": 0.1969, + "BBH": 0.3203, + "MATH Level 5": 0.0121, + "GPQA": 0.2475, + "MUSR": 0.3634, + "MMLU-PRO": 0.1155 + } + }, + { + "model_id": "tiiuae/falcon-mamba-7b", + "name": "falcon-mamba-7b", + "developer": "tiiuae", + "scores": { + "IFEval": 0.3336, + "BBH": 0.4285, + "MATH Level 5": 0.0446, + "GPQA": 0.3104, + "MUSR": 0.421, + "MMLU-PRO": 0.2302 + } + }, + { + "model_id": "tinycompany/BiBo-v0.3", + "name": "BiBo-v0.3", + "developer": "tinycompany", + "scores": { + "IFEval": 0.5184, + "BBH": 0.4642, + "MATH Level 5": 0.0876, + "GPQA": 0.2676, + "MUSR": 0.395, + "MMLU-PRO": 0.2995 + } + }, + { + "model_id": "tinycompany/BiBo-v0.7", + "name": "BiBo-v0.7", + "developer": "tinycompany", + "scores": { + "IFEval": 0.3738, + "BBH": 0.4311, + "MATH Level 5": 0.0823, + "GPQA": 0.2768, + "MUSR": 0.4044, + "MMLU-PRO": 0.265 + } + }, + { + "model_id": "tinycompany/ShawtyIsBad-bgem3", + "name": "ShawtyIsBad-bgem3", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2608, + "BBH": 0.3853, + "MATH Level 5": 0.0483, + "GPQA": 0.3054, + "MUSR": 0.3695, + "MMLU-PRO": 0.2583 + } + }, + { + "model_id": "tinycompany/ShawtyIsBad-e5-large", + "name": "ShawtyIsBad-e5-large", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2468, + "BBH": 0.3873, + "MATH Level 5": 0.0453, + "GPQA": 0.302, + "MUSR": 0.372, + "MMLU-PRO": 0.2569 + } + }, + { + "model_id": "tinycompany/ShawtyIsBad-ib", + "name": "ShawtyIsBad-ib", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2565, + "BBH": 0.388, + "MATH Level 5": 0.0491, + "GPQA": 0.2987, + "MUSR": 0.3641, + "MMLU-PRO": 0.2581 + } + }, + { + "model_id": "tinycompany/ShawtyIsBad-nomic-moe", + "name": "ShawtyIsBad-nomic-moe", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2608, + "BBH": 0.3878, + "MATH Level 5": 0.0431, + "GPQA": 0.307, + "MUSR": 0.3747, + "MMLU-PRO": 0.2572 + } + }, + { + "model_id": "tinycompany/ShawtyIsBad-nomic1.5", + "name": "ShawtyIsBad-nomic1.5", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2544, + "BBH": 0.3874, + "MATH Level 5": 0.0431, + "GPQA": 0.3112, + "MUSR": 0.3628, + "MMLU-PRO": 0.2567 + } + }, + { + "model_id": "tinycompany/SigmaBoi-base", + "name": "SigmaBoi-base", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2447, + "BBH": 0.4314, + "MATH Level 5": 0.0778, + "GPQA": 0.2936, + "MUSR": 0.4343, + "MMLU-PRO": 0.2817 + } + }, + { + "model_id": "tinycompany/SigmaBoi-bge-m3", + "name": "SigmaBoi-bge-m3", + "developer": "tinycompany", + "scores": { + "IFEval": 0.245, + "BBH": 0.4351, + "MATH Level 5": 0.0763, + "GPQA": 0.2945, + "MUSR": 0.4383, + "MMLU-PRO": 0.2819 + } + }, + { + "model_id": "tinycompany/SigmaBoi-bgem3", + "name": "SigmaBoi-bgem3", + "developer": "tinycompany", + "scores": { + "IFEval": 0.245, + "BBH": 0.4351, + "MATH Level 5": 0.0763, + "GPQA": 0.2945, + "MUSR": 0.4383, + "MMLU-PRO": 0.2819 + } + }, + { + "model_id": "tinycompany/SigmaBoi-ib", + "name": "SigmaBoi-ib", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2477, + "BBH": 0.4344, + "MATH Level 5": 0.074, + "GPQA": 0.2878, + "MUSR": 0.429, + "MMLU-PRO": 0.2824 + } + }, + { + "model_id": "tinycompany/SigmaBoi-nomic-moe", + "name": "SigmaBoi-nomic-moe", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2474, + "BBH": 0.4334, + "MATH Level 5": 0.0718, + "GPQA": 0.2928, + "MUSR": 0.4316, + "MMLU-PRO": 0.2837 + } + }, + { + "model_id": "tinycompany/SigmaBoi-nomic1.5", + "name": "SigmaBoi-nomic1.5", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2447, + "BBH": 0.4371, + "MATH Level 5": 0.0831, + "GPQA": 0.2961, + "MUSR": 0.4316, + "MMLU-PRO": 0.2841 + } + }, + { + "model_id": "tinycompany/SigmaBoi-nomic1.5-fp32", + "name": "SigmaBoi-nomic1.5-fp32", + "developer": "tinycompany", + "scores": { + "IFEval": 0.2462, + "BBH": 0.4371, + "MATH Level 5": 0.0831, + "GPQA": 0.2961, + "MUSR": 0.4316, + "MMLU-PRO": 0.2841 + } + }, + { + "model_id": "tinycompany/Tamed-Shawty", + "name": "Tamed-Shawty", + "developer": "tinycompany", + "scores": { + "IFEval": 0.3831, + "BBH": 0.3837, + "MATH Level 5": 0.0718, + "GPQA": 0.2626, + "MUSR": 0.3501, + "MMLU-PRO": 0.2601 + } + }, + { + "model_id": "tklohj/WindyFloLLM", + "name": "WindyFloLLM", + "developer": "tklohj", + "scores": { + "IFEval": 0.2669, + "BBH": 0.4637, + "MATH Level 5": 0.0159, + "GPQA": 0.2752, + "MUSR": 0.4253, + "MMLU-PRO": 0.2581 + } + }, + { + "model_id": "togethercomputer/GPT-JT-6B-v1", + "name": "GPT-JT-6B-v1", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.2061, + "BBH": 0.3303, + "MATH Level 5": 0.0106, + "GPQA": 0.2609, + "MUSR": 0.3737, + "MMLU-PRO": 0.1626 + } + }, + { + "model_id": "togethercomputer/GPT-NeoXT-Chat-Base-20B", + "name": "GPT-NeoXT-Chat-Base-20B", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.183, + "BBH": 0.3321, + "MATH Level 5": 0.0234, + "GPQA": 0.25, + "MUSR": 0.3461, + "MMLU-PRO": 0.1145 + } + }, + { + "model_id": "togethercomputer/LLaMA-2-7B-32K", + "name": "LLaMA-2-7B-32K", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.1865, + "BBH": 0.34, + "MATH Level 5": 0.0144, + "GPQA": 0.25, + "MUSR": 0.3754, + "MMLU-PRO": 0.1768 + } + }, + { + "model_id": "togethercomputer/Llama-2-7B-32K-Instruct", + "name": "Llama-2-7B-32K-Instruct", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.213, + "BBH": 0.3443, + "MATH Level 5": 0.0159, + "GPQA": 0.2517, + "MUSR": 0.4056, + "MMLU-PRO": 0.1781 + } + }, + { + "model_id": "togethercomputer/RedPajama-INCITE-7B-Base", + "name": "RedPajama-INCITE-7B-Base", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.2082, + "BBH": 0.3195, + "MATH Level 5": 0.0159, + "GPQA": 0.255, + "MUSR": 0.362, + "MMLU-PRO": 0.1197 + } + }, + { + "model_id": "togethercomputer/RedPajama-INCITE-7B-Chat", + "name": "RedPajama-INCITE-7B-Chat", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.1558, + "BBH": 0.3175, + "MATH Level 5": 0.0068, + "GPQA": 0.2525, + "MUSR": 0.3448, + "MMLU-PRO": 0.1121 + } + }, + { + "model_id": "togethercomputer/RedPajama-INCITE-7B-Instruct", + "name": "RedPajama-INCITE-7B-Instruct", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.2055, + "BBH": 0.3377, + "MATH Level 5": 0.0211, + "GPQA": 0.2508, + "MUSR": 0.3685, + "MMLU-PRO": 0.1272 + } + }, + { + "model_id": "togethercomputer/RedPajama-INCITE-Base-3B-v1", + "name": "RedPajama-INCITE-Base-3B-v1", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.2294, + "BBH": 0.306, + "MATH Level 5": 0.0144, + "GPQA": 0.2433, + "MUSR": 0.3739, + "MMLU-PRO": 0.1111 + } + }, + { + "model_id": "togethercomputer/RedPajama-INCITE-Chat-3B-v1", + "name": "RedPajama-INCITE-Chat-3B-v1", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.1652, + "BBH": 0.3217, + "MATH Level 5": 0.0091, + "GPQA": 0.2441, + "MUSR": 0.3684, + "MMLU-PRO": 0.1127 + } + }, + { + "model_id": "togethercomputer/RedPajama-INCITE-Instruct-3B-v1", + "name": "RedPajama-INCITE-Instruct-3B-v1", + "developer": "togethercomputer", + "scores": { + "IFEval": 0.2124, + "BBH": 0.3146, + "MATH Level 5": 0.0128, + "GPQA": 0.2475, + "MUSR": 0.3886, + "MMLU-PRO": 0.111 + } + }, + { + "model_id": "tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1", + "name": "Llama-3-Swallow-8B-Instruct-v0.1", + "developer": "tokyotech-llm", + "scores": { + "IFEval": 0.5508, + "BBH": 0.5009, + "MATH Level 5": 0.0748, + "GPQA": 0.2894, + "MUSR": 0.4357, + "MMLU-PRO": 0.3088 + } + }, + { + "model_id": "tomasmcm/sky-t1-coder-32b-flash", + "name": "sky-t1-coder-32b-flash", + "developer": "tomasmcm", + "scores": { + "IFEval": 0.778, + "BBH": 0.6822, + "MATH Level 5": 0.5423, + "GPQA": 0.3683, + "MUSR": 0.4233, + "MMLU-PRO": 0.5782 + } + }, + { + "model_id": "trthminh1112/autotrain-llama32-1b-finetune", + "name": "autotrain-llama32-1b-finetune", + "developer": "trthminh1112", + "scores": { + "IFEval": 0.1769, + "BBH": 0.2996, + "MATH Level 5": 0.0151, + "GPQA": 0.2567, + "MUSR": 0.3513, + "MMLU-PRO": 0.1099 + } + }, + { + "model_id": "tugstugi/Qwen2.5-7B-Instruct-QwQ-v0.1", + "name": "Qwen2.5-7B-Instruct-QwQ-v0.1", + "developer": "tugstugi", + "scores": { + "IFEval": 0.6017, + "BBH": 0.5101, + "MATH Level 5": 0.3814, + "GPQA": 0.2685, + "MUSR": 0.3794, + "MMLU-PRO": 0.4081 + } + }, + { + "model_id": "universalml/NepaliGPT-2.0", + "name": "NepaliGPT-2.0", + "developer": "universalml", + "scores": { + "IFEval": 0.0365, + "BBH": 0.466, + "MATH Level 5": 0.0045, + "GPQA": 0.281, + "MUSR": 0.4657, + "MMLU-PRO": 0.33 + } + }, + { + "model_id": "unsloth/Llama-3.2-1B-Instruct", + "name": "Llama-3.2-1B-Instruct", + "developer": "unsloth", + "scores": { + "IFEval": 0.581, + "BBH": 0.3485, + "MATH Level 5": 0.0823, + "GPQA": 0.2676, + "MUSR": 0.3196, + "MMLU-PRO": 0.1742 + } + }, + { + "model_id": "unsloth/Llama-3.2-1B-Instruct-no-system-message", + "name": "Llama-3.2-1B-Instruct-no-system-message", + "developer": "unsloth", + "scores": { + "IFEval": 0.565, + "BBH": 0.3544, + "MATH Level 5": 0.0755, + "GPQA": 0.2727, + "MUSR": 0.3341, + "MMLU-PRO": 0.1669 + } + }, + { + "model_id": "unsloth/Phi-3-mini-4k-instruct", + "name": "Phi-3-mini-4k-instruct", + "developer": "unsloth", + "scores": { + "IFEval": 0.544, + "BBH": 0.55, + "MATH Level 5": 0.1639, + "GPQA": 0.323, + "MUSR": 0.4284, + "MMLU-PRO": 0.4031 + } + }, + { + "model_id": "unsloth/phi-4", + "name": "phi-4", + "developer": "unsloth", + "scores": { + "IFEval": 0.6882, + "BBH": 0.6886, + "MATH Level 5": 0.5, + "GPQA": 0.3364, + "MUSR": 0.4114, + "MMLU-PRO": 0.5378 + } + }, + { + "model_id": "unsloth/phi-4-bnb-4bit", + "name": "phi-4-bnb-4bit", + "developer": "unsloth", + "scores": { + "IFEval": 0.673, + "BBH": 0.677, + "MATH Level 5": 0.4607, + "GPQA": 0.3381, + "MUSR": 0.4007, + "MMLU-PRO": 0.5256 + } + }, + { + "model_id": "unsloth/phi-4-unsloth-bnb-4bit", + "name": "phi-4-unsloth-bnb-4bit", + "developer": "unsloth", + "scores": { + "IFEval": 0.6794, + "BBH": 0.6791, + "MATH Level 5": 0.4562, + "GPQA": 0.3364, + "MUSR": 0.4034, + "MMLU-PRO": 0.5286 + } + }, + { + "model_id": "upstage/SOLAR-10.7B-Instruct-v1.0", + "name": "SOLAR-10.7B-Instruct-v1.0", + "developer": "upstage", + "scores": { + "IFEval": 0.4737, + "BBH": 0.5162, + "MATH Level 5": 0.0566, + "GPQA": 0.3087, + "MUSR": 0.3899, + "MMLU-PRO": 0.3138 + } + }, + { + "model_id": "upstage/SOLAR-10.7B-v1.0", + "name": "SOLAR-10.7B-v1.0", + "developer": "upstage", + "scores": { + "IFEval": 0.2421, + "BBH": 0.5094, + "MATH Level 5": 0.0264, + "GPQA": 0.281, + "MUSR": 0.4372, + "MMLU-PRO": 0.34 + } + }, + { + "model_id": "upstage/solar-pro-preview-instruct", + "name": "solar-pro-preview-instruct", + "developer": "upstage", + "scores": { + "IFEval": 0.8416, + "BBH": 0.6817, + "MATH Level 5": 0.2205, + "GPQA": 0.3708, + "MUSR": 0.4417, + "MMLU-PRO": 0.5273 + } + }, + { + "model_id": "utkmst/chimera-beta-test2-lora-merged", + "name": "chimera-beta-test2-lora-merged", + "developer": "utkmst", + "scores": { + "IFEval": 0.6054, + "BBH": 0.4796, + "MATH Level 5": 0.0952, + "GPQA": 0.3037, + "MUSR": 0.4118, + "MMLU-PRO": 0.2992 + } + }, + { + "model_id": "uukuguy/speechless-code-mistral-7b-v1.0", + "name": "speechless-code-mistral-7b-v1.0", + "developer": "uukuguy", + "scores": { + "IFEval": 0.3665, + "BBH": 0.4572, + "MATH Level 5": 0.0521, + "GPQA": 0.2844, + "MUSR": 0.4502, + "MMLU-PRO": 0.3146 + } + }, + { + "model_id": "uukuguy/speechless-codellama-34b-v2.0", + "name": "speechless-codellama-34b-v2.0", + "developer": "uukuguy", + "scores": { + "IFEval": 0.4604, + "BBH": 0.4813, + "MATH Level 5": 0.0431, + "GPQA": 0.2693, + "MUSR": 0.3787, + "MMLU-PRO": 0.2542 + } + }, + { + "model_id": "uukuguy/speechless-coder-ds-6.7b", + "name": "speechless-coder-ds-6.7b", + "developer": "uukuguy", + "scores": { + "IFEval": 0.2505, + "BBH": 0.4036, + "MATH Level 5": 0.0211, + "GPQA": 0.2643, + "MUSR": 0.3819, + "MMLU-PRO": 0.1719 + } + }, + { + "model_id": "uukuguy/speechless-instruct-mistral-7b-v0.2", + "name": "speechless-instruct-mistral-7b-v0.2", + "developer": "uukuguy", + "scores": { + "IFEval": 0.3261, + "BBH": 0.4607, + "MATH Level 5": 0.0491, + "GPQA": 0.2819, + "MUSR": 0.4902, + "MMLU-PRO": 0.2902 + } + }, + { + "model_id": "uukuguy/speechless-llama2-hermes-orca-platypus-wizardlm-13b", + "name": "speechless-llama2-hermes-orca-platypus-wizardlm-13b", + "developer": "uukuguy", + "scores": { + "IFEval": 0.4562, + "BBH": 0.4846, + "MATH Level 5": 0.0204, + "GPQA": 0.2701, + "MUSR": 0.4655, + "MMLU-PRO": 0.2559 + } + }, + { + "model_id": "uukuguy/speechless-mistral-dolphin-orca-platypus-samantha-7b", + "name": "speechless-mistral-dolphin-orca-platypus-samantha-7b", + "developer": "uukuguy", + "scores": { + "IFEval": 0.37, + "BBH": 0.4983, + "MATH Level 5": 0.0295, + "GPQA": 0.2836, + "MUSR": 0.4361, + "MMLU-PRO": 0.299 + } + }, + { + "model_id": "uukuguy/speechless-zephyr-code-functionary-7b", + "name": "speechless-zephyr-code-functionary-7b", + "developer": "uukuguy", + "scores": { + "IFEval": 0.2696, + "BBH": 0.4664, + "MATH Level 5": 0.0423, + "GPQA": 0.3003, + "MUSR": 0.4268, + "MMLU-PRO": 0.3094 + } + }, + { + "model_id": "v000000/L3-8B-Stheno-v3.2-abliterated", + "name": "L3-8B-Stheno-v3.2-abliterated", + "developer": "v000000", + "scores": { + "IFEval": 0.6718, + "BBH": 0.5141, + "MATH Level 5": 0.0695, + "GPQA": 0.3096, + "MUSR": 0.362, + "MMLU-PRO": 0.3604 + } + }, + { + "model_id": "v000000/L3.1-Niitorm-8B-DPO-t0.0001", + "name": "L3.1-Niitorm-8B-DPO-t0.0001", + "developer": "v000000", + "scores": { + "IFEval": 0.7689, + "BBH": 0.5134, + "MATH Level 5": 0.1624, + "GPQA": 0.2945, + "MUSR": 0.388, + "MMLU-PRO": 0.3866 + } + }, + { + "model_id": "v000000/L3.1-Storniitova-8B", + "name": "L3.1-Storniitova-8B", + "developer": "v000000", + "scores": { + "IFEval": 0.7817, + "BBH": 0.5151, + "MATH Level 5": 0.1465, + "GPQA": 0.2894, + "MUSR": 0.4029, + "MMLU-PRO": 0.3776 + } + }, + { + "model_id": "v000000/Qwen2.5-14B-Gutenberg-1e-Delta", + "name": "Qwen2.5-14B-Gutenberg-1e-Delta", + "developer": "v000000", + "scores": { + "IFEval": 0.8045, + "BBH": 0.6398, + "MATH Level 5": 0.5264, + "GPQA": 0.3289, + "MUSR": 0.4073, + "MMLU-PRO": 0.493 + } + }, + { + "model_id": "v000000/Qwen2.5-14B-Gutenberg-Instruct-Slerpeno", + "name": "Qwen2.5-14B-Gutenberg-Instruct-Slerpeno", + "developer": "v000000", + "scores": { + "IFEval": 0.8197, + "BBH": 0.639, + "MATH Level 5": 0.5325, + "GPQA": 0.3314, + "MUSR": 0.4114, + "MMLU-PRO": 0.4924 + } + }, + { + "model_id": "v000000/Qwen2.5-Lumen-14B", + "name": "Qwen2.5-Lumen-14B", + "developer": "v000000", + "scores": { + "IFEval": 0.8064, + "BBH": 0.6391, + "MATH Level 5": 0.5363, + "GPQA": 0.328, + "MUSR": 0.4114, + "MMLU-PRO": 0.4903 + } + }, + { + "model_id": "vhab10/Llama-3.1-8B-Base-Instruct-SLERP", + "name": "Llama-3.1-8B-Base-Instruct-SLERP", + "developer": "vhab10", + "scores": { + "IFEval": 0.2907, + "BBH": 0.5057, + "MATH Level 5": 0.1201, + "GPQA": 0.2961, + "MUSR": 0.4011, + "MMLU-PRO": 0.3621 + } + }, + { + "model_id": "vhab10/Llama-3.2-Instruct-3B-TIES", + "name": "Llama-3.2-Instruct-3B-TIES", + "developer": "vhab10", + "scores": { + "IFEval": 0.4727, + "BBH": 0.4332, + "MATH Level 5": 0.0982, + "GPQA": 0.2693, + "MUSR": 0.3497, + "MMLU-PRO": 0.2916 + } + }, + { + "model_id": "vhab10/llama-3-8b-merged-linear", + "name": "llama-3-8b-merged-linear", + "developer": "vhab10", + "scores": { + "IFEval": 0.5917, + "BBH": 0.4937, + "MATH Level 5": 0.0816, + "GPQA": 0.2995, + "MUSR": 0.4191, + "MMLU-PRO": 0.3704 + } + }, + { + "model_id": "vicgalle/CarbonBeagle-11B", + "name": "CarbonBeagle-11B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.5415, + "BBH": 0.5294, + "MATH Level 5": 0.0619, + "GPQA": 0.302, + "MUSR": 0.402, + "MMLU-PRO": 0.3276 + } + }, + { + "model_id": "vicgalle/CarbonBeagle-11B-truthy", + "name": "CarbonBeagle-11B-truthy", + "developer": "vicgalle", + "scores": { + "IFEval": 0.5212, + "BBH": 0.5348, + "MATH Level 5": 0.0491, + "GPQA": 0.2995, + "MUSR": 0.374, + "MMLU-PRO": 0.3357 + } + }, + { + "model_id": "vicgalle/Configurable-Hermes-2-Pro-Llama-3-8B", + "name": "Configurable-Hermes-2-Pro-Llama-3-8B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.5763, + "BBH": 0.5055, + "MATH Level 5": 0.0763, + "GPQA": 0.297, + "MUSR": 0.4184, + "MMLU-PRO": 0.3098 + } + }, + { + "model_id": "vicgalle/Configurable-Llama-3.1-8B-Instruct", + "name": "Configurable-Llama-3.1-8B-Instruct", + "developer": "vicgalle", + "scores": { + "IFEval": 0.8312, + "BBH": 0.5045, + "MATH Level 5": 0.173, + "GPQA": 0.2743, + "MUSR": 0.3845, + "MMLU-PRO": 0.3592 + } + }, + { + "model_id": "vicgalle/Configurable-Yi-1.5-9B-Chat", + "name": "Configurable-Yi-1.5-9B-Chat", + "developer": "vicgalle", + "scores": { + "IFEval": 0.4323, + "BBH": 0.5452, + "MATH Level 5": 0.2047, + "GPQA": 0.3431, + "MUSR": 0.4271, + "MMLU-PRO": 0.4015 + } + }, + { + "model_id": "vicgalle/ConfigurableBeagle-11B", + "name": "ConfigurableBeagle-11B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.5834, + "BBH": 0.5287, + "MATH Level 5": 0.0431, + "GPQA": 0.302, + "MUSR": 0.3953, + "MMLU-PRO": 0.3374 + } + }, + { + "model_id": "vicgalle/ConfigurableHermes-7B", + "name": "ConfigurableHermes-7B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.5411, + "BBH": 0.4573, + "MATH Level 5": 0.0476, + "GPQA": 0.2768, + "MUSR": 0.4057, + "MMLU-PRO": 0.3025 + } + }, + { + "model_id": "vicgalle/ConfigurableSOLAR-10.7B", + "name": "ConfigurableSOLAR-10.7B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.51, + "BBH": 0.4867, + "MATH Level 5": 0.0665, + "GPQA": 0.2987, + "MUSR": 0.3805, + "MMLU-PRO": 0.3173 + } + }, + { + "model_id": "vicgalle/Humanish-RP-Llama-3.1-8B", + "name": "Humanish-RP-Llama-3.1-8B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.6669, + "BBH": 0.51, + "MATH Level 5": 0.1518, + "GPQA": 0.2869, + "MUSR": 0.3952, + "MMLU-PRO": 0.3477 + } + }, + { + "model_id": "vicgalle/Merge-Mistral-Prometheus-7B", + "name": "Merge-Mistral-Prometheus-7B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.4848, + "BBH": 0.4201, + "MATH Level 5": 0.0181, + "GPQA": 0.2634, + "MUSR": 0.41, + "MMLU-PRO": 0.2717 + } + }, + { + "model_id": "vicgalle/Merge-Mixtral-Prometheus-8x7B", + "name": "Merge-Mixtral-Prometheus-8x7B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.5744, + "BBH": 0.5351, + "MATH Level 5": 0.0929, + "GPQA": 0.3087, + "MUSR": 0.4098, + "MMLU-PRO": 0.3684 + } + }, + { + "model_id": "vicgalle/Roleplay-Llama-3-8B", + "name": "Roleplay-Llama-3-8B", + "developer": "vicgalle", + "scores": { + "IFEval": 0.732, + "BBH": 0.5012, + "MATH Level 5": 0.0914, + "GPQA": 0.2609, + "MUSR": 0.3529, + "MMLU-PRO": 0.3708 + } + }, + { + "model_id": "viettelsecurity-ai/security-llama3.2-3b", + "name": "security-llama3.2-3b", + "developer": "viettelsecurity-ai", + "scores": { + "IFEval": 0.5909, + "BBH": 0.4401, + "MATH Level 5": 0.1261, + "GPQA": 0.2743, + "MUSR": 0.3379, + "MMLU-PRO": 0.2837 + } + }, + { + "model_id": "vihangd/smart-dan-sft-v0.1", + "name": "smart-dan-sft-v0.1", + "developer": "vihangd", + "scores": { + "IFEval": 0.1576, + "BBH": 0.3062, + "MATH Level 5": 0.0098, + "GPQA": 0.255, + "MUSR": 0.3502, + "MMLU-PRO": 0.1142 + } + }, + { + "model_id": "voidful/smol-360m-ft", + "name": "smol-360m-ft", + "developer": "voidful", + "scores": { + "IFEval": 0.2013, + "BBH": 0.3012, + "MATH Level 5": 0.0083, + "GPQA": 0.2458, + "MUSR": 0.3714, + "MMLU-PRO": 0.1087 + } + }, + { + "model_id": "vonjack/MobileLLM-125M-HF", + "name": "MobileLLM-125M-HF", + "developer": "vonjack", + "scores": { + "IFEval": 0.2107, + "BBH": 0.3027, + "MATH Level 5": 0.0091, + "GPQA": 0.2601, + "MUSR": 0.3782, + "MMLU-PRO": 0.1164 + } + }, + { + "model_id": "vonjack/Phi-3-mini-4k-instruct-LLaMAfied", + "name": "Phi-3-mini-4k-instruct-LLaMAfied", + "developer": "vonjack", + "scores": { + "IFEval": 0.5787, + "BBH": 0.5741, + "MATH Level 5": 0.1382, + "GPQA": 0.3305, + "MUSR": 0.3924, + "MMLU-PRO": 0.3885 + } + }, + { + "model_id": "vonjack/Phi-3.5-mini-instruct-hermes-fc-json", + "name": "Phi-3.5-mini-instruct-hermes-fc-json", + "developer": "vonjack", + "scores": { + "IFEval": 0.1416, + "BBH": 0.2975, + "MATH Level 5": 0.0076, + "GPQA": 0.2542, + "MUSR": 0.4041, + "MMLU-PRO": 0.1139 + } + }, + { + "model_id": "vonjack/Qwen2.5-Coder-0.5B-Merged", + "name": "Qwen2.5-Coder-0.5B-Merged", + "developer": "vonjack", + "scores": { + "IFEval": 0.31, + "BBH": 0.3076, + "MATH Level 5": 0.0378, + "GPQA": 0.2534, + "MUSR": 0.3303, + "MMLU-PRO": 0.1202 + } + }, + { + "model_id": "vonjack/SmolLM2-1.7B-Merged", + "name": "SmolLM2-1.7B-Merged", + "developer": "vonjack", + "scores": { + "IFEval": 0.3698, + "BBH": 0.3587, + "MATH Level 5": 0.0627, + "GPQA": 0.2794, + "MUSR": 0.3408, + "MMLU-PRO": 0.2048 + } + }, + { + "model_id": "vonjack/SmolLM2-135M-Merged", + "name": "SmolLM2-135M-Merged", + "developer": "vonjack", + "scores": { + "IFEval": 0.2483, + "BBH": 0.31, + "MATH Level 5": 0.0113, + "GPQA": 0.2383, + "MUSR": 0.3662, + "MMLU-PRO": 0.1112 + } + }, + { + "model_id": "vonjack/SmolLM2-360M-Merged", + "name": "SmolLM2-360M-Merged", + "developer": "vonjack", + "scores": { + "IFEval": 0.3206, + "BBH": 0.3155, + "MATH Level 5": 0.0174, + "GPQA": 0.2559, + "MUSR": 0.3527, + "MMLU-PRO": 0.1098 + } + }, + { + "model_id": "w4r10ck/SOLAR-10.7B-Instruct-v1.0-uncensored", + "name": "SOLAR-10.7B-Instruct-v1.0-uncensored", + "developer": "w4r10ck", + "scores": { + "IFEval": 0.3884, + "BBH": 0.5302, + "MATH Level 5": 0.0657, + "GPQA": 0.2945, + "MUSR": 0.4639, + "MMLU-PRO": 0.3344 + } + }, + { + "model_id": "wanlige/li-14b-v0.4", + "name": "li-14b-v0.4", + "developer": "wanlige", + "scores": { + "IFEval": 0.8133, + "BBH": 0.6544, + "MATH Level 5": 0.5574, + "GPQA": 0.3389, + "MUSR": 0.446, + "MMLU-PRO": 0.5167 + } + }, + { + "model_id": "wanlige/li-14b-v0.4-slerp", + "name": "li-14b-v0.4-slerp", + "developer": "wanlige", + "scores": { + "IFEval": 0.4606, + "BBH": 0.6587, + "MATH Level 5": 0.4192, + "GPQA": 0.4002, + "MUSR": 0.4768, + "MMLU-PRO": 0.5372 + } + }, + { + "model_id": "wanlige/li-14b-v0.4-slerp0.1", + "name": "li-14b-v0.4-slerp0.1", + "developer": "wanlige", + "scores": { + "IFEval": 0.7923, + "BBH": 0.6572, + "MATH Level 5": 0.5332, + "GPQA": 0.3591, + "MUSR": 0.4207, + "MMLU-PRO": 0.5294 + } + }, + { + "model_id": "wannaphong/KhanomTanLLM-Instruct", + "name": "KhanomTanLLM-Instruct", + "developer": "wannaphong", + "scores": { + "IFEval": 0.1621, + "BBH": 0.3093, + "MATH Level 5": 0.0136, + "GPQA": 0.2634, + "MUSR": 0.3701, + "MMLU-PRO": 0.1119 + } + }, + { + "model_id": "waqasali1707/Beast-Soul-new", + "name": "Beast-Soul-new", + "developer": "waqasali1707", + "scores": { + "IFEval": 0.503, + "BBH": 0.5225, + "MATH Level 5": 0.0702, + "GPQA": 0.2827, + "MUSR": 0.4486, + "MMLU-PRO": 0.3108 + } + }, + { + "model_id": "wave-on-discord/qwent-7b", + "name": "qwent-7b", + "developer": "wave-on-discord", + "scores": { + "IFEval": 0.2015, + "BBH": 0.4228, + "MATH Level 5": 0.0038, + "GPQA": 0.2651, + "MUSR": 0.3817, + "MMLU-PRO": 0.1603 + } + }, + { + "model_id": "weathermanj/Menda-3B-500", + "name": "Menda-3B-500", + "developer": "weathermanj", + "scores": { + "IFEval": 0.6353, + "BBH": 0.4766, + "MATH Level 5": 0.3724, + "GPQA": 0.2878, + "MUSR": 0.3968, + "MMLU-PRO": 0.3475 + } + }, + { + "model_id": "weathermanj/Menda-3b-750", + "name": "Menda-3b-750", + "developer": "weathermanj", + "scores": { + "IFEval": 0.6335, + "BBH": 0.4737, + "MATH Level 5": 0.3716, + "GPQA": 0.2878, + "MUSR": 0.3942, + "MMLU-PRO": 0.3506 + } + }, + { + "model_id": "weathermanj/Menda-3b-Optim-100", + "name": "Menda-3b-Optim-100", + "developer": "weathermanj", + "scores": { + "IFEval": 0.6398, + "BBH": 0.4735, + "MATH Level 5": 0.3716, + "GPQA": 0.2894, + "MUSR": 0.3993, + "MMLU-PRO": 0.3461 + } + }, + { + "model_id": "weathermanj/Menda-3b-Optim-200", + "name": "Menda-3b-Optim-200", + "developer": "weathermanj", + "scores": { + "IFEval": 0.6375, + "BBH": 0.4746, + "MATH Level 5": 0.3731, + "GPQA": 0.2827, + "MUSR": 0.4033, + "MMLU-PRO": 0.3484 + } + }, + { + "model_id": "win10/ArliAI-RPMax-v1.3-merge-13.3B", + "name": "ArliAI-RPMax-v1.3-merge-13.3B", + "developer": "win10", + "scores": { + "IFEval": 0.3038, + "BBH": 0.4581, + "MATH Level 5": 0.0393, + "GPQA": 0.2743, + "MUSR": 0.4325, + "MMLU-PRO": 0.32 + } + }, + { + "model_id": "win10/Breeze-13B-32k-Instruct-v1_0", + "name": "Breeze-13B-32k-Instruct-v1_0", + "developer": "win10", + "scores": { + "IFEval": 0.3584, + "BBH": 0.4611, + "MATH Level 5": 0.0128, + "GPQA": 0.2643, + "MUSR": 0.4202, + "MMLU-PRO": 0.2568 + } + }, + { + "model_id": "win10/EVA-Norns-Qwen2.5-v0.1", + "name": "EVA-Norns-Qwen2.5-v0.1", + "developer": "win10", + "scores": { + "IFEval": 0.622, + "BBH": 0.5072, + "MATH Level 5": 0.2613, + "GPQA": 0.2852, + "MUSR": 0.4045, + "MMLU-PRO": 0.3425 + } + }, + { + "model_id": "win10/Llama-3.2-3B-Instruct-24-9-29", + "name": "Llama-3.2-3B-Instruct-24-9-29", + "developer": "win10", + "scores": { + "IFEval": 0.7332, + "BBH": 0.4614, + "MATH Level 5": 0.1707, + "GPQA": 0.2743, + "MUSR": 0.3555, + "MMLU-PRO": 0.3228 + } + }, + { + "model_id": "win10/Norns-Qwen2.5-12B", + "name": "Norns-Qwen2.5-12B", + "developer": "win10", + "scores": { + "IFEval": 0.4897, + "BBH": 0.4619, + "MATH Level 5": 0.0838, + "GPQA": 0.2836, + "MUSR": 0.3555, + "MMLU-PRO": 0.266 + } + }, + { + "model_id": "win10/Norns-Qwen2.5-7B", + "name": "Norns-Qwen2.5-7B", + "developer": "win10", + "scores": { + "IFEval": 0.6122, + "BBH": 0.5073, + "MATH Level 5": 0.2628, + "GPQA": 0.2844, + "MUSR": 0.4085, + "MMLU-PRO": 0.3413 + } + }, + { + "model_id": "win10/Qwen2.5-2B-Instruct", + "name": "Qwen2.5-2B-Instruct", + "developer": "win10", + "scores": { + "IFEval": 0.2273, + "BBH": 0.3706, + "MATH Level 5": 0.0227, + "GPQA": 0.2676, + "MUSR": 0.4378, + "MMLU-PRO": 0.1934 + } + }, + { + "model_id": "win10/llama3-13.45b-Instruct", + "name": "llama3-13.45b-Instruct", + "developer": "win10", + "scores": { + "IFEval": 0.4144, + "BBH": 0.4865, + "MATH Level 5": 0.0242, + "GPQA": 0.2584, + "MUSR": 0.3848, + "MMLU-PRO": 0.3345 + } + }, + { + "model_id": "win10/miscii-14b-1M-0128", + "name": "miscii-14b-1M-0128", + "developer": "win10", + "scores": { + "IFEval": 0.4181, + "BBH": 0.5742, + "MATH Level 5": 0.4773, + "GPQA": 0.3826, + "MUSR": 0.5431, + "MMLU-PRO": 0.4491 + } + }, + { + "model_id": "winglian/Llama-3-8b-64k-PoSE", + "name": "Llama-3-8b-64k-PoSE", + "developer": "winglian", + "scores": { + "IFEval": 0.2857, + "BBH": 0.3702, + "MATH Level 5": 0.0415, + "GPQA": 0.2609, + "MUSR": 0.3396, + "MMLU-PRO": 0.2467 + } + }, + { + "model_id": "winglian/llama-3-8b-256k-PoSE", + "name": "llama-3-8b-256k-PoSE", + "developer": "winglian", + "scores": { + "IFEval": 0.2909, + "BBH": 0.3157, + "MATH Level 5": 0.0196, + "GPQA": 0.2576, + "MUSR": 0.3316, + "MMLU-PRO": 0.1116 + } + }, + { + "model_id": "wzhouad/gemma-2-9b-it-WPO-HB", + "name": "gemma-2-9b-it-WPO-HB", + "developer": "wzhouad", + "scores": { + "IFEval": 0.5437, + "BBH": 0.5629, + "MATH Level 5": 0.1533, + "GPQA": 0.3498, + "MUSR": 0.3675, + "MMLU-PRO": 0.336 + } + }, + { + "model_id": "x0000001/Deepseek-Lumen-R1-Qwen2.5-14B", + "name": "Deepseek-Lumen-R1-Qwen2.5-14B", + "developer": "x0000001", + "scores": { + "IFEval": 0.4436, + "BBH": 0.4569, + "MATH Level 5": 0.2779, + "GPQA": 0.2852, + "MUSR": 0.474, + "MMLU-PRO": 0.4379 + } + }, + { + "model_id": "xMaulana/FinMatcha-3B-Instruct", + "name": "FinMatcha-3B-Instruct", + "developer": "xMaulana", + "scores": { + "IFEval": 0.7548, + "BBH": 0.4536, + "MATH Level 5": 0.1435, + "GPQA": 0.2693, + "MUSR": 0.3633, + "MMLU-PRO": 0.3182 + } + }, + { + "model_id": "xinchen9/Llama3.1_8B_Instruct_CoT", + "name": "Llama3.1_8B_Instruct_CoT", + "developer": "xinchen9", + "scores": { + "IFEval": 0.2974, + "BBH": 0.4398, + "MATH Level 5": 0.0604, + "GPQA": 0.302, + "MUSR": 0.4371, + "MMLU-PRO": 0.2879 + } + }, + { + "model_id": "xinchen9/Llama3.1_CoT", + "name": "Llama3.1_CoT", + "developer": "xinchen9", + "scores": { + "IFEval": 0.2246, + "BBH": 0.4341, + "MATH Level 5": 0.0385, + "GPQA": 0.2886, + "MUSR": 0.4305, + "MMLU-PRO": 0.2739 + } + }, + { + "model_id": "xinchen9/Llama3.1_CoT_V1", + "name": "Llama3.1_CoT_V1", + "developer": "xinchen9", + "scores": { + "IFEval": 0.2453, + "BBH": 0.4376, + "MATH Level 5": 0.0332, + "GPQA": 0.2794, + "MUSR": 0.4572, + "MMLU-PRO": 0.2805 + } + }, + { + "model_id": "xinchen9/Mistral-7B-CoT", + "name": "Mistral-7B-CoT", + "developer": "xinchen9", + "scores": { + "IFEval": 0.2783, + "BBH": 0.3873, + "MATH Level 5": 0.0249, + "GPQA": 0.2492, + "MUSR": 0.3994, + "MMLU-PRO": 0.2284 + } + }, + { + "model_id": "xinchen9/llama3-b8-ft-dis", + "name": "llama3-b8-ft-dis", + "developer": "xinchen9", + "scores": { + "IFEval": 0.1546, + "BBH": 0.4626, + "MATH Level 5": 0.0393, + "GPQA": 0.3129, + "MUSR": 0.3654, + "MMLU-PRO": 0.3244 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-Iter2_bt_2b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter2_bt_2b-table", + "developer": "xkp24", + "scores": { + "IFEval": 0.6375, + "BBH": 0.4912, + "MATH Level 5": 0.0921, + "GPQA": 0.2592, + "MUSR": 0.382, + "MMLU-PRO": 0.3686 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-Iter2_bt_8b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter2_bt_8b-table", + "developer": "xkp24", + "scores": { + "IFEval": 0.7275, + "BBH": 0.5057, + "MATH Level 5": 0.0846, + "GPQA": 0.2601, + "MUSR": 0.3819, + "MMLU-PRO": 0.3697 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-Iter2_gp_2b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter2_gp_2b-table", + "developer": "xkp24", + "scores": { + "IFEval": 0.6569, + "BBH": 0.4952, + "MATH Level 5": 0.0891, + "GPQA": 0.2592, + "MUSR": 0.3594, + "MMLU-PRO": 0.3702 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-Iter2_gp_8b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter2_gp_8b-table", + "developer": "xkp24", + "scores": { + "IFEval": 0.6621, + "BBH": 0.5004, + "MATH Level 5": 0.0861, + "GPQA": 0.2592, + "MUSR": 0.3805, + "MMLU-PRO": 0.36 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-score-Iter2_bt_2b-table-0.001", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter2_bt_2b-table-0.001", + "developer": "xkp24", + "scores": { + "IFEval": 0.6042, + "BBH": 0.4936, + "MATH Level 5": 0.0997, + "GPQA": 0.2592, + "MUSR": 0.3793, + "MMLU-PRO": 0.3708 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-score-Iter2_bt_8b-table-0.002", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter2_bt_8b-table-0.002", + "developer": "xkp24", + "scores": { + "IFEval": 0.7132, + "BBH": 0.4996, + "MATH Level 5": 0.0853, + "GPQA": 0.2584, + "MUSR": 0.3872, + "MMLU-PRO": 0.3664 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-score-Iter2_gp_2b-table-0.001", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter2_gp_2b-table-0.001", + "developer": "xkp24", + "scores": { + "IFEval": 0.5947, + "BBH": 0.4899, + "MATH Level 5": 0.1073, + "GPQA": 0.2592, + "MUSR": 0.3581, + "MMLU-PRO": 0.3704 + } + }, + { + "model_id": "xkp24/Llama-3-8B-Instruct-SPPO-score-Iter2_gp_8b-table-0.002", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter2_gp_8b-table-0.002", + "developer": "xkp24", + "scores": { + "IFEval": 0.6453, + "BBH": 0.4951, + "MATH Level 5": 0.0937, + "GPQA": 0.2601, + "MUSR": 0.3939, + "MMLU-PRO": 0.353 + } + }, + { + "model_id": "xukp20/Llama-3-8B-Instruct-SPPO-Iter3_bt_2b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter3_bt_2b-table", + "developer": "xukp20", + "scores": { + "IFEval": 0.5756, + "BBH": 0.4901, + "MATH Level 5": 0.0997, + "GPQA": 0.2592, + "MUSR": 0.366, + "MMLU-PRO": 0.3659 + } + }, + { + "model_id": "xukp20/Llama-3-8B-Instruct-SPPO-Iter3_bt_8b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter3_bt_8b-table", + "developer": "xukp20", + "scores": { + "IFEval": 0.7034, + "BBH": 0.5092, + "MATH Level 5": 0.0967, + "GPQA": 0.2592, + "MUSR": 0.3739, + "MMLU-PRO": 0.3693 + } + }, + { + "model_id": "xukp20/Llama-3-8B-Instruct-SPPO-Iter3_gp_2b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter3_gp_2b-table", + "developer": "xukp20", + "scores": { + "IFEval": 0.6024, + "BBH": 0.497, + "MATH Level 5": 0.1042, + "GPQA": 0.2592, + "MUSR": 0.3674, + "MMLU-PRO": 0.3658 + } + }, + { + "model_id": "xukp20/Llama-3-8B-Instruct-SPPO-Iter3_gp_8b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter3_gp_8b-table", + "developer": "xukp20", + "scores": { + "IFEval": 0.662, + "BBH": 0.5, + "MATH Level 5": 0.0937, + "GPQA": 0.2592, + "MUSR": 0.3818, + "MMLU-PRO": 0.3615 + } + }, + { + "model_id": "xukp20/Llama-3-8B-Instruct-SPPO-score-Iter3_bt_2b-table-0.001", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter3_bt_2b-table-0.001", + "developer": "xukp20", + "scores": { + "IFEval": 0.5336, + "BBH": 0.4915, + "MATH Level 5": 0.0982, + "GPQA": 0.2592, + "MUSR": 0.378, + "MMLU-PRO": 0.3625 + } + }, + { + "model_id": "xukp20/Llama-3-8B-Instruct-SPPO-score-Iter3_bt_8b-table-0.002", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter3_bt_8b-table-0.002", + "developer": "xukp20", + "scores": { + "IFEval": 0.6852, + "BBH": 0.5075, + "MATH Level 5": 0.0718, + "GPQA": 0.2584, + "MUSR": 0.3832, + "MMLU-PRO": 0.3621 + } + }, + { + "model_id": "xukp20/Llama-3-8B-Instruct-SPPO-score-Iter3_gp_2b-table-0.001", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter3_gp_2b-table-0.001", + "developer": "xukp20", + "scores": { + "IFEval": 0.5482, + "BBH": 0.4887, + "MATH Level 5": 0.0891, + "GPQA": 0.2609, + "MUSR": 0.3633, + "MMLU-PRO": 0.3671 + } + }, + { + "model_id": "xukp20/llama-3-8b-instruct-sppo-iter1-gp-2b-tau01-table", + "name": "llama-3-8b-instruct-sppo-iter1-gp-2b-tau01-table", + "developer": "xukp20", + "scores": { + "IFEval": 0.69, + "BBH": 0.4978, + "MATH Level 5": 0.105, + "GPQA": 0.2592, + "MUSR": 0.3673, + "MMLU-PRO": 0.3716 + } + }, + { + "model_id": "xwen-team/Xwen-7B-Chat", + "name": "Xwen-7B-Chat", + "developer": "xwen-team", + "scores": { + "IFEval": 0.6864, + "BBH": 0.5068, + "MATH Level 5": 0.4509, + "GPQA": 0.2609, + "MUSR": 0.3914, + "MMLU-PRO": 0.429 + } + }, + { + "model_id": "xxx777xxxASD/L3.1-ClaudeMaid-4x8B", + "name": "L3.1-ClaudeMaid-4x8B", + "developer": "xxx777xxxASD", + "scores": { + "IFEval": 0.6696, + "BBH": 0.5071, + "MATH Level 5": 0.1412, + "GPQA": 0.2911, + "MUSR": 0.4289, + "MMLU-PRO": 0.358 + } + }, + { + "model_id": "yam-peleg/Hebrew-Gemma-11B-Instruct", + "name": "Hebrew-Gemma-11B-Instruct", + "developer": "yam-peleg", + "scores": { + "IFEval": 0.3021, + "BBH": 0.4036, + "MATH Level 5": 0.0657, + "GPQA": 0.276, + "MUSR": 0.4089, + "MMLU-PRO": 0.2554 + } + }, + { + "model_id": "yam-peleg/Hebrew-Mistral-7B", + "name": "Hebrew-Mistral-7B", + "developer": "yam-peleg", + "scores": { + "IFEval": 0.2328, + "BBH": 0.4334, + "MATH Level 5": 0.0498, + "GPQA": 0.2794, + "MUSR": 0.3977, + "MMLU-PRO": 0.278 + } + }, + { + "model_id": "yam-peleg/Hebrew-Mistral-7B-200K", + "name": "Hebrew-Mistral-7B-200K", + "developer": "yam-peleg", + "scores": { + "IFEval": 0.177, + "BBH": 0.3411, + "MATH Level 5": 0.031, + "GPQA": 0.2534, + "MUSR": 0.374, + "MMLU-PRO": 0.2529 + } + }, + { + "model_id": "yanng1242/Marcoro14-7B-slerp", + "name": "Marcoro14-7B-slerp", + "developer": "yanng1242", + "scores": { + "IFEval": 0.406, + "BBH": 0.5252, + "MATH Level 5": 0.0748, + "GPQA": 0.3146, + "MUSR": 0.4686, + "MMLU-PRO": 0.3168 + } + }, + { + "model_id": "yasserrmd/Coder-GRPO-3B", + "name": "Coder-GRPO-3B", + "developer": "yasserrmd", + "scores": { + "IFEval": 0.6208, + "BBH": 0.4469, + "MATH Level 5": 0.3202, + "GPQA": 0.2777, + "MUSR": 0.4115, + "MMLU-PRO": 0.3197 + } + }, + { + "model_id": "yasserrmd/Text2SQL-1.5B", + "name": "Text2SQL-1.5B", + "developer": "yasserrmd", + "scores": { + "IFEval": 0.2857, + "BBH": 0.3858, + "MATH Level 5": 0.068, + "GPQA": 0.2878, + "MUSR": 0.3942, + "MMLU-PRO": 0.2363 + } + }, + { + "model_id": "ycros/BagelMIsteryTour-v2-8x7B", + "name": "BagelMIsteryTour-v2-8x7B", + "developer": "ycros", + "scores": { + "IFEval": 0.6262, + "BBH": 0.5142, + "MATH Level 5": 0.0937, + "GPQA": 0.3079, + "MUSR": 0.4138, + "MMLU-PRO": 0.3481 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-Iter1_bt_2b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter1_bt_2b-table", + "developer": "yfzp", + "scores": { + "IFEval": 0.6709, + "BBH": 0.4987, + "MATH Level 5": 0.1118, + "GPQA": 0.2592, + "MUSR": 0.3727, + "MMLU-PRO": 0.3716 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-Iter1_bt_8b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter1_bt_8b-table", + "developer": "yfzp", + "scores": { + "IFEval": 0.7333, + "BBH": 0.508, + "MATH Level 5": 0.1035, + "GPQA": 0.2601, + "MUSR": 0.3806, + "MMLU-PRO": 0.3748 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-Iter1_gp_2b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter1_gp_2b-table", + "developer": "yfzp", + "scores": { + "IFEval": 0.6785, + "BBH": 0.4941, + "MATH Level 5": 0.1125, + "GPQA": 0.2592, + "MUSR": 0.3647, + "MMLU-PRO": 0.3718 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-Iter1_gp_8b-table", + "name": "Llama-3-8B-Instruct-SPPO-Iter1_gp_8b-table", + "developer": "yfzp", + "scores": { + "IFEval": 0.7132, + "BBH": 0.5025, + "MATH Level 5": 0.0989, + "GPQA": 0.2592, + "MUSR": 0.3713, + "MMLU-PRO": 0.3683 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-score-Iter1_bt_2b-table-0.001", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter1_bt_2b-table-0.001", + "developer": "yfzp", + "scores": { + "IFEval": 0.6496, + "BBH": 0.4979, + "MATH Level 5": 0.1012, + "GPQA": 0.2592, + "MUSR": 0.378, + "MMLU-PRO": 0.372 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-score-Iter1_bt_8b-table-0.002", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter1_bt_8b-table-0.002", + "developer": "yfzp", + "scores": { + "IFEval": 0.7196, + "BBH": 0.5045, + "MATH Level 5": 0.0876, + "GPQA": 0.2601, + "MUSR": 0.3831, + "MMLU-PRO": 0.3734 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-score-Iter1_gp_2b-table-0.001", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter1_gp_2b-table-0.001", + "developer": "yfzp", + "scores": { + "IFEval": 0.6504, + "BBH": 0.4958, + "MATH Level 5": 0.0937, + "GPQA": 0.2592, + "MUSR": 0.366, + "MMLU-PRO": 0.3703 + } + }, + { + "model_id": "yfzp/Llama-3-8B-Instruct-SPPO-score-Iter1_gp_8b-table-0.002", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter1_gp_8b-table-0.002", + "developer": "yfzp", + "scores": { + "IFEval": 0.7016, + "BBH": 0.4992, + "MATH Level 5": 0.0869, + "GPQA": 0.2592, + "MUSR": 0.3779, + "MMLU-PRO": 0.3669 + } + }, + { + "model_id": "yifAI/Llama-3-8B-Instruct-SPPO-score-Iter3_gp_8b-table-0.002", + "name": "Llama-3-8B-Instruct-SPPO-score-Iter3_gp_8b-table-0.002", + "developer": "yifAI", + "scores": { + "IFEval": 0.649, + "BBH": 0.4915, + "MATH Level 5": 0.0755, + "GPQA": 0.2617, + "MUSR": 0.3899, + "MMLU-PRO": 0.352 + } + }, + { + "model_id": "ylalain/ECE-PRYMMAL-YL-1B-SLERP-V8", + "name": "ECE-PRYMMAL-YL-1B-SLERP-V8", + "developer": "ylalain", + "scores": { + "IFEval": 0.1505, + "BBH": 0.3976, + "MATH Level 5": 0.0045, + "GPQA": 0.2894, + "MUSR": 0.3875, + "MMLU-PRO": 0.2384 + } + }, + { + "model_id": "ymcki/Llama-3.1-8B-GRPO-Instruct", + "name": "Llama-3.1-8B-GRPO-Instruct", + "developer": "ymcki", + "scores": { + "IFEval": 0.7445, + "BBH": 0.5132, + "MATH Level 5": 0.2024, + "GPQA": 0.2945, + "MUSR": 0.3817, + "MMLU-PRO": 0.3738 + } + }, + { + "model_id": "ymcki/Llama-3.1-8B-SFT-GRPO-Instruct", + "name": "Llama-3.1-8B-SFT-GRPO-Instruct", + "developer": "ymcki", + "scores": { + "IFEval": 0.3354, + "BBH": 0.3126, + "MATH Level 5": 0.04, + "GPQA": 0.2534, + "MUSR": 0.3526, + "MMLU-PRO": 0.1098 + } + }, + { + "model_id": "ymcki/gemma-2-2b-ORPO-jpn-it-abliterated-18", + "name": "gemma-2-2b-ORPO-jpn-it-abliterated-18", + "developer": "ymcki", + "scores": { + "IFEval": 0.4631, + "BBH": 0.4053, + "MATH Level 5": 0.0431, + "GPQA": 0.2886, + "MUSR": 0.3754, + "MMLU-PRO": 0.2345 + } + }, + { + "model_id": "ymcki/gemma-2-2b-ORPO-jpn-it-abliterated-18-merge", + "name": "gemma-2-2b-ORPO-jpn-it-abliterated-18-merge", + "developer": "ymcki", + "scores": { + "IFEval": 0.5218, + "BBH": 0.4147, + "MATH Level 5": 0.0544, + "GPQA": 0.2836, + "MUSR": 0.3514, + "MMLU-PRO": 0.2461 + } + }, + { + "model_id": "ymcki/gemma-2-2b-jpn-it-abliterated-17", + "name": "gemma-2-2b-jpn-it-abliterated-17", + "developer": "ymcki", + "scores": { + "IFEval": 0.5082, + "BBH": 0.4076, + "MATH Level 5": 0.0385, + "GPQA": 0.2718, + "MUSR": 0.3701, + "MMLU-PRO": 0.2455 + } + }, + { + "model_id": "ymcki/gemma-2-2b-jpn-it-abliterated-17-18-24", + "name": "gemma-2-2b-jpn-it-abliterated-17-18-24", + "developer": "ymcki", + "scores": { + "IFEval": 0.5055, + "BBH": 0.3812, + "MATH Level 5": 0.0257, + "GPQA": 0.281, + "MUSR": 0.3502, + "MMLU-PRO": 0.2282 + } + }, + { + "model_id": "ymcki/gemma-2-2b-jpn-it-abliterated-17-ORPO", + "name": "gemma-2-2b-jpn-it-abliterated-17-ORPO", + "developer": "ymcki", + "scores": { + "IFEval": 0.4748, + "BBH": 0.3898, + "MATH Level 5": 0.0619, + "GPQA": 0.2743, + "MUSR": 0.3768, + "MMLU-PRO": 0.2191 + } + }, + { + "model_id": "ymcki/gemma-2-2b-jpn-it-abliterated-17-ORPO-alpaca", + "name": "gemma-2-2b-jpn-it-abliterated-17-ORPO-alpaca", + "developer": "ymcki", + "scores": { + "IFEval": 0.3065, + "BBH": 0.4072, + "MATH Level 5": 0.0325, + "GPQA": 0.2693, + "MUSR": 0.3969, + "MMLU-PRO": 0.2249 + } + }, + { + "model_id": "ymcki/gemma-2-2b-jpn-it-abliterated-18", + "name": "gemma-2-2b-jpn-it-abliterated-18", + "developer": "ymcki", + "scores": { + "IFEval": 0.5175, + "BBH": 0.4132, + "MATH Level 5": 0.0446, + "GPQA": 0.2735, + "MUSR": 0.3742, + "MMLU-PRO": 0.2505 + } + }, + { + "model_id": "ymcki/gemma-2-2b-jpn-it-abliterated-18-ORPO", + "name": "gemma-2-2b-jpn-it-abliterated-18-ORPO", + "developer": "ymcki", + "scores": { + "IFEval": 0.4742, + "BBH": 0.4039, + "MATH Level 5": 0.0468, + "GPQA": 0.2617, + "MUSR": 0.3953, + "MMLU-PRO": 0.2185 + } + }, + { + "model_id": "ymcki/gemma-2-2b-jpn-it-abliterated-24", + "name": "gemma-2-2b-jpn-it-abliterated-24", + "developer": "ymcki", + "scores": { + "IFEval": 0.4979, + "BBH": 0.411, + "MATH Level 5": 0.0438, + "GPQA": 0.2777, + "MUSR": 0.3915, + "MMLU-PRO": 0.2473 + } + }, + { + "model_id": "yuchenxie/ArlowGPT-3B-Multilingual", + "name": "ArlowGPT-3B-Multilingual", + "developer": "yuchenxie", + "scores": { + "IFEval": 0.6395, + "BBH": 0.4301, + "MATH Level 5": 0.1125, + "GPQA": 0.2802, + "MUSR": 0.3727, + "MMLU-PRO": 0.2817 + } + }, + { + "model_id": "yuchenxie/ArlowGPT-8B", + "name": "ArlowGPT-8B", + "developer": "yuchenxie", + "scores": { + "IFEval": 0.7847, + "BBH": 0.508, + "MATH Level 5": 0.2039, + "GPQA": 0.2936, + "MUSR": 0.3882, + "MMLU-PRO": 0.3787 + } + }, + { + "model_id": "yuvraj17/Llama3-8B-SuperNova-Spectrum-Hermes-DPO", + "name": "Llama3-8B-SuperNova-Spectrum-Hermes-DPO", + "developer": "yuvraj17", + "scores": { + "IFEval": 0.4691, + "BBH": 0.44, + "MATH Level 5": 0.0566, + "GPQA": 0.302, + "MUSR": 0.4012, + "MMLU-PRO": 0.2635 + } + }, + { + "model_id": "yuvraj17/Llama3-8B-SuperNova-Spectrum-dare_ties", + "name": "Llama3-8B-SuperNova-Spectrum-dare_ties", + "developer": "yuvraj17", + "scores": { + "IFEval": 0.4013, + "BBH": 0.4616, + "MATH Level 5": 0.0846, + "GPQA": 0.2752, + "MUSR": 0.4211, + "MMLU-PRO": 0.3574 + } + }, + { + "model_id": "yuvraj17/Llama3-8B-abliterated-Spectrum-slerp", + "name": "Llama3-8B-abliterated-Spectrum-slerp", + "developer": "yuvraj17", + "scores": { + "IFEval": 0.2885, + "BBH": 0.4978, + "MATH Level 5": 0.0604, + "GPQA": 0.3012, + "MUSR": 0.3998, + "MMLU-PRO": 0.3257 + } + }, + { + "model_id": "zake7749/gemma-2-2b-it-chinese-kyara-dpo", + "name": "gemma-2-2b-it-chinese-kyara-dpo", + "developer": "zake7749", + "scores": { + "IFEval": 0.5382, + "BBH": 0.4257, + "MATH Level 5": 0.0838, + "GPQA": 0.2668, + "MUSR": 0.4576, + "MMLU-PRO": 0.2573 + } + }, + { + "model_id": "zake7749/gemma-2-9b-it-chinese-kyara", + "name": "gemma-2-9b-it-chinese-kyara", + "developer": "zake7749", + "scores": { + "IFEval": 0.1764, + "BBH": 0.5954, + "MATH Level 5": 0.105, + "GPQA": 0.3381, + "MUSR": 0.4242, + "MMLU-PRO": 0.4179 + } + }, + { + "model_id": "zelk12/Gemma-2-TM-9B", + "name": "Gemma-2-TM-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.8045, + "BBH": 0.5987, + "MATH Level 5": 0.2024, + "GPQA": 0.3465, + "MUSR": 0.4152, + "MMLU-PRO": 0.4088 + } + }, + { + "model_id": "zelk12/MT-Gen1-gemma-2-9B", + "name": "MT-Gen1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7886, + "BBH": 0.61, + "MATH Level 5": 0.2221, + "GPQA": 0.3465, + "MUSR": 0.4217, + "MMLU-PRO": 0.4381 + } + }, + { + "model_id": "zelk12/MT-Gen2-GI-gemma-2-9B", + "name": "MT-Gen2-GI-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7914, + "BBH": 0.6096, + "MATH Level 5": 0.2205, + "GPQA": 0.3507, + "MUSR": 0.4283, + "MMLU-PRO": 0.4356 + } + }, + { + "model_id": "zelk12/MT-Gen2-gemma-2-9B", + "name": "MT-Gen2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7907, + "BBH": 0.61, + "MATH Level 5": 0.219, + "GPQA": 0.3465, + "MUSR": 0.4323, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "zelk12/MT-Gen3-gemma-2-9B", + "name": "MT-Gen3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.802, + "BBH": 0.6097, + "MATH Level 5": 0.2296, + "GPQA": 0.349, + "MUSR": 0.4217, + "MMLU-PRO": 0.4356 + } + }, + { + "model_id": "zelk12/MT-Gen4-gemma-2-9B", + "name": "MT-Gen4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7883, + "BBH": 0.611, + "MATH Level 5": 0.2236, + "GPQA": 0.3549, + "MUSR": 0.4228, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "zelk12/MT-Gen5-gemma-2-9B", + "name": "MT-Gen5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7923, + "BBH": 0.6133, + "MATH Level 5": 0.2153, + "GPQA": 0.3515, + "MUSR": 0.4202, + "MMLU-PRO": 0.4402 + } + }, + { + "model_id": "zelk12/MT-Gen6-gemma-2-9B", + "name": "MT-Gen6-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1616, + "BBH": 0.5845, + "MATH Level 5": 0.0823, + "GPQA": 0.3331, + "MUSR": 0.4069, + "MMLU-PRO": 0.4166 + } + }, + { + "model_id": "zelk12/MT-Gen6fix-gemma-2-9B", + "name": "MT-Gen6fix-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1576, + "BBH": 0.5917, + "MATH Level 5": 0.0816, + "GPQA": 0.3372, + "MUSR": 0.4084, + "MMLU-PRO": 0.412 + } + }, + { + "model_id": "zelk12/MT-Gen7-gemma-2-9B", + "name": "MT-Gen7-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1664, + "BBH": 0.5935, + "MATH Level 5": 0.0891, + "GPQA": 0.3356, + "MUSR": 0.4098, + "MMLU-PRO": 0.4122 + } + }, + { + "model_id": "zelk12/MT-Max-Merge_02012025163610-gemma-2-9B", + "name": "MT-Max-Merge_02012025163610-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7907, + "BBH": 0.6142, + "MATH Level 5": 0.2213, + "GPQA": 0.3515, + "MUSR": 0.4228, + "MMLU-PRO": 0.4396 + } + }, + { + "model_id": "zelk12/MT-Merge-gemma-2-9B", + "name": "MT-Merge-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.8035, + "BBH": 0.6118, + "MATH Level 5": 0.2205, + "GPQA": 0.3482, + "MUSR": 0.4256, + "MMLU-PRO": 0.4362 + } + }, + { + "model_id": "zelk12/MT-Merge1-gemma-2-9B", + "name": "MT-Merge1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7901, + "BBH": 0.61, + "MATH Level 5": 0.2289, + "GPQA": 0.3515, + "MUSR": 0.4244, + "MMLU-PRO": 0.4374 + } + }, + { + "model_id": "zelk12/MT-Merge2-MU-gemma-2-MTg2MT1g2-9B", + "name": "MT-Merge2-MU-gemma-2-MTg2MT1g2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7956, + "BBH": 0.6084, + "MATH Level 5": 0.2183, + "GPQA": 0.3507, + "MUSR": 0.4322, + "MMLU-PRO": 0.4373 + } + }, + { + "model_id": "zelk12/MT-Merge2-gemma-2-9B", + "name": "MT-Merge2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7877, + "BBH": 0.6107, + "MATH Level 5": 0.2349, + "GPQA": 0.3507, + "MUSR": 0.4217, + "MMLU-PRO": 0.4382 + } + }, + { + "model_id": "zelk12/MT-Merge3-gemma-2-9B", + "name": "MT-Merge3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7859, + "BBH": 0.6102, + "MATH Level 5": 0.2205, + "GPQA": 0.349, + "MUSR": 0.4258, + "MMLU-PRO": 0.4373 + } + }, + { + "model_id": "zelk12/MT-Merge4-gemma-2-9B", + "name": "MT-Merge4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7807, + "BBH": 0.6118, + "MATH Level 5": 0.2168, + "GPQA": 0.3523, + "MUSR": 0.4294, + "MMLU-PRO": 0.439 + } + }, + { + "model_id": "zelk12/MT-Merge5-gemma-2-9B", + "name": "MT-Merge5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7844, + "BBH": 0.6123, + "MATH Level 5": 0.2183, + "GPQA": 0.3532, + "MUSR": 0.4281, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "zelk12/MT-Merge6-gemma-2-9B", + "name": "MT-Merge6-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1695, + "BBH": 0.5949, + "MATH Level 5": 0.0801, + "GPQA": 0.3289, + "MUSR": 0.4098, + "MMLU-PRO": 0.4115 + } + }, + { + "model_id": "zelk12/MT-gemma-2-9B", + "name": "MT-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7968, + "BBH": 0.6064, + "MATH Level 5": 0.2054, + "GPQA": 0.3456, + "MUSR": 0.4071, + "MMLU-PRO": 0.4224 + } + }, + { + "model_id": "zelk12/MT1-Gen1-gemma-2-9B", + "name": "MT1-Gen1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7974, + "BBH": 0.6118, + "MATH Level 5": 0.2243, + "GPQA": 0.344, + "MUSR": 0.431, + "MMLU-PRO": 0.4376 + } + }, + { + "model_id": "zelk12/MT1-Gen2-gemma-2-9B", + "name": "MT1-Gen2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7984, + "BBH": 0.6096, + "MATH Level 5": 0.2251, + "GPQA": 0.3523, + "MUSR": 0.4284, + "MMLU-PRO": 0.4355 + } + }, + { + "model_id": "zelk12/MT1-Gen3-gemma-2-9B", + "name": "MT1-Gen3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.796, + "BBH": 0.6102, + "MATH Level 5": 0.2243, + "GPQA": 0.349, + "MUSR": 0.4243, + "MMLU-PRO": 0.4349 + } + }, + { + "model_id": "zelk12/MT1-Gen4-gemma-2-9B", + "name": "MT1-Gen4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7941, + "BBH": 0.6058, + "MATH Level 5": 0.216, + "GPQA": 0.3473, + "MUSR": 0.4231, + "MMLU-PRO": 0.4286 + } + }, + { + "model_id": "zelk12/MT1-Gen5-IF-gemma-2-S2DMv1-9B", + "name": "MT1-Gen5-IF-gemma-2-S2DMv1-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7929, + "BBH": 0.6, + "MATH Level 5": 0.2032, + "GPQA": 0.344, + "MUSR": 0.4245, + "MMLU-PRO": 0.4218 + } + }, + { + "model_id": "zelk12/MT1-Gen5-gemma-2-9B", + "name": "MT1-Gen5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7795, + "BBH": 0.6017, + "MATH Level 5": 0.2077, + "GPQA": 0.3465, + "MUSR": 0.4191, + "MMLU-PRO": 0.4222 + } + }, + { + "model_id": "zelk12/MT1-Gen6-gemma-2-9B", + "name": "MT1-Gen6-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1634, + "BBH": 0.5944, + "MATH Level 5": 0.0808, + "GPQA": 0.328, + "MUSR": 0.4044, + "MMLU-PRO": 0.4133 + } + }, + { + "model_id": "zelk12/MT1-Gen7-gemma-2-9B", + "name": "MT1-Gen7-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1634, + "BBH": 0.5938, + "MATH Level 5": 0.0831, + "GPQA": 0.328, + "MUSR": 0.4111, + "MMLU-PRO": 0.4145 + } + }, + { + "model_id": "zelk12/MT1-Max-Merge_02012025163610-gemma-2-9B", + "name": "MT1-Max-Merge_02012025163610-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7929, + "BBH": 0.6123, + "MATH Level 5": 0.2228, + "GPQA": 0.3549, + "MUSR": 0.4255, + "MMLU-PRO": 0.4382 + } + }, + { + "model_id": "zelk12/MT1-gemma-2-9B", + "name": "MT1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7947, + "BBH": 0.6109, + "MATH Level 5": 0.2236, + "GPQA": 0.3456, + "MUSR": 0.4322, + "MMLU-PRO": 0.4358 + } + }, + { + "model_id": "zelk12/MT2-Gen1-gemma-2-9B", + "name": "MT2-Gen1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7856, + "BBH": 0.6101, + "MATH Level 5": 0.2213, + "GPQA": 0.3431, + "MUSR": 0.4243, + "MMLU-PRO": 0.4377 + } + }, + { + "model_id": "zelk12/MT2-Gen2-gemma-2-9B", + "name": "MT2-Gen2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7889, + "BBH": 0.6093, + "MATH Level 5": 0.2183, + "GPQA": 0.3465, + "MUSR": 0.427, + "MMLU-PRO": 0.4388 + } + }, + { + "model_id": "zelk12/MT2-Gen3-gemma-2-9B", + "name": "MT2-Gen3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.781, + "BBH": 0.6105, + "MATH Level 5": 0.2107, + "GPQA": 0.3465, + "MUSR": 0.4231, + "MMLU-PRO": 0.4374 + } + }, + { + "model_id": "zelk12/MT2-Gen4-gemma-2-9B", + "name": "MT2-Gen4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7896, + "BBH": 0.6097, + "MATH Level 5": 0.2236, + "GPQA": 0.3456, + "MUSR": 0.4125, + "MMLU-PRO": 0.4321 + } + }, + { + "model_id": "zelk12/MT2-Gen5-gemma-2-9B", + "name": "MT2-Gen5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7749, + "BBH": 0.6064, + "MATH Level 5": 0.2107, + "GPQA": 0.3515, + "MUSR": 0.4244, + "MMLU-PRO": 0.4302 + } + }, + { + "model_id": "zelk12/MT2-Gen6-gemma-2-9B", + "name": "MT2-Gen6-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1664, + "BBH": 0.596, + "MATH Level 5": 0.0846, + "GPQA": 0.3381, + "MUSR": 0.4137, + "MMLU-PRO": 0.421 + } + }, + { + "model_id": "zelk12/MT2-Gen7-gemma-2-9B", + "name": "MT2-Gen7-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1762, + "BBH": 0.6079, + "MATH Level 5": 0.102, + "GPQA": 0.3549, + "MUSR": 0.4203, + "MMLU-PRO": 0.4311 + } + }, + { + "model_id": "zelk12/MT2-Max-Merge_02012025163610-gemma-2-9B", + "name": "MT2-Max-Merge_02012025163610-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7901, + "BBH": 0.6108, + "MATH Level 5": 0.2243, + "GPQA": 0.3515, + "MUSR": 0.4228, + "MMLU-PRO": 0.4391 + } + }, + { + "model_id": "zelk12/MT2-gemma-2-9B", + "name": "MT2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7886, + "BBH": 0.6115, + "MATH Level 5": 0.2213, + "GPQA": 0.3473, + "MUSR": 0.4217, + "MMLU-PRO": 0.4368 + } + }, + { + "model_id": "zelk12/MT3-Gen1-gemma-2-9B", + "name": "MT3-Gen1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7838, + "BBH": 0.6107, + "MATH Level 5": 0.2145, + "GPQA": 0.3465, + "MUSR": 0.4151, + "MMLU-PRO": 0.4327 + } + }, + { + "model_id": "zelk12/MT3-Gen2-gemma-2-9B", + "name": "MT3-Gen2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7843, + "BBH": 0.6091, + "MATH Level 5": 0.2236, + "GPQA": 0.3574, + "MUSR": 0.4111, + "MMLU-PRO": 0.4333 + } + }, + { + "model_id": "zelk12/MT3-Gen3-gemma-2-9B", + "name": "MT3-Gen3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7856, + "BBH": 0.6089, + "MATH Level 5": 0.2153, + "GPQA": 0.3515, + "MUSR": 0.4258, + "MMLU-PRO": 0.4303 + } + }, + { + "model_id": "zelk12/MT3-Gen4-gemma-2-9B", + "name": "MT3-Gen4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7737, + "BBH": 0.6101, + "MATH Level 5": 0.2062, + "GPQA": 0.3473, + "MUSR": 0.4476, + "MMLU-PRO": 0.4387 + } + }, + { + "model_id": "zelk12/MT3-Gen5-gemma-2-9B", + "name": "MT3-Gen5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.799, + "BBH": 0.6099, + "MATH Level 5": 0.2266, + "GPQA": 0.3532, + "MUSR": 0.4191, + "MMLU-PRO": 0.4317 + } + }, + { + "model_id": "zelk12/MT3-Gen5-gemma-2-9B_v1", + "name": "MT3-Gen5-gemma-2-9B_v1", + "developer": "zelk12", + "scores": { + "IFEval": 0.7996, + "BBH": 0.6113, + "MATH Level 5": 0.2228, + "GPQA": 0.349, + "MUSR": 0.4204, + "MMLU-PRO": 0.4359 + } + }, + { + "model_id": "zelk12/MT3-Gen6-gemma-2-9B", + "name": "MT3-Gen6-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1762, + "BBH": 0.602, + "MATH Level 5": 0.0884, + "GPQA": 0.3431, + "MUSR": 0.4126, + "MMLU-PRO": 0.4102 + } + }, + { + "model_id": "zelk12/MT3-Max-Merge_02012025163610-gemma-2-9B", + "name": "MT3-Max-Merge_02012025163610-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1762, + "BBH": 0.6123, + "MATH Level 5": 0.1012, + "GPQA": 0.3507, + "MUSR": 0.4255, + "MMLU-PRO": 0.4389 + } + }, + { + "model_id": "zelk12/MT3-gemma-2-9B", + "name": "MT3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7786, + "BBH": 0.6131, + "MATH Level 5": 0.2168, + "GPQA": 0.3448, + "MUSR": 0.4243, + "MMLU-PRO": 0.4327 + } + }, + { + "model_id": "zelk12/MT4-Gen1-gemma-2-9B", + "name": "MT4-Gen1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7895, + "BBH": 0.6094, + "MATH Level 5": 0.2198, + "GPQA": 0.344, + "MUSR": 0.4322, + "MMLU-PRO": 0.4389 + } + }, + { + "model_id": "zelk12/MT4-Gen2-gemma-2-9B", + "name": "MT4-Gen2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.8051, + "BBH": 0.6108, + "MATH Level 5": 0.2326, + "GPQA": 0.3456, + "MUSR": 0.4257, + "MMLU-PRO": 0.4368 + } + }, + { + "model_id": "zelk12/MT4-Gen3-gemma-2-9B", + "name": "MT4-Gen3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7841, + "BBH": 0.6087, + "MATH Level 5": 0.219, + "GPQA": 0.344, + "MUSR": 0.4243, + "MMLU-PRO": 0.4381 + } + }, + { + "model_id": "zelk12/MT4-Gen4-gemma-2-9B", + "name": "MT4-Gen4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7874, + "BBH": 0.6076, + "MATH Level 5": 0.2145, + "GPQA": 0.3523, + "MUSR": 0.4244, + "MMLU-PRO": 0.4323 + } + }, + { + "model_id": "zelk12/MT4-Gen5-gemma-2-9B", + "name": "MT4-Gen5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7789, + "BBH": 0.6107, + "MATH Level 5": 0.2266, + "GPQA": 0.3565, + "MUSR": 0.4268, + "MMLU-PRO": 0.4384 + } + }, + { + "model_id": "zelk12/MT4-Max-Merge_02012025163610-gemma-2-9B", + "name": "MT4-Max-Merge_02012025163610-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1771, + "BBH": 0.612, + "MATH Level 5": 0.0952, + "GPQA": 0.3515, + "MUSR": 0.4228, + "MMLU-PRO": 0.4391 + } + }, + { + "model_id": "zelk12/MT4-gemma-2-9B", + "name": "MT4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7762, + "BBH": 0.6073, + "MATH Level 5": 0.2085, + "GPQA": 0.3381, + "MUSR": 0.4309, + "MMLU-PRO": 0.4366 + } + }, + { + "model_id": "zelk12/MT5-Gen1-gemma-2-9B", + "name": "MT5-Gen1-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7831, + "BBH": 0.611, + "MATH Level 5": 0.2213, + "GPQA": 0.3473, + "MUSR": 0.4204, + "MMLU-PRO": 0.4368 + } + }, + { + "model_id": "zelk12/MT5-Gen2-gemma-2-9B", + "name": "MT5-Gen2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7962, + "BBH": 0.6105, + "MATH Level 5": 0.2205, + "GPQA": 0.3515, + "MUSR": 0.4163, + "MMLU-PRO": 0.4379 + } + }, + { + "model_id": "zelk12/MT5-Gen3-gemma-2-9B", + "name": "MT5-Gen3-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7825, + "BBH": 0.609, + "MATH Level 5": 0.2168, + "GPQA": 0.3515, + "MUSR": 0.4231, + "MMLU-PRO": 0.4375 + } + }, + { + "model_id": "zelk12/MT5-Gen4-gemma-2-9B", + "name": "MT5-Gen4-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7835, + "BBH": 0.6131, + "MATH Level 5": 0.2243, + "GPQA": 0.3532, + "MUSR": 0.4228, + "MMLU-PRO": 0.4397 + } + }, + { + "model_id": "zelk12/MT5-Gen5-gemma-2-9B", + "name": "MT5-Gen5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7947, + "BBH": 0.6112, + "MATH Level 5": 0.2258, + "GPQA": 0.3482, + "MUSR": 0.4191, + "MMLU-PRO": 0.4329 + } + }, + { + "model_id": "zelk12/MT5-Max-Merge_02012025163610-gemma-2-9B", + "name": "MT5-Max-Merge_02012025163610-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1762, + "BBH": 0.6127, + "MATH Level 5": 0.0982, + "GPQA": 0.3515, + "MUSR": 0.4228, + "MMLU-PRO": 0.439 + } + }, + { + "model_id": "zelk12/MT5-gemma-2-9B", + "name": "MT5-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.8048, + "BBH": 0.6112, + "MATH Level 5": 0.2258, + "GPQA": 0.3431, + "MUSR": 0.4204, + "MMLU-PRO": 0.4367 + } + }, + { + "model_id": "zelk12/MTM-Merge-gemma-2-9B", + "name": "MTM-Merge-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7798, + "BBH": 0.6133, + "MATH Level 5": 0.2175, + "GPQA": 0.3549, + "MUSR": 0.4268, + "MMLU-PRO": 0.4388 + } + }, + { + "model_id": "zelk12/MTMaMe-Merge_02012025163610-gemma-2-9B", + "name": "MTMaMe-Merge_02012025163610-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.1786, + "BBH": 0.6117, + "MATH Level 5": 0.0959, + "GPQA": 0.3523, + "MUSR": 0.4241, + "MMLU-PRO": 0.4382 + } + }, + { + "model_id": "zelk12/Rv0.4DMv1t0.25-gemma-2-9B", + "name": "Rv0.4DMv1t0.25-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7497, + "BBH": 0.607, + "MATH Level 5": 0.2258, + "GPQA": 0.3456, + "MUSR": 0.4309, + "MMLU-PRO": 0.4401 + } + }, + { + "model_id": "zelk12/Rv0.4DMv1t0.25Tt0.25-gemma-2-9B", + "name": "Rv0.4DMv1t0.25Tt0.25-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7646, + "BBH": 0.6098, + "MATH Level 5": 0.2069, + "GPQA": 0.3423, + "MUSR": 0.4283, + "MMLU-PRO": 0.4347 + } + }, + { + "model_id": "zelk12/Rv0.4MT4g2-gemma-2-9B", + "name": "Rv0.4MT4g2-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.732, + "BBH": 0.6041, + "MATH Level 5": 0.1949, + "GPQA": 0.3532, + "MUSR": 0.4231, + "MMLU-PRO": 0.4417 + } + }, + { + "model_id": "zelk12/T31122024203920-gemma-2-9B", + "name": "T31122024203920-gemma-2-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7676, + "BBH": 0.6096, + "MATH Level 5": 0.2054, + "GPQA": 0.3507, + "MUSR": 0.4322, + "MMLU-PRO": 0.4373 + } + }, + { + "model_id": "zelk12/Test01012025155054", + "name": "Test01012025155054", + "developer": "zelk12", + "scores": { + "IFEval": 0.1555, + "BBH": 0.283, + "MATH Level 5": 0.0, + "GPQA": 0.2416, + "MUSR": 0.367, + "MMLU-PRO": 0.109 + } + }, + { + "model_id": "zelk12/Test01012025155054t0.5_gemma-2", + "name": "Test01012025155054t0.5_gemma-2", + "developer": "zelk12", + "scores": { + "IFEval": 0.1555, + "BBH": 0.283, + "MATH Level 5": 0.0, + "GPQA": 0.2416, + "MUSR": 0.367, + "MMLU-PRO": 0.109 + } + }, + { + "model_id": "zelk12/gemma-2-S2MTM-9B", + "name": "gemma-2-S2MTM-9B", + "developer": "zelk12", + "scores": { + "IFEval": 0.7823, + "BBH": 0.6061, + "MATH Level 5": 0.2047, + "GPQA": 0.3456, + "MUSR": 0.4218, + "MMLU-PRO": 0.4297 + } + }, + { + "model_id": "zelk12/recoilme-gemma-2-Ataraxy-9B-v0.1", + "name": "recoilme-gemma-2-Ataraxy-9B-v0.1", + "developer": "zelk12", + "scores": { + "IFEval": 0.7649, + "BBH": 0.6075, + "MATH Level 5": 0.2281, + "GPQA": 0.3498, + "MUSR": 0.4136, + "MMLU-PRO": 0.4321 + } + }, + { + "model_id": "zelk12/recoilme-gemma-2-Ataraxy-9B-v0.1-t0.25", + "name": "recoilme-gemma-2-Ataraxy-9B-v0.1-t0.25", + "developer": "zelk12", + "scores": { + "IFEval": 0.7707, + "BBH": 0.6075, + "MATH Level 5": 0.2145, + "GPQA": 0.3431, + "MUSR": 0.4323, + "MMLU-PRO": 0.44 + } + }, + { + "model_id": "zelk12/recoilme-gemma-2-Ataraxy-9B-v0.1-t0.75", + "name": "recoilme-gemma-2-Ataraxy-9B-v0.1-t0.75", + "developer": "zelk12", + "scores": { + "IFEval": 0.7208, + "BBH": 0.5995, + "MATH Level 5": 0.2017, + "GPQA": 0.3498, + "MUSR": 0.3951, + "MMLU-PRO": 0.4141 + } + }, + { + "model_id": "zelk12/recoilme-gemma-2-Ataraxy-9B-v0.2", + "name": "recoilme-gemma-2-Ataraxy-9B-v0.2", + "developer": "zelk12", + "scores": { + "IFEval": 0.76, + "BBH": 0.6066, + "MATH Level 5": 0.2228, + "GPQA": 0.3482, + "MUSR": 0.411, + "MMLU-PRO": 0.4323 + } + }, + { + "model_id": "zelk12/recoilme-gemma-2-Gutenberg-Doppel-9B-v0.1", + "name": "recoilme-gemma-2-Gutenberg-Doppel-9B-v0.1", + "developer": "zelk12", + "scores": { + "IFEval": 0.7615, + "BBH": 0.6099, + "MATH Level 5": 0.21, + "GPQA": 0.3414, + "MUSR": 0.431, + "MMLU-PRO": 0.4315 + } + }, + { + "model_id": "zelk12/recoilme-gemma-2-Ifable-9B-v0.1", + "name": "recoilme-gemma-2-Ifable-9B-v0.1", + "developer": "zelk12", + "scores": { + "IFEval": 0.7944, + "BBH": 0.6064, + "MATH Level 5": 0.2205, + "GPQA": 0.3515, + "MUSR": 0.4202, + "MMLU-PRO": 0.4323 + } + }, + { + "model_id": "zelk12/recoilme-gemma-2-psy10k-mental_healt-9B-v0.1", + "name": "recoilme-gemma-2-psy10k-mental_healt-9B-v0.1", + "developer": "zelk12", + "scores": { + "IFEval": 0.7445, + "BBH": 0.5978, + "MATH Level 5": 0.1888, + "GPQA": 0.344, + "MUSR": 0.4295, + "MMLU-PRO": 0.4181 + } + }, + { + "model_id": "zetasepic/Qwen2.5-32B-Instruct-abliterated-v2", + "name": "Qwen2.5-32B-Instruct-abliterated-v2", + "developer": "zetasepic", + "scores": { + "IFEval": 0.8334, + "BBH": 0.6934, + "MATH Level 5": 0.5952, + "GPQA": 0.3674, + "MUSR": 0.4354, + "MMLU-PRO": 0.5622 + } + }, + { + "model_id": "zetasepic/Qwen2.5-72B-Instruct-abliterated", + "name": "Qwen2.5-72B-Instruct-abliterated", + "developer": "zetasepic", + "scores": { + "IFEval": 0.7153, + "BBH": 0.7152, + "MATH Level 5": 0.5242, + "GPQA": 0.4069, + "MUSR": 0.4719, + "MMLU-PRO": 0.5872 + } + }, + { + "model_id": "zhengr/MixTAO-7Bx2-MoE-v8.1", + "name": "MixTAO-7Bx2-MoE-v8.1", + "developer": "zhengr", + "scores": { + "IFEval": 0.4188, + "BBH": 0.4202, + "MATH Level 5": 0.0604, + "GPQA": 0.2987, + "MUSR": 0.3976, + "MMLU-PRO": 0.2847 + } + } + ] +} \ No newline at end of file