Upload eval_results.csv
Browse files- eval_results.csv +335 -0
eval_results.csv
CHANGED
|
@@ -320,6 +320,73 @@ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.16
|
|
| 320 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 321 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 322 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 323 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 324 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 325 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
|
@@ -966,6 +1033,73 @@ google/gemma-2-2b-it:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/goo
|
|
| 966 |
google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 967 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 968 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 969 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 970 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 971 |
google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
|
@@ -2574,6 +2708,140 @@ google/gemma-2-2b-it:W8A8_FP8,task_openbookqa,acc,0.36,W8A8_FP8,espressor/google
|
|
| 2574 |
google/gemma-2-2b-it:W8A8_FP8,task_piqa,acc,0.7861806311207835,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2575 |
google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3733170134638923,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2576 |
google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.5289090993939894,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2577 |
google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2578 |
google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2579 |
google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
|
@@ -2716,6 +2984,73 @@ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.2185430463576
|
|
| 2716 |
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2717 |
google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2718 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_boolq,acc,0.7804281345565749,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2719 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2720 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.3181818181818182,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2721 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.29120879120879123,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
|
|
|
| 320 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 321 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 322 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 323 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu,acc,0.23394103404073494,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 324 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_humanities,acc,0.24654622741764082,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 325 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 326 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.23636363636363636,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 327 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 328 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.26582278481012656,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 329 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_international_law,acc,0.24793388429752067,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 330 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.25925925925925924,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 331 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.26993865030674846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 332 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.2543352601156069,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 333 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 334 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_philosophy,acc,0.22186495176848875,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 335 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_prehistory,acc,0.23765432098765432,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 336 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_law,acc,0.24445893089960888,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 337 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_world_religions,acc,0.2807017543859649,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 338 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_other,acc,0.2281943997425169,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 339 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.21,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 340 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 341 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.27167630057803466,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 342 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_global_facts,acc,0.15,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 343 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_aging,acc,0.17937219730941703,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 344 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_management,acc,0.33980582524271846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 345 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_marketing,acc,0.25213675213675213,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 346 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.31,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 347 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 348 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_nutrition,acc,0.21895424836601307,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 349 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.24113475177304963,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 350 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.17279411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 351 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_virology,acc,0.2891566265060241,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 352 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.23366915827104323,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 353 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_econometrics,acc,0.2543859649122807,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 354 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.26262626262626265,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 355 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.18652849740932642,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 356 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.22564102564102564,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 357 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.226890756302521,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 358 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.25321100917431194,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 359 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.2595419847328244,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 360 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.22712418300653595,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 361 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_public_relations,acc,0.2727272727272727,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 362 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_security_studies,acc,0.19183673469387755,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 363 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_sociology,acc,0.23383084577114427,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 364 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 365 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_stem,acc,0.2210593085949889,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 366 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 367 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_anatomy,acc,0.2074074074074074,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 368 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_astronomy,acc,0.2236842105263158,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 369 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_biology,acc,0.22916666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 370 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 371 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 372 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 373 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_physics,acc,0.23529411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 374 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_computer_security,acc,0.27,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 375 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.19574468085106383,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 376 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.2206896551724138,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 377 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.24867724867724866,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 378 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.2032258064516129,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 379 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 380 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.2,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 381 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.21851851851851853,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 382 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.23178807947019867,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 383 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.16666666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 384 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 385 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 386 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 387 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 388 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 389 |
+
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 390 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 391 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
| 392 |
meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
|
|
|
|
| 1033 |
google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1034 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1035 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1036 |
+
google/gemma-2-2b-it:W4A16,task_boolq,acc,0.8333333333333334,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1037 |
+
google/gemma-2-2b-it:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1038 |
+
google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1039 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_humanities,acc,0.491817215727949,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1040 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_formal_logic,acc,0.3412698412698413,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1041 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_european_history,acc,0.7272727272727273,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1042 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_us_history,acc,0.7450980392156863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1043 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_world_history,acc,0.7468354430379747,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1044 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_international_law,acc,0.6942148760330579,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1045 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_jurisprudence,acc,0.6296296296296297,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1046 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_logical_fallacies,acc,0.6809815950920245,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1047 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_moral_disputes,acc,0.5982658959537572,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1048 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1049 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_philosophy,acc,0.6205787781350482,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1050 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_prehistory,acc,0.595679012345679,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1051 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_professional_law,acc,0.41134289439374183,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1052 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_world_religions,acc,0.7134502923976608,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1053 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_other,acc,0.618925008046347,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1054 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_business_ethics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1055 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_clinical_knowledge,acc,0.6,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1056 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_college_medicine,acc,0.5838150289017341,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1057 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_global_facts,acc,0.29,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1058 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_human_aging,acc,0.5560538116591929,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1059 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_management,acc,0.7961165048543689,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1060 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_marketing,acc,0.7863247863247863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1061 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_medical_genetics,acc,0.61,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1062 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_miscellaneous,acc,0.7535121328224776,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1063 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_nutrition,acc,0.6437908496732027,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1064 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_professional_accounting,acc,0.3971631205673759,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1065 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_professional_medicine,acc,0.5625,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1066 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_virology,acc,0.4879518072289157,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1067 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_social_sciences,acc,0.6564835879103023,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1068 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_econometrics,acc,0.3508771929824561,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1069 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_geography,acc,0.7373737373737373,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1070 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_government_and_politics,acc,0.772020725388601,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1071 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_macroeconomics,acc,0.5897435897435898,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1072 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_microeconomics,acc,0.5714285714285714,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1073 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_psychology,acc,0.8073394495412844,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1074 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_human_sexuality,acc,0.6564885496183206,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1075 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_professional_psychology,acc,0.5392156862745098,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1076 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_public_relations,acc,0.6454545454545455,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1077 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_security_studies,acc,0.6653061224489796,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1078 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_sociology,acc,0.746268656716418,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1079 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_us_foreign_policy,acc,0.79,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1080 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_stem,acc,0.4865207738661592,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1081 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_abstract_algebra,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1082 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_anatomy,acc,0.5555555555555556,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1083 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_astronomy,acc,0.5986842105263158,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1084 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_college_biology,acc,0.6944444444444444,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1085 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_college_chemistry,acc,0.44,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1086 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_college_computer_science,acc,0.47,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1087 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_college_mathematics,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1088 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_college_physics,acc,0.3137254901960784,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1089 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_computer_security,acc,0.68,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1090 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_conceptual_physics,acc,0.4297872340425532,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1091 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_electrical_engineering,acc,0.5586206896551724,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1092 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_elementary_mathematics,acc,0.42063492063492064,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1093 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_biology,acc,0.7322580645161291,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1094 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_chemistry,acc,0.4236453201970443,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1095 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_computer_science,acc,0.59,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1096 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_mathematics,acc,0.34814814814814815,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1097 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_physics,acc,0.31125827814569534,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1098 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_high_school_statistics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1099 |
+
google/gemma-2-2b-it:W4A16,task_mmlu_machine_learning,acc,0.36607142857142855,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1100 |
+
google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1101 |
+
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1102 |
+
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1103 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1104 |
google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
| 1105 |
google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
|
|
|
|
| 2708 |
google/gemma-2-2b-it:W8A8_FP8,task_piqa,acc,0.7861806311207835,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2709 |
google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3733170134638923,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2710 |
google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.5289090993939894,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2711 |
+
google/gemma-2-2b-it:W8A8_FP8,task_boolq,acc,0.8388379204892966,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2712 |
+
google/gemma-2-2b-it:W8A8_FP8,task_logiqa,acc,0.2764976958525346,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2713 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu,acc,0.5704315624554906,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2714 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_humanities,acc,0.5092454835281616,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2715 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_formal_logic,acc,0.35714285714285715,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2716 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.7333333333333333,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2717 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.7450980392156863,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2718 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.759493670886076,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2719 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_international_law,acc,0.7107438016528925,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2720 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_jurisprudence,acc,0.6851851851851852,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2721 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.7361963190184049,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2722 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_moral_disputes,acc,0.6329479768786127,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2723 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.24916201117318434,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2724 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_philosophy,acc,0.6495176848874598,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2725 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_prehistory,acc,0.6141975308641975,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2726 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_law,acc,0.42633637548891784,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2727 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_world_religions,acc,0.7076023391812866,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2728 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_other,acc,0.6411329256517541,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2729 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_business_ethics,acc,0.52,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2730 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.6339622641509434,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2731 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_medicine,acc,0.6184971098265896,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2732 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_global_facts,acc,0.29,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2733 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_human_aging,acc,0.5964125560538116,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2734 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_management,acc,0.7864077669902912,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2735 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_marketing,acc,0.811965811965812,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2736 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_medical_genetics,acc,0.65,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2737 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_miscellaneous,acc,0.7675606641123882,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2738 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_nutrition,acc,0.6601307189542484,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2739 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_accounting,acc,0.425531914893617,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2740 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_medicine,acc,0.5661764705882353,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2741 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_virology,acc,0.5421686746987951,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2742 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_social_sciences,acc,0.6766330841728957,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2743 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_econometrics,acc,0.40350877192982454,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2744 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_geography,acc,0.7373737373737373,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2745 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.7927461139896373,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2746 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.6205128205128205,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2747 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.5756302521008403,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2748 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.8238532110091743,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2749 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_human_sexuality,acc,0.6870229007633588,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2750 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_psychology,acc,0.5571895424836601,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2751 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_public_relations,acc,0.6727272727272727,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2752 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_security_studies,acc,0.689795918367347,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2753 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_sociology,acc,0.7860696517412935,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2754 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.77,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2755 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_stem,acc,0.48842372343799556,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2756 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.39,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2757 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_anatomy,acc,0.5333333333333333,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2758 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_astronomy,acc,0.5657894736842105,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2759 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_biology,acc,0.6875,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2760 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_chemistry,acc,0.45,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2761 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_computer_science,acc,0.44,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2762 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_mathematics,acc,0.37,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2763 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_physics,acc,0.35294117647058826,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2764 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_computer_security,acc,0.63,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2765 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.46382978723404256,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2766 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.5862068965517241,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2767 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.4126984126984127,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2768 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_biology,acc,0.7548387096774194,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2769 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.4433497536945813,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2770 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.6,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2771 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.362962962962963,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2772 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_physics,acc,0.2781456953642384,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2773 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.49074074074074076,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2774 |
+
google/gemma-2-2b-it:W8A8_FP8,task_mmlu_machine_learning,acc,0.3482142857142857,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2775 |
+
google/gemma-2-2b-it:W8A8_FP8,task_openbookqa,acc,0.36,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2776 |
+
google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3733170134638923,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2777 |
+
google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.5289090993939894,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
|
| 2778 |
+
google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2779 |
+
google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2780 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu,acc,0.2457627118644068,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2781 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_humanities,acc,0.24187035069075452,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2782 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_formal_logic,acc,0.23015873015873015,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2783 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_european_history,acc,0.24848484848484848,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2784 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_us_history,acc,0.23529411764705882,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2785 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_world_history,acc,0.22362869198312235,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2786 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_international_law,acc,0.23140495867768596,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2787 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_jurisprudence,acc,0.3148148148148148,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2788 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_logical_fallacies,acc,0.2331288343558282,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2789 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_disputes,acc,0.2630057803468208,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2790 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_scenarios,acc,0.23798882681564246,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2791 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_philosophy,acc,0.2379421221864952,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2792 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_prehistory,acc,0.23765432098765432,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2793 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_law,acc,0.2470664928292047,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2794 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_world_religions,acc,0.19298245614035087,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2795 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_other,acc,0.25523012552301255,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2796 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_business_ethics,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2797 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2798 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_medicine,acc,0.2023121387283237,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2799 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_global_facts,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2800 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_aging,acc,0.34977578475336324,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2801 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_management,acc,0.2524271844660194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2802 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_marketing,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2803 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_medical_genetics,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2804 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_miscellaneous,acc,0.2707535121328225,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2805 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_nutrition,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2806 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_accounting,acc,0.19858156028368795,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2807 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_medicine,acc,0.22794117647058823,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2808 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_virology,acc,0.3373493975903614,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2809 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_social_sciences,acc,0.24731881702957426,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2810 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_econometrics,acc,0.22807017543859648,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2811 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_geography,acc,0.20707070707070707,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2812 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.22279792746113988,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2813 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2814 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.23949579831932774,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2815 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_psychology,acc,0.25321100917431194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2816 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_sexuality,acc,0.22137404580152673,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2817 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_psychology,acc,0.2679738562091503,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2818 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_public_relations,acc,0.32727272727272727,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2819 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_security_studies,acc,0.21224489795918366,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2820 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_sociology,acc,0.27860696517412936,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2821 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2822 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_stem,acc,0.2407231208372978,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2823 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_abstract_algebra,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2824 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_anatomy,acc,0.1925925925925926,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2825 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_astronomy,acc,0.23026315789473684,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2826 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_biology,acc,0.2152777777777778,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2827 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_chemistry,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2828 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_computer_science,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2829 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_mathematics,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2830 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_physics,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2831 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_computer_security,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2832 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_conceptual_physics,acc,0.3148936170212766,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2833 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_electrical_engineering,acc,0.21379310344827587,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2834 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.24338624338624337,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2835 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_biology,acc,0.22903225806451613,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2836 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.2660098522167488,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2837 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.26,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2838 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.26666666666666666,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2839 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.2185430463576159,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2840 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2841 |
+
google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2842 |
+
google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2843 |
+
google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc1,acc,0.23378212974296206,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2844 |
+
google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc2,acc,,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2845 |
google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2846 |
google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2847 |
google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
|
|
|
| 2984 |
google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2985 |
google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
|
| 2986 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_boolq,acc,0.7804281345565749,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2987 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_logiqa,acc,0.250384024577573,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2988 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu,acc,0.5977068793619142,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2989 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_humanities,acc,0.5844845908607864,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2990 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_formal_logic,acc,0.3412698412698413,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2991 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.7212121212121212,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2992 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.7450980392156863,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2993 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.7763713080168776,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2994 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_international_law,acc,0.743801652892562,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2995 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_jurisprudence,acc,0.6203703703703703,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2996 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.7055214723926381,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2997 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_moral_disputes,acc,0.6416184971098265,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2998 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.5698324022346368,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 2999 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_philosophy,acc,0.6720257234726688,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3000 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_prehistory,acc,0.6512345679012346,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3001 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_law,acc,0.4556714471968709,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3002 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_world_religions,acc,0.7543859649122807,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3003 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_other,acc,0.663018989378822,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3004 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_business_ethics,acc,0.58,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3005 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.6339622641509434,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3006 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_medicine,acc,0.5953757225433526,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3007 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_global_facts,acc,0.33,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3008 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_human_aging,acc,0.5695067264573991,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3009 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_management,acc,0.7572815533980582,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3010 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_marketing,acc,0.8803418803418803,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3011 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_medical_genetics,acc,0.71,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3012 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_miscellaneous,acc,0.7675606641123882,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3013 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_nutrition,acc,0.6633986928104575,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3014 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_accounting,acc,0.4645390070921986,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3015 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_medicine,acc,0.75,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3016 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_virology,acc,0.463855421686747,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3017 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_social_sciences,acc,0.6590835229119272,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3018 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_econometrics,acc,0.38596491228070173,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3019 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_geography,acc,0.7070707070707071,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3020 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.7461139896373057,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3021 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.5538461538461539,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3022 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.592436974789916,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3023 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.7651376146788991,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3024 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_human_sexuality,acc,0.6870229007633588,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3025 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_psychology,acc,0.5931372549019608,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3026 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_public_relations,acc,0.6181818181818182,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3027 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_security_studies,acc,0.6571428571428571,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3028 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_sociology,acc,0.8059701492537313,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3029 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.82,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3030 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_stem,acc,0.4931810973675864,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3031 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.29,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3032 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_anatomy,acc,0.5703703703703704,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3033 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_astronomy,acc,0.6776315789473685,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3034 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_biology,acc,0.7083333333333334,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3035 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_chemistry,acc,0.36,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3036 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_computer_science,acc,0.48,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3037 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_mathematics,acc,0.32,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3038 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_physics,acc,0.3431372549019608,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3039 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_computer_security,acc,0.7,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3040 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.4978723404255319,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3041 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.5862068965517241,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3042 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.3915343915343915,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3043 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_biology,acc,0.7064516129032258,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3044 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.5467980295566502,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3045 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.58,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3046 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.3333333333333333,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3047 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_physics,acc,0.36423841059602646,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3048 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.3888888888888889,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3049 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_machine_learning,acc,0.5,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3050 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_openbookqa,acc,0.278,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3051 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_truthfulqa_mc1,acc,0.31701346389228885,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3052 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_truthfulqa_mc2,acc,0.49237827622660857,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3053 |
+
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_boolq,acc,0.7804281345565749,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3054 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3055 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.3181818181818182,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|
| 3056 |
meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.29120879120879123,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
|