model,task,metric,value,precision,hf_name,model_physical_size google/gemma-7b-it:Default (bf16/fp16),task_mmlu,acc,0.5014242985329725,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_humanities,acc,0.4486716259298619,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_formal_logic,acc,0.373015873015873,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_european_history,acc,0.6303030303030303,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_us_history,acc,0.5980392156862745,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_world_history,acc,0.6962025316455697,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_international_law,acc,0.6611570247933884,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_jurisprudence,acc,0.6388888888888888,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_logical_fallacies,acc,0.5705521472392638,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_moral_disputes,acc,0.5606936416184971,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_moral_scenarios,acc,0.23128491620111732,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_philosophy,acc,0.5787781350482315,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_prehistory,acc,0.5524691358024691,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_professional_law,acc,0.3644067796610169,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_world_religions,acc,0.6549707602339181,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_other,acc,0.5774058577405857,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_business_ethics,acc,0.52,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_clinical_knowledge,acc,0.539622641509434,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_college_medicine,acc,0.4393063583815029,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_global_facts,acc,0.41,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_human_aging,acc,0.6322869955156951,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_management,acc,0.6893203883495146,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_marketing,acc,0.8205128205128205,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_medical_genetics,acc,0.59,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_miscellaneous,acc,0.7011494252873564,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_nutrition,acc,0.5686274509803921,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_professional_accounting,acc,0.35106382978723405,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_professional_medicine,acc,0.45588235294117646,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_virology,acc,0.4397590361445783,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_social_sciences,acc,0.5833604159896003,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_econometrics,acc,0.3157894736842105,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_geography,acc,0.696969696969697,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_government_and_politics,acc,0.694300518134715,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_macroeconomics,acc,0.48205128205128206,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_microeconomics,acc,0.4831932773109244,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_psychology,acc,0.7357798165137615,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_human_sexuality,acc,0.6259541984732825,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_professional_psychology,acc,0.4918300653594771,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_public_relations,acc,0.6636363636363637,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_security_studies,acc,0.5061224489795918,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_sociology,acc,0.6666666666666666,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_us_foreign_policy,acc,0.69,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_stem,acc,0.4253092293054234,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_abstract_algebra,acc,0.29,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_anatomy,acc,0.4888888888888889,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_astronomy,acc,0.506578947368421,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_college_biology,acc,0.5555555555555556,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_college_chemistry,acc,0.37,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_college_computer_science,acc,0.5,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_college_mathematics,acc,0.34,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_college_physics,acc,0.24509803921568626,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_computer_security,acc,0.73,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_conceptual_physics,acc,0.4808510638297872,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_electrical_engineering,acc,0.47586206896551725,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_elementary_mathematics,acc,0.32275132275132273,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_biology,acc,0.603225806451613,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_chemistry,acc,0.39408866995073893,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_computer_science,acc,0.53,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_mathematics,acc,0.2962962962962963,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_physics,acc,0.3443708609271523,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_high_school_statistics,acc,0.3055555555555556,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-7b-it:Default (bf16/fp16),task_mmlu_machine_learning,acc,0.42857142857142855,Default (bf16/fp16),google/gemma-7b-it,17075361792 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu,acc,0.7182737501780373,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_humanities,acc,0.6505844845908608,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_formal_logic,acc,0.5396825396825397,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_european_history,acc,0.8545454545454545,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_us_history,acc,0.8774509803921569,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_world_history,acc,0.9071729957805907,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_international_law,acc,0.8760330578512396,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_jurisprudence,acc,0.8333333333333334,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_logical_fallacies,acc,0.8220858895705522,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_moral_disputes,acc,0.7601156069364162,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_moral_scenarios,acc,0.4,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_philosophy,acc,0.7684887459807074,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_prehistory,acc,0.808641975308642,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_professional_law,acc,0.560625814863103,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_world_religions,acc,0.8538011695906432,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_other,acc,0.7682652075957516,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_business_ethics,acc,0.71,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_clinical_knowledge,acc,0.769811320754717,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_college_medicine,acc,0.7225433526011561,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_global_facts,acc,0.44,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_human_aging,acc,0.7757847533632287,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_management,acc,0.8640776699029126,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_marketing,acc,0.9145299145299145,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_medical_genetics,acc,0.84,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_miscellaneous,acc,0.8722860791826309,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_nutrition,acc,0.7418300653594772,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_professional_accounting,acc,0.599290780141844,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_professional_medicine,acc,0.7941176470588235,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_virology,acc,0.5301204819277109,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_social_sciences,acc,0.8358791030224244,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_econometrics,acc,0.5964912280701754,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_geography,acc,0.898989898989899,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_government_and_politics,acc,0.9481865284974094,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_macroeconomics,acc,0.8,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_microeconomics,acc,0.8277310924369747,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_psychology,acc,0.9155963302752294,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_human_sexuality,acc,0.8091603053435115,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_professional_psychology,acc,0.7826797385620915,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_public_relations,acc,0.7545454545454545,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_security_studies,acc,0.8163265306122449,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_sociology,acc,0.8656716417910447,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_us_foreign_policy,acc,0.93,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_stem,acc,0.6552489692356486,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_abstract_algebra,acc,0.43,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_anatomy,acc,0.7111111111111111,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_astronomy,acc,0.8026315789473685,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_college_biology,acc,0.8611111111111112,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_college_chemistry,acc,0.53,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_college_computer_science,acc,0.56,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_college_mathematics,acc,0.42,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_college_physics,acc,0.5,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_computer_security,acc,0.81,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_conceptual_physics,acc,0.676595744680851,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_electrical_engineering,acc,0.7103448275862069,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_elementary_mathematics,acc,0.6058201058201058,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_biology,acc,0.9064516129032258,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_chemistry,acc,0.6847290640394089,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_computer_science,acc,0.79,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_mathematics,acc,0.45555555555555555,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_physics,acc,0.5695364238410596,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_high_school_statistics,acc,0.6481481481481481,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-9b-it:Default (bf16/fp16),task_mmlu_machine_learning,acc,0.5267857142857143,Default (bf16/fp16),google/gemma-2-9b-it,18483411968 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu,acc,0.568651189289275,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_humanities,acc,0.5086078639744952,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_formal_logic,acc,0.36507936507936506,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_european_history,acc,0.7090909090909091,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_us_history,acc,0.7401960784313726,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_world_history,acc,0.7721518987341772,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_international_law,acc,0.7107438016528925,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_jurisprudence,acc,0.6666666666666666,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_logical_fallacies,acc,0.7177914110429447,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_moral_disputes,acc,0.653179190751445,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_moral_scenarios,acc,0.24581005586592178,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_philosophy,acc,0.6430868167202572,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_prehistory,acc,0.6203703703703703,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_professional_law,acc,0.42633637548891784,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_world_religions,acc,0.7017543859649122,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_other,acc,0.6433859028001288,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_business_ethics,acc,0.54,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_clinical_knowledge,acc,0.6226415094339622,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_college_medicine,acc,0.6184971098265896,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_global_facts,acc,0.28,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_human_aging,acc,0.6143497757847534,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_management,acc,0.7864077669902912,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_marketing,acc,0.811965811965812,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_medical_genetics,acc,0.67,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_miscellaneous,acc,0.7726692209450831,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_nutrition,acc,0.6503267973856209,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_professional_accounting,acc,0.4326241134751773,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_professional_medicine,acc,0.5698529411764706,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_virology,acc,0.536144578313253,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_social_sciences,acc,0.6704582385440364,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_econometrics,acc,0.38596491228070173,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_geography,acc,0.7373737373737373,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_government_and_politics,acc,0.7927461139896373,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_macroeconomics,acc,0.6128205128205129,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_microeconomics,acc,0.5840336134453782,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_psychology,acc,0.8128440366972477,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_human_sexuality,acc,0.6870229007633588,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_professional_psychology,acc,0.5522875816993464,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_public_relations,acc,0.6727272727272727,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_security_studies,acc,0.6693877551020408,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_sociology,acc,0.7761194029850746,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_us_foreign_policy,acc,0.77,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_stem,acc,0.48525214081826834,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_abstract_algebra,acc,0.36,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_anatomy,acc,0.5185185185185185,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_astronomy,acc,0.5592105263157895,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_college_biology,acc,0.7013888888888888,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_college_chemistry,acc,0.44,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_college_computer_science,acc,0.44,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_college_mathematics,acc,0.36,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_college_physics,acc,0.3333333333333333,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_computer_security,acc,0.66,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_conceptual_physics,acc,0.4553191489361702,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_electrical_engineering,acc,0.5862068965517241,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_elementary_mathematics,acc,0.4126984126984127,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_biology,acc,0.7451612903225806,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_chemistry,acc,0.43842364532019706,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_computer_science,acc,0.61,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_mathematics,acc,0.37407407407407406,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_physics,acc,0.2582781456953642,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_high_school_statistics,acc,0.48148148148148145,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2-2b-it:Default (bf16/fp16),task_mmlu_machine_learning,acc,0.36607142857142855,Default (bf16/fp16),google/gemma-2-2b-it,5228683776 google/gemma-2b-it:Default (bf16/fp16),task_mmlu,acc,0.3812135023500926,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_humanities,acc,0.35430393198724763,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_formal_logic,acc,0.35714285714285715,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_european_history,acc,0.5212121212121212,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_us_history,acc,0.4264705882352941,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_world_history,acc,0.540084388185654,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_international_law,acc,0.5206611570247934,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_jurisprudence,acc,0.49074074074074076,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_logical_fallacies,acc,0.37423312883435583,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_moral_disputes,acc,0.41040462427745666,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_moral_scenarios,acc,0.2424581005586592,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_philosophy,acc,0.3408360128617363,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_prehistory,acc,0.37962962962962965,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_professional_law,acc,0.3109517601043025,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_world_religions,acc,0.4619883040935672,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_other,acc,0.4293530737045381,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_business_ethics,acc,0.44,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_clinical_knowledge,acc,0.41132075471698115,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_college_medicine,acc,0.3583815028901734,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_global_facts,acc,0.23,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_human_aging,acc,0.4484304932735426,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_management,acc,0.4854368932038835,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_marketing,acc,0.6025641025641025,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_medical_genetics,acc,0.4,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_miscellaneous,acc,0.4955300127713921,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_nutrition,acc,0.47058823529411764,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_professional_accounting,acc,0.31560283687943264,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_professional_medicine,acc,0.30514705882352944,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_virology,acc,0.3674698795180723,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_social_sciences,acc,0.4280142996425089,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_econometrics,acc,0.24561403508771928,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_geography,acc,0.4444444444444444,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_government_and_politics,acc,0.5077720207253886,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_macroeconomics,acc,0.3769230769230769,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_microeconomics,acc,0.3403361344537815,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_psychology,acc,0.5192660550458715,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_human_sexuality,acc,0.40458015267175573,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_professional_psychology,acc,0.3839869281045752,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_public_relations,acc,0.4090909090909091,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_security_studies,acc,0.3836734693877551,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_sociology,acc,0.5373134328358209,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_us_foreign_policy,acc,0.57,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_stem,acc,0.32825880114176975,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_abstract_algebra,acc,0.3,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_anatomy,acc,0.4,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_astronomy,acc,0.375,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_college_biology,acc,0.4444444444444444,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_college_chemistry,acc,0.3,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_college_computer_science,acc,0.37,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_college_mathematics,acc,0.32,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_college_physics,acc,0.18627450980392157,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_computer_security,acc,0.5,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_conceptual_physics,acc,0.33191489361702126,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_electrical_engineering,acc,0.4896551724137931,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_elementary_mathematics,acc,0.24603174603174602,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_biology,acc,0.44193548387096776,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_chemistry,acc,0.2857142857142857,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_computer_science,acc,0.37,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_mathematics,acc,0.2222222222222222,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_physics,acc,0.2847682119205298,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_high_school_statistics,acc,0.22685185185185186,Default (bf16/fp16),google/gemma-2b-it,5012344832 google/gemma-2b-it:Default (bf16/fp16),task_mmlu_machine_learning,acc,0.32142857142857145,Default (bf16/fp16),google/gemma-2b-it,5012344832 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_piqa,acc,0.5957562568008705,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_piqa,acc,0.5957562568008705,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu,acc,0.23394103404073494,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_humanities,acc,0.24654622741764082,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.23636363636363636,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.26582278481012656,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_international_law,acc,0.24793388429752067,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.25925925925925924,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.26993865030674846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.2543352601156069,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_philosophy,acc,0.22186495176848875,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_prehistory,acc,0.23765432098765432,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_law,acc,0.24445893089960888,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_world_religions,acc,0.2807017543859649,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_other,acc,0.2281943997425169,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.21,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.27167630057803466,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_global_facts,acc,0.15,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_aging,acc,0.17937219730941703,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_management,acc,0.33980582524271846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_marketing,acc,0.25213675213675213,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.31,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_nutrition,acc,0.21895424836601307,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.24113475177304963,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.17279411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_virology,acc,0.2891566265060241,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.23366915827104323,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_econometrics,acc,0.2543859649122807,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.26262626262626265,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.18652849740932642,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.22564102564102564,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.226890756302521,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.25321100917431194,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.2595419847328244,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.22712418300653595,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_public_relations,acc,0.2727272727272727,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_security_studies,acc,0.19183673469387755,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_sociology,acc,0.23383084577114427,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_stem,acc,0.2210593085949889,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_anatomy,acc,0.2074074074074074,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_astronomy,acc,0.2236842105263158,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_biology,acc,0.22916666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_physics,acc,0.23529411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_computer_security,acc,0.27,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.19574468085106383,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.2206896551724138,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.24867724867724866,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.2032258064516129,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.2,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.21851851851851853,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.23178807947019867,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.16666666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu,acc,0.23394103404073494,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_humanities,acc,0.24654622741764082,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.23636363636363636,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.26582278481012656,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_international_law,acc,0.24793388429752067,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.25925925925925924,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.26993865030674846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.2543352601156069,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_philosophy,acc,0.22186495176848875,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_prehistory,acc,0.23765432098765432,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_law,acc,0.24445893089960888,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_world_religions,acc,0.2807017543859649,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_other,acc,0.2281943997425169,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.21,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.27167630057803466,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_global_facts,acc,0.15,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_aging,acc,0.17937219730941703,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_management,acc,0.33980582524271846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_marketing,acc,0.25213675213675213,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.31,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_nutrition,acc,0.21895424836601307,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.24113475177304963,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.17279411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_virology,acc,0.2891566265060241,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.23366915827104323,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_econometrics,acc,0.2543859649122807,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.26262626262626265,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.18652849740932642,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.22564102564102564,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.226890756302521,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.25321100917431194,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.2595419847328244,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.22712418300653595,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_public_relations,acc,0.2727272727272727,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_security_studies,acc,0.19183673469387755,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_sociology,acc,0.23383084577114427,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_stem,acc,0.2210593085949889,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_anatomy,acc,0.2074074074074074,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_astronomy,acc,0.2236842105263158,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_biology,acc,0.22916666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_physics,acc,0.23529411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_computer_security,acc,0.27,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.19574468085106383,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.2206896551724138,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.24867724867724866,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.2032258064516129,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.2,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.21851851851851853,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.23178807947019867,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.16666666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_boolq,acc,0.8406727828746178,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.3383838383838384,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.31313131313131315,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.31684981684981683,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.32051282051282054,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_gpqa_main_n_shot,acc,0.3482142857142857,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.3236607142857143,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_FP8,task_logiqa,acc,0.31797235023041476,W8A8_FP8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu,acc,0.4585529126904999,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_humanities,acc,0.4257173219978746,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_formal_logic,acc,0.24603174603174602,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_european_history,acc,0.6,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_us_history,acc,0.6568627450980392,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_world_history,acc,0.6160337552742616,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_international_law,acc,0.5950413223140496,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_jurisprudence,acc,0.5462962962962963,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_logical_fallacies,acc,0.5644171779141104,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_disputes,acc,0.4913294797687861,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_scenarios,acc,0.2424581005586592,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_philosophy,acc,0.5305466237942122,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_prehistory,acc,0.5277777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_law,acc,0.34615384615384615,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_world_religions,acc,0.6783625730994152,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_other,acc,0.5448986160283231,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_business_ethics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.5283018867924528,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_medicine,acc,0.37572254335260113,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_global_facts,acc,0.4,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_aging,acc,0.5650224215246636,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_management,acc,0.6407766990291263,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_marketing,acc,0.7435897435897436,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_medical_genetics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_miscellaneous,acc,0.6922094508301405,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_nutrition,acc,0.5,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_accounting,acc,0.3546099290780142,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_medicine,acc,0.41544117647058826,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_virology,acc,0.4819277108433735,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_social_sciences,acc,0.5206369840753982,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_econometrics,acc,0.30701754385964913,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_geography,acc,0.5808080808080808,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.6683937823834197,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.38974358974358975,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.3697478991596639,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_psychology,acc,0.6128440366972477,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_sexuality,acc,0.5572519083969466,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_psychology,acc,0.4542483660130719,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_public_relations,acc,0.5454545454545454,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_security_studies,acc,0.4857142857142857,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_sociology,acc,0.7313432835820896,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.72,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_stem,acc,0.3618775769108785,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_abstract_algebra,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_anatomy,acc,0.4666666666666667,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_astronomy,acc,0.4934210526315789,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_biology,acc,0.4375,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_chemistry,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_computer_science,acc,0.34,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_mathematics,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_physics,acc,0.19607843137254902,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_computer_security,acc,0.61,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_conceptual_physics,acc,0.39574468085106385,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_electrical_engineering,acc,0.503448275862069,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.2724867724867725,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_biology,acc,0.5096774193548387,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.33497536945812806,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.38,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.2777777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_physics,acc,0.271523178807947,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_statistics,acc,0.25462962962962965,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_machine_learning,acc,0.33035714285714285,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu,acc,0.4585529126904999,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_humanities,acc,0.4257173219978746,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_formal_logic,acc,0.24603174603174602,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_european_history,acc,0.6,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_us_history,acc,0.6568627450980392,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_world_history,acc,0.6160337552742616,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_international_law,acc,0.5950413223140496,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_jurisprudence,acc,0.5462962962962963,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_logical_fallacies,acc,0.5644171779141104,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_disputes,acc,0.4913294797687861,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_scenarios,acc,0.2424581005586592,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_philosophy,acc,0.5305466237942122,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_prehistory,acc,0.5277777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_law,acc,0.34615384615384615,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_world_religions,acc,0.6783625730994152,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_other,acc,0.5448986160283231,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_business_ethics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.5283018867924528,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_medicine,acc,0.37572254335260113,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_global_facts,acc,0.4,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_aging,acc,0.5650224215246636,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_management,acc,0.6407766990291263,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_marketing,acc,0.7435897435897436,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_medical_genetics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_miscellaneous,acc,0.6922094508301405,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_nutrition,acc,0.5,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_accounting,acc,0.3546099290780142,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_medicine,acc,0.41544117647058826,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_virology,acc,0.4819277108433735,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_social_sciences,acc,0.5206369840753982,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_econometrics,acc,0.30701754385964913,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_geography,acc,0.5808080808080808,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.6683937823834197,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.38974358974358975,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.3697478991596639,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_psychology,acc,0.6128440366972477,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_sexuality,acc,0.5572519083969466,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_psychology,acc,0.4542483660130719,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_public_relations,acc,0.5454545454545454,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_security_studies,acc,0.4857142857142857,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_sociology,acc,0.7313432835820896,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.72,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_stem,acc,0.3618775769108785,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_abstract_algebra,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_anatomy,acc,0.4666666666666667,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_astronomy,acc,0.4934210526315789,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_biology,acc,0.4375,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_chemistry,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_computer_science,acc,0.34,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_mathematics,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_physics,acc,0.19607843137254902,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_computer_security,acc,0.61,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_conceptual_physics,acc,0.39574468085106385,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_electrical_engineering,acc,0.503448275862069,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.2724867724867725,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_biology,acc,0.5096774193548387,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.33497536945812806,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.38,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.2777777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_physics,acc,0.271523178807947,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_statistics,acc,0.25462962962962965,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_machine_learning,acc,0.33035714285714285,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_gpqa_diamond_zeroshot,acc,0.23737373737373738,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_gpqa_extended_n_shot,acc,0.27106227106227104,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_gpqa_extended_zeroshot,acc,0.25824175824175827,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_gpqa_main_n_shot,acc,0.30580357142857145,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_gpqa_main_zeroshot,acc,0.23883928571428573,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_boolq,acc,0.8021406727828746,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_logiqa,acc,0.27035330261136714,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_openbookqa,acc,0.332,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_truthfulqa_mc1,acc,0.2962056303549572,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_truthfulqa_mc2,acc,0.44121470505156096,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_boolq,acc,0.8021406727828746,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_logiqa,acc,0.27035330261136714,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_piqa,acc,0.764417845484222,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_openbookqa,acc,0.332,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu,acc,0.4585529126904999,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_humanities,acc,0.4257173219978746,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_formal_logic,acc,0.24603174603174602,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_european_history,acc,0.6,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_us_history,acc,0.6568627450980392,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_world_history,acc,0.6160337552742616,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_international_law,acc,0.5950413223140496,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_jurisprudence,acc,0.5462962962962963,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_logical_fallacies,acc,0.5644171779141104,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_disputes,acc,0.4913294797687861,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_scenarios,acc,0.2424581005586592,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_philosophy,acc,0.5305466237942122,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_prehistory,acc,0.5277777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_law,acc,0.34615384615384615,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_world_religions,acc,0.6783625730994152,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_other,acc,0.5448986160283231,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_business_ethics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.5283018867924528,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_medicine,acc,0.37572254335260113,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_global_facts,acc,0.4,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_aging,acc,0.5650224215246636,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_management,acc,0.6407766990291263,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_marketing,acc,0.7435897435897436,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_medical_genetics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_miscellaneous,acc,0.6922094508301405,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_nutrition,acc,0.5,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_accounting,acc,0.3546099290780142,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_medicine,acc,0.41544117647058826,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_virology,acc,0.4819277108433735,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_social_sciences,acc,0.5206369840753982,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_econometrics,acc,0.30701754385964913,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_geography,acc,0.5808080808080808,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.6683937823834197,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.38974358974358975,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.3697478991596639,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_psychology,acc,0.6128440366972477,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_sexuality,acc,0.5572519083969466,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_psychology,acc,0.4542483660130719,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_public_relations,acc,0.5454545454545454,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_security_studies,acc,0.4857142857142857,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_sociology,acc,0.7313432835820896,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.72,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_stem,acc,0.3618775769108785,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_abstract_algebra,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_anatomy,acc,0.4666666666666667,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_astronomy,acc,0.4934210526315789,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_biology,acc,0.4375,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_chemistry,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_computer_science,acc,0.34,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_mathematics,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_physics,acc,0.19607843137254902,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_computer_security,acc,0.61,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_conceptual_physics,acc,0.39574468085106385,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_electrical_engineering,acc,0.503448275862069,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.2724867724867725,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_biology,acc,0.5096774193548387,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.33497536945812806,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.38,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.2777777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_physics,acc,0.271523178807947,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_statistics,acc,0.25462962962962965,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_machine_learning,acc,0.33035714285714285,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_boolq,acc,0.8021406727828746,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_logiqa,acc,0.27035330261136714,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_openbookqa,acc,0.332,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_piqa,acc,0.764417845484222,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_truthfulqa_mc1,acc,0.2962056303549572,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_truthfulqa_mc2,acc,0.44121470505156096,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_truthfulqa_mc1,acc,0.2962056303549572,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_truthfulqa_mc2,acc,0.44121470505156096,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu,acc,0.4585529126904999,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_humanities,acc,0.4257173219978746,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_formal_logic,acc,0.24603174603174602,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_european_history,acc,0.6,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_us_history,acc,0.6568627450980392,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_world_history,acc,0.6160337552742616,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_international_law,acc,0.5950413223140496,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_jurisprudence,acc,0.5462962962962963,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_logical_fallacies,acc,0.5644171779141104,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_disputes,acc,0.4913294797687861,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_moral_scenarios,acc,0.2424581005586592,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_philosophy,acc,0.5305466237942122,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_prehistory,acc,0.5277777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_law,acc,0.34615384615384615,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_world_religions,acc,0.6783625730994152,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_other,acc,0.5448986160283231,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_business_ethics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.5283018867924528,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_medicine,acc,0.37572254335260113,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_global_facts,acc,0.4,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_aging,acc,0.5650224215246636,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_management,acc,0.6407766990291263,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_marketing,acc,0.7435897435897436,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_medical_genetics,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_miscellaneous,acc,0.6922094508301405,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_nutrition,acc,0.5,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_accounting,acc,0.3546099290780142,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_medicine,acc,0.41544117647058826,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_virology,acc,0.4819277108433735,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_social_sciences,acc,0.5206369840753982,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_econometrics,acc,0.30701754385964913,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_geography,acc,0.5808080808080808,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.6683937823834197,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.38974358974358975,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.3697478991596639,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_psychology,acc,0.6128440366972477,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_human_sexuality,acc,0.5572519083969466,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_professional_psychology,acc,0.4542483660130719,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_public_relations,acc,0.5454545454545454,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_security_studies,acc,0.4857142857142857,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_sociology,acc,0.7313432835820896,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.72,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_stem,acc,0.3618775769108785,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_abstract_algebra,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_anatomy,acc,0.4666666666666667,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_astronomy,acc,0.4934210526315789,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_biology,acc,0.4375,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_chemistry,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_computer_science,acc,0.34,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_mathematics,acc,0.28,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_college_physics,acc,0.19607843137254902,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_computer_security,acc,0.61,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_conceptual_physics,acc,0.39574468085106385,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_electrical_engineering,acc,0.503448275862069,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.2724867724867725,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_biology,acc,0.5096774193548387,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.33497536945812806,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.38,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.2777777777777778,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_physics,acc,0.271523178807947,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_high_school_statistics,acc,0.25462962962962965,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_int8,task_mmlu_machine_learning,acc,0.33035714285714285,W8A8_int8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_int8,6476005376 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_boolq,acc,0.8314984709480122,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.3333333333333333,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.30808080808080807,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.3076923076923077,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.304029304029304,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_gpqa_main_n_shot,acc,0.3013392857142857,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.31026785714285715,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_FP8,task_logiqa,acc,0.27035330261136714,W8A8_FP8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_FP8,9083953152 google/gemma-2-2b-it:W4A16,task_boolq,acc,0.8333333333333334,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_piqa,acc,0.780739934711643,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_humanities,acc,0.491817215727949,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_formal_logic,acc,0.3412698412698413,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_european_history,acc,0.7272727272727273,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_us_history,acc,0.7450980392156863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_world_history,acc,0.7468354430379747,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_international_law,acc,0.6942148760330579,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_jurisprudence,acc,0.6296296296296297,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_logical_fallacies,acc,0.6809815950920245,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_moral_disputes,acc,0.5982658959537572,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_philosophy,acc,0.6205787781350482,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_prehistory,acc,0.595679012345679,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_law,acc,0.41134289439374183,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_world_religions,acc,0.7134502923976608,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_other,acc,0.618925008046347,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_business_ethics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_clinical_knowledge,acc,0.6,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_medicine,acc,0.5838150289017341,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_global_facts,acc,0.29,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_human_aging,acc,0.5560538116591929,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_management,acc,0.7961165048543689,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_marketing,acc,0.7863247863247863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_medical_genetics,acc,0.61,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_miscellaneous,acc,0.7535121328224776,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_nutrition,acc,0.6437908496732027,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_accounting,acc,0.3971631205673759,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_medicine,acc,0.5625,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_virology,acc,0.4879518072289157,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_social_sciences,acc,0.6564835879103023,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_econometrics,acc,0.3508771929824561,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_geography,acc,0.7373737373737373,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_government_and_politics,acc,0.772020725388601,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_macroeconomics,acc,0.5897435897435898,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_microeconomics,acc,0.5714285714285714,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_psychology,acc,0.8073394495412844,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_human_sexuality,acc,0.6564885496183206,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_psychology,acc,0.5392156862745098,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_public_relations,acc,0.6454545454545455,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_security_studies,acc,0.6653061224489796,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_sociology,acc,0.746268656716418,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_us_foreign_policy,acc,0.79,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_stem,acc,0.4865207738661592,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_abstract_algebra,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_anatomy,acc,0.5555555555555556,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_astronomy,acc,0.5986842105263158,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_biology,acc,0.6944444444444444,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_chemistry,acc,0.44,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_computer_science,acc,0.47,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_mathematics,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_physics,acc,0.3137254901960784,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_computer_security,acc,0.68,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_conceptual_physics,acc,0.4297872340425532,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_electrical_engineering,acc,0.5586206896551724,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_elementary_mathematics,acc,0.42063492063492064,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_biology,acc,0.7322580645161291,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_chemistry,acc,0.4236453201970443,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_computer_science,acc,0.59,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_mathematics,acc,0.34814814814814815,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_physics,acc,0.31125827814569534,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_statistics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_machine_learning,acc,0.36607142857142855,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_boolq,acc,0.8333333333333334,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_piqa,acc,0.780739934711643,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_boolq,acc,0.8333333333333334,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_humanities,acc,0.491817215727949,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_formal_logic,acc,0.3412698412698413,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_european_history,acc,0.7272727272727273,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_us_history,acc,0.7450980392156863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_world_history,acc,0.7468354430379747,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_international_law,acc,0.6942148760330579,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_jurisprudence,acc,0.6296296296296297,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_logical_fallacies,acc,0.6809815950920245,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_moral_disputes,acc,0.5982658959537572,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_philosophy,acc,0.6205787781350482,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_prehistory,acc,0.595679012345679,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_law,acc,0.41134289439374183,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_world_religions,acc,0.7134502923976608,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_other,acc,0.618925008046347,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_business_ethics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_clinical_knowledge,acc,0.6,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_medicine,acc,0.5838150289017341,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_global_facts,acc,0.29,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_human_aging,acc,0.5560538116591929,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_management,acc,0.7961165048543689,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_marketing,acc,0.7863247863247863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_medical_genetics,acc,0.61,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_miscellaneous,acc,0.7535121328224776,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_nutrition,acc,0.6437908496732027,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_accounting,acc,0.3971631205673759,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_medicine,acc,0.5625,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_virology,acc,0.4879518072289157,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_social_sciences,acc,0.6564835879103023,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_econometrics,acc,0.3508771929824561,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_geography,acc,0.7373737373737373,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_government_and_politics,acc,0.772020725388601,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_macroeconomics,acc,0.5897435897435898,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_microeconomics,acc,0.5714285714285714,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_psychology,acc,0.8073394495412844,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_human_sexuality,acc,0.6564885496183206,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_professional_psychology,acc,0.5392156862745098,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_public_relations,acc,0.6454545454545455,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_security_studies,acc,0.6653061224489796,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_sociology,acc,0.746268656716418,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_us_foreign_policy,acc,0.79,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_stem,acc,0.4865207738661592,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_abstract_algebra,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_anatomy,acc,0.5555555555555556,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_astronomy,acc,0.5986842105263158,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_biology,acc,0.6944444444444444,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_chemistry,acc,0.44,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_computer_science,acc,0.47,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_mathematics,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_college_physics,acc,0.3137254901960784,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_computer_security,acc,0.68,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_conceptual_physics,acc,0.4297872340425532,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_electrical_engineering,acc,0.5586206896551724,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_elementary_mathematics,acc,0.42063492063492064,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_biology,acc,0.7322580645161291,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_chemistry,acc,0.4236453201970443,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_computer_science,acc,0.59,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_mathematics,acc,0.34814814814814815,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_physics,acc,0.31125827814569534,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_high_school_statistics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_mmlu_machine_learning,acc,0.36607142857142855,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048 meta-llama/Llama-2-7b-chat-hf:W4A16,task_truthfulqa_mc1,acc,0.29008567931456547,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_truthfulqa_mc2,acc,0.4573321156241587,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_boolq,acc,0.7889908256880734,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_logiqa,acc,0.2519201228878648,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_openbookqa,acc,0.326,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_truthfulqa_mc1,acc,0.29008567931456547,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_truthfulqa_mc2,acc,0.45601374796274113,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_boolq,acc,0.7889908256880734,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_logiqa,acc,0.2519201228878648,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_piqa,acc,0.7611534276387377,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu,acc,0.45492095143142003,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_humanities,acc,0.42359192348565355,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_formal_logic,acc,0.2619047619047619,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_european_history,acc,0.5818181818181818,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_us_history,acc,0.6519607843137255,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_world_history,acc,0.5949367088607594,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_international_law,acc,0.5785123966942148,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_jurisprudence,acc,0.5462962962962963,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_logical_fallacies,acc,0.5766871165644172,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_moral_disputes,acc,0.4797687861271676,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_moral_scenarios,acc,0.2424581005586592,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_philosophy,acc,0.5305466237942122,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_prehistory,acc,0.5370370370370371,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_law,acc,0.34485006518904826,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_world_religions,acc,0.6783625730994152,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_other,acc,0.5345992919214676,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_business_ethics,acc,0.47,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_clinical_knowledge,acc,0.5358490566037736,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_medicine,acc,0.3699421965317919,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_global_facts,acc,0.4,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_human_aging,acc,0.5874439461883408,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_management,acc,0.6019417475728155,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_marketing,acc,0.7222222222222222,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_medical_genetics,acc,0.45,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_miscellaneous,acc,0.6615581098339719,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_nutrition,acc,0.477124183006536,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_accounting,acc,0.36524822695035464,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_medicine,acc,0.43014705882352944,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_virology,acc,0.463855421686747,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_social_sciences,acc,0.5212869678258043,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_econometrics,acc,0.2894736842105263,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_geography,acc,0.6060606060606061,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_government_and_politics,acc,0.689119170984456,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_macroeconomics,acc,0.38974358974358975,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_microeconomics,acc,0.35714285714285715,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_psychology,acc,0.5944954128440367,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_human_sexuality,acc,0.5648854961832062,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_psychology,acc,0.4411764705882353,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_public_relations,acc,0.5363636363636364,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_security_studies,acc,0.5387755102040817,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_sociology,acc,0.746268656716418,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_us_foreign_policy,acc,0.72,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_stem,acc,0.35838883602917854,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_abstract_algebra,acc,0.28,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_anatomy,acc,0.48148148148148145,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_astronomy,acc,0.45394736842105265,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_biology,acc,0.4722222222222222,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_chemistry,acc,0.24,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_computer_science,acc,0.29,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_mathematics,acc,0.33,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_physics,acc,0.22549019607843138,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_computer_security,acc,0.55,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_conceptual_physics,acc,0.3617021276595745,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_electrical_engineering,acc,0.46206896551724136,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_elementary_mathematics,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_biology,acc,0.5096774193548387,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_chemistry,acc,0.32019704433497537,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_computer_science,acc,0.44,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_mathematics,acc,0.25925925925925924,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_physics,acc,0.2847682119205298,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_statistics,acc,0.2638888888888889,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_machine_learning,acc,0.375,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu,acc,0.45492095143142003,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_humanities,acc,0.42359192348565355,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_formal_logic,acc,0.2619047619047619,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_european_history,acc,0.5818181818181818,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_us_history,acc,0.6519607843137255,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_world_history,acc,0.5949367088607594,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_international_law,acc,0.5785123966942148,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_jurisprudence,acc,0.5462962962962963,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_logical_fallacies,acc,0.5766871165644172,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_moral_disputes,acc,0.4797687861271676,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_moral_scenarios,acc,0.2424581005586592,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_philosophy,acc,0.5305466237942122,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_prehistory,acc,0.5370370370370371,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_law,acc,0.34485006518904826,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_world_religions,acc,0.6783625730994152,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_other,acc,0.5345992919214676,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_business_ethics,acc,0.47,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_clinical_knowledge,acc,0.5358490566037736,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_medicine,acc,0.3699421965317919,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_global_facts,acc,0.4,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_human_aging,acc,0.5874439461883408,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_management,acc,0.6019417475728155,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_marketing,acc,0.7222222222222222,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_medical_genetics,acc,0.45,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_miscellaneous,acc,0.6615581098339719,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_nutrition,acc,0.477124183006536,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_accounting,acc,0.36524822695035464,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_medicine,acc,0.43014705882352944,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_virology,acc,0.463855421686747,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_social_sciences,acc,0.5212869678258043,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_econometrics,acc,0.2894736842105263,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_geography,acc,0.6060606060606061,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_government_and_politics,acc,0.689119170984456,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_macroeconomics,acc,0.38974358974358975,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_microeconomics,acc,0.35714285714285715,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_psychology,acc,0.5944954128440367,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_human_sexuality,acc,0.5648854961832062,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_professional_psychology,acc,0.4411764705882353,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_public_relations,acc,0.5363636363636364,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_security_studies,acc,0.5387755102040817,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_sociology,acc,0.746268656716418,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_us_foreign_policy,acc,0.72,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_stem,acc,0.35838883602917854,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_abstract_algebra,acc,0.28,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_anatomy,acc,0.48148148148148145,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_astronomy,acc,0.45394736842105265,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_biology,acc,0.4722222222222222,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_chemistry,acc,0.24,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_computer_science,acc,0.29,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_mathematics,acc,0.33,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_college_physics,acc,0.22549019607843138,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_computer_security,acc,0.55,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_conceptual_physics,acc,0.3617021276595745,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_electrical_engineering,acc,0.46206896551724136,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_elementary_mathematics,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_biology,acc,0.5096774193548387,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_chemistry,acc,0.32019704433497537,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_computer_science,acc,0.44,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_mathematics,acc,0.25925925925925924,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_physics,acc,0.2847682119205298,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_high_school_statistics,acc,0.2638888888888889,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_mmlu_machine_learning,acc,0.375,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_boolq,acc,0.7889908256880734,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_logiqa,acc,0.2519201228878648,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_openbookqa,acc,0.326,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_piqa,acc,0.7611534276387377,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_truthfulqa_mc1,acc,0.29008567931456547,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-2-7b-chat-hf:W4A16,task_truthfulqa_mc2,acc,0.45601374796274113,W4A16,espressor/meta-llama.Llama-2-7b-chat-hf_W4A16,3238006272 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_boolq,acc,0.5339449541284403,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_logiqa,acc,0.23195084485407066,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_piqa,acc,0.5729053318824809,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu,acc,0.2800170915823957,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_humanities,acc,0.27013815090329435,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.25396825396825395,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.23636363636363636,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.22549019607843138,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.23628691983122363,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_international_law,acc,0.24793388429752067,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.31901840490797545,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.2976878612716763,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.24022346368715083,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_philosophy,acc,0.3054662379421222,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_prehistory,acc,0.24382716049382716,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_law,acc,0.2803129074315515,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_world_religions,acc,0.3742690058479532,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_other,acc,0.3064048921789508,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.31,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.30943396226415093,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.3179190751445087,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_global_facts,acc,0.33,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_human_aging,acc,0.3452914798206278,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_management,acc,0.32038834951456313,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_marketing,acc,0.37606837606837606,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.27,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.29246487867177523,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_nutrition,acc,0.2647058823529412,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.2765957446808511,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.29411764705882354,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_virology,acc,0.3493975903614458,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.2804679883002925,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_econometrics,acc,0.19298245614035087,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.22727272727272727,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.27461139896373055,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.23076923076923078,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.24789915966386555,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.30458715596330277,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.2900763358778626,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.315359477124183,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_public_relations,acc,0.2727272727272727,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_security_studies,acc,0.20816326530612245,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_sociology,acc,0.3582089552238806,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.44,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_stem,acc,0.26831588962892483,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.18,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_anatomy,acc,0.22962962962962963,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_astronomy,acc,0.2631578947368421,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_biology,acc,0.3125,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.18,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.29,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_physics,acc,0.27450980392156865,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_computer_security,acc,0.3,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.30638297872340425,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.33793103448275863,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.2222222222222222,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.2903225806451613,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.33497536945812806,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.28,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.23178807947019867,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.24537037037037038,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2631578947368421,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.48418137284368573,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu,acc,0.2800170915823957,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_humanities,acc,0.27013815090329435,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.25396825396825395,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.23636363636363636,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.22549019607843138,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.23628691983122363,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_international_law,acc,0.24793388429752067,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.31901840490797545,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.2976878612716763,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.24022346368715083,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_philosophy,acc,0.3054662379421222,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_prehistory,acc,0.24382716049382716,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_law,acc,0.2803129074315515,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_world_religions,acc,0.3742690058479532,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_other,acc,0.3064048921789508,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.31,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.30943396226415093,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.3179190751445087,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_global_facts,acc,0.33,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_human_aging,acc,0.3452914798206278,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_management,acc,0.32038834951456313,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_marketing,acc,0.37606837606837606,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.27,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.29246487867177523,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_nutrition,acc,0.2647058823529412,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.2765957446808511,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.29411764705882354,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_virology,acc,0.3493975903614458,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.2804679883002925,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_econometrics,acc,0.19298245614035087,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.22727272727272727,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.27461139896373055,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.23076923076923078,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.24789915966386555,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.30458715596330277,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.2900763358778626,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.315359477124183,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_public_relations,acc,0.2727272727272727,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_security_studies,acc,0.20816326530612245,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_sociology,acc,0.3582089552238806,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.44,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_stem,acc,0.26831588962892483,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.18,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_anatomy,acc,0.22962962962962963,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_astronomy,acc,0.2631578947368421,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_biology,acc,0.3125,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.18,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.29,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_college_physics,acc,0.27450980392156865,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_computer_security,acc,0.3,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.30638297872340425,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.33793103448275863,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.2222222222222222,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.2903225806451613,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.33497536945812806,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.28,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.23178807947019867,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.24537037037037038,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.2-1B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-1B-Instruct_W4A16,1552553728 meta-llama/Llama-3.1-8B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.3378212974296206,W4A16,espressor/meta-llama.Llama-3.1-8B-Instruct_W4A16,5700595200 meta-llama/Llama-3.1-8B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.5051760429703329,W4A16,espressor/meta-llama.Llama-3.1-8B-Instruct_W4A16,5700595200 meta-llama/Llama-3.1-8B-Instruct:W4A16,task_boolq,acc,0.8186544342507646,W4A16,espressor/meta-llama.Llama-3.1-8B-Instruct_W4A16,5700595200 meta-llama/Llama-3.1-8B-Instruct:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/meta-llama.Llama-3.1-8B-Instruct_W4A16,5700595200 meta-llama/Llama-3.1-8B-Instruct:W4A16,task_piqa,acc,0.7818280739934712,W4A16,espressor/meta-llama.Llama-3.1-8B-Instruct_W4A16,5700595200 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_boolq,acc,0.7948012232415902,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.25757575757575757,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.27472527472527475,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.2564102564102564,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_main_n_shot,acc,0.3013392857142857,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.25223214285714285,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_logiqa,acc,0.2749615975422427,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu,acc,0.4600484261501211,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_humanities,acc,0.42869287991498406,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_formal_logic,acc,0.2619047619047619,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.5636363636363636,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.6568627450980392,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.6244725738396625,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_international_law,acc,0.6033057851239669,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_jurisprudence,acc,0.5648148148148148,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.5766871165644172,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_moral_disputes,acc,0.4797687861271676,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.2424581005586592,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_philosophy,acc,0.5241157556270096,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_prehistory,acc,0.5462962962962963,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_professional_law,acc,0.3513689700130378,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_world_religions,acc,0.695906432748538,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_other,acc,0.5455423237850016,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_business_ethics,acc,0.48,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.5320754716981132,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_college_medicine,acc,0.3988439306358382,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_global_facts,acc,0.38,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_human_aging,acc,0.5829596412556054,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_management,acc,0.6796116504854369,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_marketing,acc,0.7435897435897436,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_medical_genetics,acc,0.48,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_miscellaneous,acc,0.6871008939974457,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_nutrition,acc,0.49019607843137253,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_professional_accounting,acc,0.37943262411347517,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_professional_medicine,acc,0.4007352941176471,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_virology,acc,0.4397590361445783,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_social_sciences,acc,0.525836854078648,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_econometrics,acc,0.2894736842105263,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_geography,acc,0.5757575757575758,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.6632124352331606,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.3923076923076923,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.36134453781512604,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.6238532110091743,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_human_sexuality,acc,0.5801526717557252,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_professional_psychology,acc,0.46568627450980393,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_public_relations,acc,0.5272727272727272,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_security_studies,acc,0.5061224489795918,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_sociology,acc,0.7412935323383084,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.72,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_stem,acc,0.35838883602917854,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.3,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_anatomy,acc,0.4666666666666667,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_astronomy,acc,0.4868421052631579,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_college_biology,acc,0.4375,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_college_chemistry,acc,0.25,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_college_computer_science,acc,0.32,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_college_mathematics,acc,0.32,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_college_physics,acc,0.23529411764705882,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_computer_security,acc,0.6,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.4,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.4482758620689655,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.2698412698412698,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_biology,acc,0.4806451612903226,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.3448275862068966,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.39,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.26296296296296295,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_physics,acc,0.2582781456953642,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.26851851851851855,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_mmlu_machine_learning,acc,0.35714285714285715,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_openbookqa,acc,0.334,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_piqa,acc,0.764417845484222,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_truthfulqa_mc1,acc,0.29498164014687883,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_truthfulqa_mc2,acc,0.4506984874530874,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_boolq,acc,0.7948012232415902,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.25757575757575757,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.27472527472527475,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.2564102564102564,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_main_n_shot,acc,0.3013392857142857,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.25223214285714285,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-2-7b-chat-hf:W8A8_FP8,task_logiqa,acc,0.2749615975422427,W8A8_FP8,espressor/meta-llama.Llama-2-7b-chat-hf_W8A8_FP8,6476005376 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_boolq,acc,0.8403669724770643,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_logiqa,acc,0.30414746543778803,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_openbookqa,acc,0.346,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_piqa,acc,0.8008705114254625,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_truthfulqa_mc1,acc,0.3659730722154223,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_truthfulqa_mc2,acc,0.5392220169800028,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_boolq,acc,0.8403669724770643,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_logiqa,acc,0.30414746543778803,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_piqa,acc,0.8008705114254625,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_boolq,acc,0.8403669724770643,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_logiqa,acc,0.30414746543778803,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_openbookqa,acc,0.346,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_truthfulqa_mc1,acc,0.3659730722154223,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_truthfulqa_mc2,acc,0.5392220169800028,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu,acc,0.6754023643355648,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_humanities,acc,0.638682252922423,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_formal_logic,acc,0.46825396825396826,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_european_history,acc,0.7515151515151515,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_us_history,acc,0.8186274509803921,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_world_history,acc,0.8481012658227848,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_international_law,acc,0.7933884297520661,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_jurisprudence,acc,0.7685185185185185,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_logical_fallacies,acc,0.7791411042944786,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_moral_disputes,acc,0.7196531791907514,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_moral_scenarios,acc,0.5899441340782123,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_philosophy,acc,0.7202572347266881,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_prehistory,acc,0.7530864197530864,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_law,acc,0.49869621903520206,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_world_religions,acc,0.8070175438596491,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_other,acc,0.7396202124235597,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_business_ethics,acc,0.69,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.7622641509433963,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_medicine,acc,0.6878612716763006,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_global_facts,acc,0.41,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_human_aging,acc,0.6681614349775785,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_management,acc,0.8349514563106796,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_marketing,acc,0.8888888888888888,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_medical_genetics,acc,0.81,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_miscellaneous,acc,0.8403575989782887,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_nutrition,acc,0.7679738562091504,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_accounting,acc,0.5531914893617021,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_medicine,acc,0.7647058823529411,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_virology,acc,0.5180722891566265,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_social_sciences,acc,0.7647058823529411,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_econometrics,acc,0.5087719298245614,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_geography,acc,0.7929292929292929,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.8601036269430051,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.6794871794871795,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.7773109243697479,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_psychology,acc,0.8532110091743119,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_human_sexuality,acc,0.8091603053435115,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_psychology,acc,0.7173202614379085,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_public_relations,acc,0.6636363636363637,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_security_studies,acc,0.7551020408163265,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_sociology,acc,0.8407960199004975,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.85,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_stem,acc,0.5797653028861401,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_abstract_algebra,acc,0.35,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_anatomy,acc,0.7037037037037037,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_astronomy,acc,0.7763157894736842,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_biology,acc,0.8055555555555556,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_chemistry,acc,0.46,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_computer_science,acc,0.52,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_mathematics,acc,0.35,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_physics,acc,0.4019607843137255,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_computer_security,acc,0.74,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_conceptual_physics,acc,0.6042553191489362,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_electrical_engineering,acc,0.6413793103448275,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.48677248677248675,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_biology,acc,0.8129032258064516,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.6157635467980296,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.72,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.4,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_physics,acc,0.44370860927152317,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_statistics,acc,0.5416666666666666,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_machine_learning,acc,0.5,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_openbookqa,acc,0.346,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_truthfulqa_mc1,acc,0.3659730722154223,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_truthfulqa_mc2,acc,0.5392220169800028,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu,acc,0.6754023643355648,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_humanities,acc,0.638682252922423,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_formal_logic,acc,0.46825396825396826,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_european_history,acc,0.7515151515151515,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_us_history,acc,0.8186274509803921,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_world_history,acc,0.8481012658227848,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_international_law,acc,0.7933884297520661,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_jurisprudence,acc,0.7685185185185185,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_logical_fallacies,acc,0.7791411042944786,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_moral_disputes,acc,0.7196531791907514,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_moral_scenarios,acc,0.5899441340782123,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_philosophy,acc,0.7202572347266881,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_prehistory,acc,0.7530864197530864,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_law,acc,0.49869621903520206,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_world_religions,acc,0.8070175438596491,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_other,acc,0.7396202124235597,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_business_ethics,acc,0.69,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.7622641509433963,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_medicine,acc,0.6878612716763006,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_global_facts,acc,0.41,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_human_aging,acc,0.6681614349775785,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_management,acc,0.8349514563106796,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_marketing,acc,0.8888888888888888,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_medical_genetics,acc,0.81,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_miscellaneous,acc,0.8403575989782887,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_nutrition,acc,0.7679738562091504,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_accounting,acc,0.5531914893617021,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_medicine,acc,0.7647058823529411,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_virology,acc,0.5180722891566265,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_social_sciences,acc,0.7647058823529411,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_econometrics,acc,0.5087719298245614,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_geography,acc,0.7929292929292929,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.8601036269430051,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.6794871794871795,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.7773109243697479,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_psychology,acc,0.8532110091743119,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_human_sexuality,acc,0.8091603053435115,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_professional_psychology,acc,0.7173202614379085,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_public_relations,acc,0.6636363636363637,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_security_studies,acc,0.7551020408163265,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_sociology,acc,0.8407960199004975,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.85,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_stem,acc,0.5797653028861401,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_abstract_algebra,acc,0.35,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_anatomy,acc,0.7037037037037037,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_astronomy,acc,0.7763157894736842,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_biology,acc,0.8055555555555556,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_chemistry,acc,0.46,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_computer_science,acc,0.52,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_mathematics,acc,0.35,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_college_physics,acc,0.4019607843137255,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_computer_security,acc,0.74,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_conceptual_physics,acc,0.6042553191489362,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_electrical_engineering,acc,0.6413793103448275,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.48677248677248675,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_biology,acc,0.8129032258064516,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.6157635467980296,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.72,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.4,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_physics,acc,0.44370860927152317,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_high_school_statistics,acc,0.5416666666666666,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 meta-llama/Llama-3.1-8B-Instruct:W8A8_int8,task_mmlu_machine_learning,acc,0.5,W8A8_int8,espressor/meta-llama.Llama-3.1-8B-Instruct_W8A8_int8,9083953152 google/gemma-2b-it:W4A16,task_boolq,acc,0.6232415902140673,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_logiqa,acc,0.2488479262672811,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_openbookqa,acc,0.338,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_piqa,acc,0.7453754080522307,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_truthfulqa_mc1,acc,0.29253365973072215,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_truthfulqa_mc2,acc,0.4539681140918823,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_boolq,acc,0.6232415902140673,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_logiqa,acc,0.2488479262672811,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_piqa,acc,0.7453754080522307,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_boolq,acc,0.6232415902140673,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_logiqa,acc,0.2488479262672811,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_openbookqa,acc,0.338,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_truthfulqa_mc1,acc,0.29253365973072215,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_truthfulqa_mc2,acc,0.4539681140918823,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_truthfulqa_mc1,acc,0.29253365973072215,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_truthfulqa_mc2,acc,0.4539681140918823,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu,acc,0.3748753738783649,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_humanities,acc,0.3564293304994687,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_formal_logic,acc,0.36507936507936506,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_european_history,acc,0.5212121212121212,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_us_history,acc,0.4264705882352941,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_world_history,acc,0.5232067510548524,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_international_law,acc,0.512396694214876,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_jurisprudence,acc,0.46296296296296297,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_logical_fallacies,acc,0.4049079754601227,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_moral_disputes,acc,0.40173410404624277,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_moral_scenarios,acc,0.24804469273743016,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_philosophy,acc,0.3536977491961415,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_prehistory,acc,0.3888888888888889,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_law,acc,0.31421121251629724,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_world_religions,acc,0.4502923976608187,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_other,acc,0.42645638879948505,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_business_ethics,acc,0.48,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_clinical_knowledge,acc,0.4,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_medicine,acc,0.3699421965317919,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_global_facts,acc,0.23,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_human_aging,acc,0.4484304932735426,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_management,acc,0.49514563106796117,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_marketing,acc,0.6068376068376068,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_medical_genetics,acc,0.38,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_miscellaneous,acc,0.4827586206896552,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_nutrition,acc,0.4477124183006536,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_accounting,acc,0.32269503546099293,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_medicine,acc,0.3235294117647059,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_virology,acc,0.35542168674698793,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_social_sciences,acc,0.41501462463438415,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_econometrics,acc,0.22807017543859648,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_geography,acc,0.45454545454545453,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_government_and_politics,acc,0.48704663212435234,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_macroeconomics,acc,0.36153846153846153,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_microeconomics,acc,0.31512605042016806,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_psychology,acc,0.5155963302752293,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_human_sexuality,acc,0.4351145038167939,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_psychology,acc,0.3790849673202614,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_public_relations,acc,0.4090909090909091,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_security_studies,acc,0.34285714285714286,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_sociology,acc,0.48756218905472637,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_us_foreign_policy,acc,0.54,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_stem,acc,0.31240088804313354,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_abstract_algebra,acc,0.29,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_anatomy,acc,0.4,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_astronomy,acc,0.3684210526315789,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_biology,acc,0.3888888888888889,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_chemistry,acc,0.31,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_computer_science,acc,0.35,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_mathematics,acc,0.3,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_physics,acc,0.16666666666666666,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_computer_security,acc,0.48,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_conceptual_physics,acc,0.31063829787234043,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_electrical_engineering,acc,0.46206896551724136,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_elementary_mathematics,acc,0.23544973544973544,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_biology,acc,0.432258064516129,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_chemistry,acc,0.270935960591133,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_computer_science,acc,0.33,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_mathematics,acc,0.2074074074074074,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_physics,acc,0.25165562913907286,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_statistics,acc,0.2175925925925926,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_machine_learning,acc,0.33035714285714285,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu,acc,0.3748753738783649,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_humanities,acc,0.3564293304994687,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_formal_logic,acc,0.36507936507936506,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_european_history,acc,0.5212121212121212,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_us_history,acc,0.4264705882352941,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_world_history,acc,0.5232067510548524,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_international_law,acc,0.512396694214876,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_jurisprudence,acc,0.46296296296296297,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_logical_fallacies,acc,0.4049079754601227,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_moral_disputes,acc,0.40173410404624277,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_moral_scenarios,acc,0.24804469273743016,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_philosophy,acc,0.3536977491961415,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_prehistory,acc,0.3888888888888889,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_law,acc,0.31421121251629724,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_world_religions,acc,0.4502923976608187,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_other,acc,0.42645638879948505,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_business_ethics,acc,0.48,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_clinical_knowledge,acc,0.4,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_medicine,acc,0.3699421965317919,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_global_facts,acc,0.23,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_human_aging,acc,0.4484304932735426,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_management,acc,0.49514563106796117,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_marketing,acc,0.6068376068376068,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_medical_genetics,acc,0.38,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_miscellaneous,acc,0.4827586206896552,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_nutrition,acc,0.4477124183006536,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_accounting,acc,0.32269503546099293,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_medicine,acc,0.3235294117647059,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_virology,acc,0.35542168674698793,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_social_sciences,acc,0.41501462463438415,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_econometrics,acc,0.22807017543859648,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_geography,acc,0.45454545454545453,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_government_and_politics,acc,0.48704663212435234,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_macroeconomics,acc,0.36153846153846153,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_microeconomics,acc,0.31512605042016806,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_psychology,acc,0.5155963302752293,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_human_sexuality,acc,0.4351145038167939,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_professional_psychology,acc,0.3790849673202614,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_public_relations,acc,0.4090909090909091,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_security_studies,acc,0.34285714285714286,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_sociology,acc,0.48756218905472637,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_us_foreign_policy,acc,0.54,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_stem,acc,0.31240088804313354,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_abstract_algebra,acc,0.29,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_anatomy,acc,0.4,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_astronomy,acc,0.3684210526315789,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_biology,acc,0.3888888888888889,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_chemistry,acc,0.31,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_computer_science,acc,0.35,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_mathematics,acc,0.3,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_college_physics,acc,0.16666666666666666,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_computer_security,acc,0.48,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_conceptual_physics,acc,0.31063829787234043,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_electrical_engineering,acc,0.46206896551724136,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_elementary_mathematics,acc,0.23544973544973544,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_biology,acc,0.432258064516129,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_chemistry,acc,0.270935960591133,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_computer_science,acc,0.33,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_mathematics,acc,0.2074074074074074,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_physics,acc,0.25165562913907286,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_high_school_statistics,acc,0.2175925925925926,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_mmlu_machine_learning,acc,0.33035714285714285,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 google/gemma-2b-it:W4A16,task_openbookqa,acc,0.338,W4A16,espressor/google.gemma-2b-it_W4A16,3119175648 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_boolq,acc,0.8351681957186544,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_logiqa,acc,0.2672811059907834,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_piqa,acc,0.780195865070729,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_boolq,acc,0.8351681957186544,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_logiqa,acc,0.2672811059907834,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_openbookqa,acc,0.34,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_piqa,acc,0.780195865070729,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_truthfulqa_mc1,acc,0.3537331701346389,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_truthfulqa_mc2,acc,0.5173151918892398,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_boolq,acc,0.8351681957186544,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_logiqa,acc,0.2672811059907834,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_openbookqa,acc,0.34,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_truthfulqa_mc1,acc,0.3537331701346389,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_truthfulqa_mc2,acc,0.5173151918892398,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu,acc,0.633314342686227,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_humanities,acc,0.5785334750265675,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_formal_logic,acc,0.49206349206349204,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_european_history,acc,0.7333333333333333,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_us_history,acc,0.8382352941176471,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_world_history,acc,0.8143459915611815,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_international_law,acc,0.7603305785123967,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_jurisprudence,acc,0.7685185185185185,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_logical_fallacies,acc,0.7730061349693251,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_moral_disputes,acc,0.7023121387283237,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_moral_scenarios,acc,0.3318435754189944,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_philosophy,acc,0.7138263665594855,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_prehistory,acc,0.7222222222222222,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_law,acc,0.48565840938722293,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_world_religions,acc,0.7777777777777778,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_other,acc,0.7109752172513679,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_business_ethics,acc,0.65,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.7094339622641509,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_medicine,acc,0.6242774566473989,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_global_facts,acc,0.39,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_human_aging,acc,0.6547085201793722,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_management,acc,0.8446601941747572,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_marketing,acc,0.8888888888888888,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_medical_genetics,acc,0.81,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_miscellaneous,acc,0.8045977011494253,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_nutrition,acc,0.7320261437908496,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_accounting,acc,0.5425531914893617,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_medicine,acc,0.7169117647058824,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_virology,acc,0.5120481927710844,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_social_sciences,acc,0.7403314917127072,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_econometrics,acc,0.5087719298245614,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_geography,acc,0.7878787878787878,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.8808290155440415,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.6282051282051282,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.7226890756302521,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_psychology,acc,0.8311926605504587,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_human_sexuality,acc,0.7404580152671756,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_psychology,acc,0.6830065359477124,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_public_relations,acc,0.6727272727272727,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_security_studies,acc,0.7387755102040816,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_sociology,acc,0.8407960199004975,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.85,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_stem,acc,0.5340945131620679,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_abstract_algebra,acc,0.31,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_anatomy,acc,0.6296296296296297,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_astronomy,acc,0.6842105263157895,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_biology,acc,0.7291666666666666,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_chemistry,acc,0.44,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_computer_science,acc,0.48,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_mathematics,acc,0.34,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_physics,acc,0.49019607843137253,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_computer_security,acc,0.73,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_conceptual_physics,acc,0.5361702127659574,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_electrical_engineering,acc,0.6137931034482759,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.46296296296296297,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_biology,acc,0.7419354838709677,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.4433497536945813,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.69,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.37407407407407406,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_physics,acc,0.423841059602649,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_statistics,acc,0.5092592592592593,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_machine_learning,acc,0.5,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu,acc,0.633314342686227,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_humanities,acc,0.5785334750265675,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_formal_logic,acc,0.49206349206349204,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_european_history,acc,0.7333333333333333,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_us_history,acc,0.8382352941176471,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_world_history,acc,0.8143459915611815,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_international_law,acc,0.7603305785123967,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_jurisprudence,acc,0.7685185185185185,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_logical_fallacies,acc,0.7730061349693251,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_moral_disputes,acc,0.7023121387283237,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_moral_scenarios,acc,0.3318435754189944,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_philosophy,acc,0.7138263665594855,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_prehistory,acc,0.7222222222222222,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_law,acc,0.48565840938722293,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_world_religions,acc,0.7777777777777778,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_other,acc,0.7109752172513679,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_business_ethics,acc,0.65,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.7094339622641509,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_medicine,acc,0.6242774566473989,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_global_facts,acc,0.39,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_human_aging,acc,0.6547085201793722,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_management,acc,0.8446601941747572,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_marketing,acc,0.8888888888888888,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_medical_genetics,acc,0.81,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_miscellaneous,acc,0.8045977011494253,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_nutrition,acc,0.7320261437908496,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_accounting,acc,0.5425531914893617,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_medicine,acc,0.7169117647058824,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_virology,acc,0.5120481927710844,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_social_sciences,acc,0.7403314917127072,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_econometrics,acc,0.5087719298245614,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_geography,acc,0.7878787878787878,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.8808290155440415,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.6282051282051282,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.7226890756302521,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_psychology,acc,0.8311926605504587,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_human_sexuality,acc,0.7404580152671756,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_professional_psychology,acc,0.6830065359477124,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_public_relations,acc,0.6727272727272727,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_security_studies,acc,0.7387755102040816,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_sociology,acc,0.8407960199004975,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.85,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_stem,acc,0.5340945131620679,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_abstract_algebra,acc,0.31,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_anatomy,acc,0.6296296296296297,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_astronomy,acc,0.6842105263157895,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_biology,acc,0.7291666666666666,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_chemistry,acc,0.44,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_computer_science,acc,0.48,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_mathematics,acc,0.34,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_college_physics,acc,0.49019607843137253,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_computer_security,acc,0.73,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_conceptual_physics,acc,0.5361702127659574,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_electrical_engineering,acc,0.6137931034482759,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.46296296296296297,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_biology,acc,0.7419354838709677,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.4433497536945813,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.69,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.37407407407407406,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_physics,acc,0.423841059602649,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_high_school_statistics,acc,0.5092592592592593,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_mmlu_machine_learning,acc,0.5,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_truthfulqa_mc1,acc,0.3537331701346389,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_truthfulqa_mc2,acc,0.5173151918892398,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 meta-llama/Meta-Llama-3-8B-Instruct:W8A8_int8,task_openbookqa,acc,0.34,W8A8_int8,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W8A8_int8,9083953152 google/gemma-2-9b-it:W8A8_FP8,task_boolq,acc,0.8889908256880734,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.36363636363636365,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.35353535353535354,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.3315018315018315,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.3498168498168498,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.35044642857142855,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.375,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_logiqa,acc,0.3317972350230415,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu,acc,0.7196268337843612,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_humanities,acc,0.6501594048884166,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_formal_logic,acc,0.5238095238095238,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.8484848484848485,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.8823529411764706,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.8945147679324894,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_international_law,acc,0.8760330578512396,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_jurisprudence,acc,0.8240740740740741,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.8282208588957055,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_moral_disputes,acc,0.7601156069364162,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.4033519553072626,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_philosophy,acc,0.7620578778135049,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_prehistory,acc,0.808641975308642,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_professional_law,acc,0.5619295958279009,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_world_religions,acc,0.8538011695906432,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_other,acc,0.7698744769874477,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_business_ethics,acc,0.7,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.7773584905660378,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_college_medicine,acc,0.7283236994219653,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_global_facts,acc,0.45,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_human_aging,acc,0.7757847533632287,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_management,acc,0.8543689320388349,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_marketing,acc,0.9188034188034188,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_medical_genetics,acc,0.86,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_miscellaneous,acc,0.8671775223499362,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_nutrition,acc,0.7418300653594772,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_professional_accounting,acc,0.6099290780141844,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_professional_medicine,acc,0.7977941176470589,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_virology,acc,0.5301204819277109,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_social_sciences,acc,0.8368540786480339,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_econometrics,acc,0.6140350877192983,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_geography,acc,0.9040404040404041,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.9481865284974094,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.7948717948717948,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.8235294117647058,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.9155963302752294,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_human_sexuality,acc,0.8320610687022901,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_professional_psychology,acc,0.7859477124183006,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_public_relations,acc,0.7454545454545455,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_security_studies,acc,0.8081632653061225,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_sociology,acc,0.8706467661691543,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.93,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_stem,acc,0.659372026641294,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.46,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_anatomy,acc,0.725925925925926,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_astronomy,acc,0.8092105263157895,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_college_biology,acc,0.8680555555555556,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_college_chemistry,acc,0.54,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_college_computer_science,acc,0.56,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_college_mathematics,acc,0.44,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_college_physics,acc,0.49019607843137253,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_computer_security,acc,0.81,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.6851063829787234,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.7172413793103448,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.6111111111111112,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_biology,acc,0.9032258064516129,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.6748768472906403,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.81,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.44074074074074077,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_physics,acc,0.5894039735099338,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.6527777777777778,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_mmlu_machine_learning,acc,0.5267857142857143,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_openbookqa,acc,0.402,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_piqa,acc,0.8101196953210011,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.42962056303549573,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.6020533600309542,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_boolq,acc,0.8889908256880734,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.36363636363636365,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.35353535353535354,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.3315018315018315,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.3498168498168498,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.35044642857142855,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.375,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 google/gemma-2-9b-it:W8A8_FP8,task_logiqa,acc,0.3317972350230415,W8A8_FP8,espressor/google.gemma-2-9b-it_W8A8_FP8,11998522368 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu,acc,0.4531405782652044,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_humanities,acc,0.42911795961742827,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_formal_logic,acc,0.35714285714285715,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_european_history,acc,0.6363636363636364,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_us_history,acc,0.5784313725490197,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_world_history,acc,0.6497890295358649,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_international_law,acc,0.5537190082644629,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_jurisprudence,acc,0.5092592592592593,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_logical_fallacies,acc,0.43558282208588955,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_moral_disputes,acc,0.4393063583815029,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_moral_scenarios,acc,0.32737430167597764,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_philosophy,acc,0.4887459807073955,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_prehistory,acc,0.49691358024691357,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_law,acc,0.3559322033898305,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_world_religions,acc,0.5847953216374269,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_other,acc,0.5143224975860959,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_business_ethics,acc,0.43,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.49433962264150944,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_medicine,acc,0.3815028901734104,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_global_facts,acc,0.3,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_human_aging,acc,0.515695067264574,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_management,acc,0.5436893203883495,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_marketing,acc,0.6837606837606838,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_medical_genetics,acc,0.48,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_miscellaneous,acc,0.5887611749680716,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_nutrition,acc,0.5555555555555556,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_accounting,acc,0.36879432624113473,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_medicine,acc,0.5367647058823529,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_virology,acc,0.40963855421686746,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_social_sciences,acc,0.5017874553136171,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_econometrics,acc,0.21929824561403508,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_geography,acc,0.5555555555555556,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.5181347150259067,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.41025641025641024,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.4579831932773109,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_psychology,acc,0.6256880733944954,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_human_sexuality,acc,0.5038167938931297,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_psychology,acc,0.42320261437908496,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_public_relations,acc,0.4636363636363636,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_security_studies,acc,0.4897959183673469,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_sociology,acc,0.6666666666666666,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.69,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_stem,acc,0.3812242308912147,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_abstract_algebra,acc,0.24,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_anatomy,acc,0.5037037037037037,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_astronomy,acc,0.5263157894736842,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_biology,acc,0.4652777777777778,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_chemistry,acc,0.38,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_computer_science,acc,0.3,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_mathematics,acc,0.32,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_physics,acc,0.27450980392156865,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_computer_security,acc,0.46,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_conceptual_physics,acc,0.4085106382978723,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_electrical_engineering,acc,0.5241379310344828,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.29365079365079366,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_biology,acc,0.49032258064516127,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.3497536945812808,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.3037037037037037,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_physics,acc,0.2913907284768212,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_statistics,acc,0.35648148148148145,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_machine_learning,acc,0.29464285714285715,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu,acc,0.4531405782652044,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_humanities,acc,0.42911795961742827,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_formal_logic,acc,0.35714285714285715,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_european_history,acc,0.6363636363636364,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_us_history,acc,0.5784313725490197,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_world_history,acc,0.6497890295358649,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_international_law,acc,0.5537190082644629,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_jurisprudence,acc,0.5092592592592593,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_logical_fallacies,acc,0.43558282208588955,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_moral_disputes,acc,0.4393063583815029,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_moral_scenarios,acc,0.32737430167597764,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_philosophy,acc,0.4887459807073955,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_prehistory,acc,0.49691358024691357,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_law,acc,0.3559322033898305,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_world_religions,acc,0.5847953216374269,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_other,acc,0.5143224975860959,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_business_ethics,acc,0.43,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.49433962264150944,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_medicine,acc,0.3815028901734104,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_global_facts,acc,0.3,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_human_aging,acc,0.515695067264574,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_management,acc,0.5436893203883495,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_marketing,acc,0.6837606837606838,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_medical_genetics,acc,0.48,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_miscellaneous,acc,0.5887611749680716,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_nutrition,acc,0.5555555555555556,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_accounting,acc,0.36879432624113473,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_medicine,acc,0.5367647058823529,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_virology,acc,0.40963855421686746,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_social_sciences,acc,0.5017874553136171,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_econometrics,acc,0.21929824561403508,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_geography,acc,0.5555555555555556,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.5181347150259067,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.41025641025641024,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.4579831932773109,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_psychology,acc,0.6256880733944954,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_human_sexuality,acc,0.5038167938931297,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_professional_psychology,acc,0.42320261437908496,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_public_relations,acc,0.4636363636363636,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_security_studies,acc,0.4897959183673469,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_sociology,acc,0.6666666666666666,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.69,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_stem,acc,0.3812242308912147,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_abstract_algebra,acc,0.24,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_anatomy,acc,0.5037037037037037,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_astronomy,acc,0.5263157894736842,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_biology,acc,0.4652777777777778,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_chemistry,acc,0.38,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_computer_science,acc,0.3,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_mathematics,acc,0.32,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_college_physics,acc,0.27450980392156865,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_computer_security,acc,0.46,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_conceptual_physics,acc,0.4085106382978723,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_electrical_engineering,acc,0.5241379310344828,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.29365079365079366,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_biology,acc,0.49032258064516127,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.3497536945812808,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.47,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.3037037037037037,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_physics,acc,0.2913907284768212,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_high_school_statistics,acc,0.35648148148148145,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_mmlu_machine_learning,acc,0.29464285714285715,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_truthfulqa_mc1,acc,0.27539779681762544,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 meta-llama/Llama-3.2-1B-Instruct:W8A8_int8,task_truthfulqa_mc2,acc,0.4429420395738545,W8A8_int8,espressor/meta-llama.Llama-3.2-1B-Instruct_W8A8_int8,2024640512 google/gemma-2b-it:W8A8_int8,task_mmlu,acc,0.24654607605754167,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_humanities,acc,0.2450584484590861,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_formal_logic,acc,0.1984126984126984,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_european_history,acc,0.24242424242424243,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_us_history,acc,0.23529411764705882,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_world_history,acc,0.2616033755274262,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_international_law,acc,0.24793388429752067,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_jurisprudence,acc,0.2962962962962963,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_logical_fallacies,acc,0.24539877300613497,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_moral_disputes,acc,0.24566473988439305,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_moral_scenarios,acc,0.2424581005586592,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_philosophy,acc,0.2733118971061093,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_prehistory,acc,0.2654320987654321,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_law,acc,0.2392438070404172,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_world_religions,acc,0.21052631578947367,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_other,acc,0.26874798841326036,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_business_ethics,acc,0.26,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.2679245283018868,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_medicine,acc,0.20809248554913296,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_global_facts,acc,0.31,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_human_aging,acc,0.37668161434977576,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_management,acc,0.2524271844660194,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_marketing,acc,0.2564102564102564,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_medical_genetics,acc,0.26,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_miscellaneous,acc,0.28735632183908044,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_nutrition,acc,0.22875816993464052,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_accounting,acc,0.2553191489361702,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_medicine,acc,0.20220588235294118,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_virology,acc,0.3192771084337349,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_social_sciences,acc,0.23431914202144946,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_econometrics,acc,0.2807017543859649,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_geography,acc,0.21717171717171718,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.20725388601036268,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.2205128205128205,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.23109243697478993,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_psychology,acc,0.23669724770642203,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_human_sexuality,acc,0.22900763358778625,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_psychology,acc,0.2565359477124183,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_public_relations,acc,0.34545454545454546,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_security_studies,acc,0.17142857142857143,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_sociology,acc,0.23880597014925373,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.21,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_stem,acc,0.23882017126546146,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_abstract_algebra,acc,0.26,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_anatomy,acc,0.2518518518518518,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_astronomy,acc,0.18421052631578946,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_biology,acc,0.2222222222222222,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_chemistry,acc,0.21,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_computer_science,acc,0.15,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_mathematics,acc,0.23,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_physics,acc,0.19607843137254902,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_computer_security,acc,0.24,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_conceptual_physics,acc,0.32340425531914896,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_electrical_engineering,acc,0.2206896551724138,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.2566137566137566,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_biology,acc,0.25483870967741934,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.270935960591133,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.23,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.26296296296296295,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.1986754966887417,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.16203703703703703,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.2857142857142857,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu,acc,0.24654607605754167,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_humanities,acc,0.2450584484590861,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_formal_logic,acc,0.1984126984126984,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_european_history,acc,0.24242424242424243,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_us_history,acc,0.23529411764705882,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_world_history,acc,0.2616033755274262,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_international_law,acc,0.24793388429752067,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_jurisprudence,acc,0.2962962962962963,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_logical_fallacies,acc,0.24539877300613497,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_moral_disputes,acc,0.24566473988439305,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_moral_scenarios,acc,0.2424581005586592,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_philosophy,acc,0.2733118971061093,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_prehistory,acc,0.2654320987654321,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_law,acc,0.2392438070404172,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_world_religions,acc,0.21052631578947367,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_other,acc,0.26874798841326036,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_business_ethics,acc,0.26,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.2679245283018868,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_medicine,acc,0.20809248554913296,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_global_facts,acc,0.31,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_human_aging,acc,0.37668161434977576,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_management,acc,0.2524271844660194,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_marketing,acc,0.2564102564102564,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_medical_genetics,acc,0.26,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_miscellaneous,acc,0.28735632183908044,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_nutrition,acc,0.22875816993464052,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_accounting,acc,0.2553191489361702,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_medicine,acc,0.20220588235294118,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_virology,acc,0.3192771084337349,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_social_sciences,acc,0.23431914202144946,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_econometrics,acc,0.2807017543859649,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_geography,acc,0.21717171717171718,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.20725388601036268,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.2205128205128205,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.23109243697478993,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_psychology,acc,0.23669724770642203,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_human_sexuality,acc,0.22900763358778625,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_professional_psychology,acc,0.2565359477124183,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_public_relations,acc,0.34545454545454546,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_security_studies,acc,0.17142857142857143,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_sociology,acc,0.23880597014925373,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.21,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_stem,acc,0.23882017126546146,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_abstract_algebra,acc,0.26,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_anatomy,acc,0.2518518518518518,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_astronomy,acc,0.18421052631578946,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_biology,acc,0.2222222222222222,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_chemistry,acc,0.21,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_computer_science,acc,0.15,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_mathematics,acc,0.23,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_college_physics,acc,0.19607843137254902,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_computer_security,acc,0.24,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_conceptual_physics,acc,0.32340425531914896,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_electrical_engineering,acc,0.2206896551724138,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.2566137566137566,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_biology,acc,0.25483870967741934,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.270935960591133,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.23,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.26296296296296295,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.1986754966887417,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.16203703703703703,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.2857142857142857,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_truthfulqa_mc1,acc,0.200734394124847,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_truthfulqa_mc2,acc,0.4449819227010454,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_boolq,acc,0.6217125382262997,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_logiqa,acc,0.2304147465437788,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-2b-it:W8A8_int8,task_piqa,acc,0.5429815016322089,W8A8_int8,espressor/google.gemma-2b-it_W8A8_int8,4080531456 google/gemma-7b-it:W8A8_FP8,task_boolq,acc,0.8110091743119267,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.30303030303030304,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.25252525252525254,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.2783882783882784,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.2948717948717949,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.2611607142857143,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.296875,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_logiqa,acc,0.24423963133640553,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_boolq,acc,0.8110091743119267,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.30303030303030304,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.25252525252525254,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.2783882783882784,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.2948717948717949,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.2611607142857143,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.296875,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_logiqa,acc,0.24423963133640553,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu,acc,0.4992166358068651,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_humanities,acc,0.4486716259298619,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_formal_logic,acc,0.3492063492063492,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.6303030303030303,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.6029411764705882,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.6919831223628692,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_international_law,acc,0.6528925619834711,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_jurisprudence,acc,0.6388888888888888,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.558282208588957,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_moral_disputes,acc,0.5635838150289018,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.2335195530726257,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_philosophy,acc,0.5787781350482315,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_prehistory,acc,0.5462962962962963,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_professional_law,acc,0.36571056062581486,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_world_religions,acc,0.672514619883041,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_other,acc,0.576440296105568,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_business_ethics,acc,0.51,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.5509433962264151,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_college_medicine,acc,0.4393063583815029,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_global_facts,acc,0.4,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_human_aging,acc,0.6233183856502242,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_management,acc,0.6796116504854369,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_marketing,acc,0.8205128205128205,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_medical_genetics,acc,0.59,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_miscellaneous,acc,0.7037037037037037,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_nutrition,acc,0.5718954248366013,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_professional_accounting,acc,0.3404255319148936,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_professional_medicine,acc,0.4522058823529412,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_virology,acc,0.4397590361445783,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_social_sciences,acc,0.5758856028599285,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_econometrics,acc,0.34210526315789475,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_geography,acc,0.6666666666666666,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.6787564766839378,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.4717948717948718,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.4831932773109244,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.7211009174311926,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_human_sexuality,acc,0.6259541984732825,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_professional_psychology,acc,0.49019607843137253,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_public_relations,acc,0.6545454545454545,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_security_studies,acc,0.4897959183673469,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_sociology,acc,0.6616915422885572,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.71,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_stem,acc,0.4237234379955598,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.29,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_anatomy,acc,0.4666666666666667,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_astronomy,acc,0.4868421052631579,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_college_biology,acc,0.5555555555555556,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_college_chemistry,acc,0.38,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_college_computer_science,acc,0.49,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_college_mathematics,acc,0.33,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_college_physics,acc,0.2647058823529412,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_computer_security,acc,0.72,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.4765957446808511,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.4827586206896552,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.3201058201058201,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_biology,acc,0.5838709677419355,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.4187192118226601,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.53,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.3037037037037037,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_physics,acc,0.33112582781456956,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.3194444444444444,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_mmlu_machine_learning,acc,0.42857142857142855,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_openbookqa,acc,0.36,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_piqa,acc,0.7682263329706203,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3023255813953488,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 google/gemma-7b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.4740387230460525,W8A8_FP8,espressor/google.gemma-7b-it_W8A8_FP8,10900936704 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_boolq,acc,0.6587155963302752,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_logiqa,acc,0.25960061443932414,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_piqa,acc,0.7682263329706203,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu,acc,0.4646773963822817,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_humanities,acc,0.3615302869287991,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.3253968253968254,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.20606060606060606,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.2647058823529412,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.2742616033755274,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_international_law,acc,0.5041322314049587,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.6018518518518519,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.5214723926380368,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.5404624277456648,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_philosophy,acc,0.5691318327974276,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_prehistory,acc,0.49382716049382713,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_law,acc,0.2900912646675359,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_world_religions,acc,0.6666666666666666,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_other,acc,0.5786932732539427,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.51,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.630188679245283,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.5260115606936416,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_global_facts,acc,0.33,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_human_aging,acc,0.5739910313901345,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_management,acc,0.7475728155339806,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_marketing,acc,0.7393162393162394,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.63,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.7369093231162197,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_nutrition,acc,0.6078431372549019,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.36524822695035464,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.29411764705882354,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_virology,acc,0.41566265060240964,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.5492362690932727,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_econometrics,acc,0.3684210526315789,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.6818181818181818,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.5906735751295337,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.5897435897435898,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.4957983193277311,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.6146788990825688,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.6717557251908397,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.49019607843137253,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_public_relations,acc,0.5272727272727272,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_security_studies,acc,0.3306122448979592,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_sociology,acc,0.6019900497512438,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.68,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_stem,acc,0.4237234379955598,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.29,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_anatomy,acc,0.4962962962962963,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_astronomy,acc,0.6776315789473685,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_biology,acc,0.625,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.32,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.4,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.28,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_physics,acc,0.4019607843137255,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_computer_security,acc,0.62,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.49361702127659574,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.5103448275862069,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.37566137566137564,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.5290322580645161,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.35960591133004927,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.42,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.2740740740740741,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.304635761589404,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.3055555555555556,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.41964285714285715,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2741738066095471,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.4777084681350537,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu,acc,0.4646773963822817,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_humanities,acc,0.3615302869287991,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.3253968253968254,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.20606060606060606,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.2647058823529412,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.2742616033755274,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_international_law,acc,0.5041322314049587,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.6018518518518519,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.5214723926380368,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.5404624277456648,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_philosophy,acc,0.5691318327974276,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_prehistory,acc,0.49382716049382713,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_law,acc,0.2900912646675359,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_world_religions,acc,0.6666666666666666,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_other,acc,0.5786932732539427,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.51,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.630188679245283,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.5260115606936416,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_global_facts,acc,0.33,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_human_aging,acc,0.5739910313901345,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_management,acc,0.7475728155339806,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_marketing,acc,0.7393162393162394,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.63,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.7369093231162197,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_nutrition,acc,0.6078431372549019,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.36524822695035464,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.29411764705882354,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_virology,acc,0.41566265060240964,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.5492362690932727,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_econometrics,acc,0.3684210526315789,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.6818181818181818,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.5906735751295337,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.5897435897435898,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.4957983193277311,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.6146788990825688,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.6717557251908397,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.49019607843137253,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_public_relations,acc,0.5272727272727272,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_security_studies,acc,0.3306122448979592,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_sociology,acc,0.6019900497512438,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.68,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_stem,acc,0.4237234379955598,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.29,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_anatomy,acc,0.4962962962962963,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_astronomy,acc,0.6776315789473685,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_biology,acc,0.625,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.32,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.4,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.28,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_college_physics,acc,0.4019607843137255,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_computer_security,acc,0.62,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.49361702127659574,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.5103448275862069,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.37566137566137564,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.5290322580645161,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.35960591133004927,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.42,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.2740740740740741,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.304635761589404,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.3055555555555556,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 meta-llama/Meta-Llama-3-8B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.41964285714285715,W4A16,espressor/meta-llama.Meta-Llama-3-8B-Instruct_W4A16,5700595200 google/gemma-2-2b-it:W8A8_FP8,task_boolq,acc,0.8388379204892966,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.25757575757575757,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.29292929292929293,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.304029304029304,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.32234432234432236,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.31026785714285715,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.3169642857142857,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_logiqa,acc,0.2764976958525346,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_boolq,acc,0.8388379204892966,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.25757575757575757,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.29292929292929293,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.304029304029304,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.32234432234432236,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.31026785714285715,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.3169642857142857,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_logiqa,acc,0.2764976958525346,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu,acc,0.5704315624554906,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_humanities,acc,0.5092454835281616,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_formal_logic,acc,0.35714285714285715,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.7333333333333333,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.7450980392156863,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.759493670886076,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_international_law,acc,0.7107438016528925,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_jurisprudence,acc,0.6851851851851852,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.7361963190184049,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_moral_disputes,acc,0.6329479768786127,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.24916201117318434,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_philosophy,acc,0.6495176848874598,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_prehistory,acc,0.6141975308641975,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_law,acc,0.42633637548891784,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_world_religions,acc,0.7076023391812866,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_other,acc,0.6411329256517541,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_business_ethics,acc,0.52,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.6339622641509434,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_medicine,acc,0.6184971098265896,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_global_facts,acc,0.29,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_human_aging,acc,0.5964125560538116,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_management,acc,0.7864077669902912,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_marketing,acc,0.811965811965812,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_medical_genetics,acc,0.65,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_miscellaneous,acc,0.7675606641123882,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_nutrition,acc,0.6601307189542484,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_accounting,acc,0.425531914893617,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_medicine,acc,0.5661764705882353,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_virology,acc,0.5421686746987951,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_social_sciences,acc,0.6766330841728957,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_econometrics,acc,0.40350877192982454,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_geography,acc,0.7373737373737373,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.7927461139896373,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.6205128205128205,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.5756302521008403,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.8238532110091743,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_human_sexuality,acc,0.6870229007633588,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_psychology,acc,0.5571895424836601,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_public_relations,acc,0.6727272727272727,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_security_studies,acc,0.689795918367347,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_sociology,acc,0.7860696517412935,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.77,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_stem,acc,0.48842372343799556,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.39,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_anatomy,acc,0.5333333333333333,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_astronomy,acc,0.5657894736842105,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_biology,acc,0.6875,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_chemistry,acc,0.45,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_computer_science,acc,0.44,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_mathematics,acc,0.37,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_physics,acc,0.35294117647058826,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_computer_security,acc,0.63,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.46382978723404256,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.5862068965517241,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.4126984126984127,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_biology,acc,0.7548387096774194,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.4433497536945813,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.6,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.362962962962963,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_physics,acc,0.2781456953642384,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.49074074074074076,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_mmlu_machine_learning,acc,0.3482142857142857,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_openbookqa,acc,0.36,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_piqa,acc,0.7861806311207835,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3733170134638923,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.5289090993939894,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc1,acc,0.23378212974296206,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc2,acc,,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_piqa,acc,0.529923830250272,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_piqa,acc,0.529923830250272,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc1,acc,0.23378212974296206,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc2,acc,,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu,acc,0.2457627118644068,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_humanities,acc,0.24187035069075452,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_formal_logic,acc,0.23015873015873015,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_european_history,acc,0.24848484848484848,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_us_history,acc,0.23529411764705882,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_world_history,acc,0.22362869198312235,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_international_law,acc,0.23140495867768596,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_jurisprudence,acc,0.3148148148148148,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_logical_fallacies,acc,0.2331288343558282,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_disputes,acc,0.2630057803468208,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_scenarios,acc,0.23798882681564246,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_philosophy,acc,0.2379421221864952,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_prehistory,acc,0.23765432098765432,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_law,acc,0.2470664928292047,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_world_religions,acc,0.19298245614035087,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_other,acc,0.25523012552301255,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_business_ethics,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_medicine,acc,0.2023121387283237,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_global_facts,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_aging,acc,0.34977578475336324,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_management,acc,0.2524271844660194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_marketing,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_medical_genetics,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_miscellaneous,acc,0.2707535121328225,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_nutrition,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_accounting,acc,0.19858156028368795,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_medicine,acc,0.22794117647058823,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_virology,acc,0.3373493975903614,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_social_sciences,acc,0.24731881702957426,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_econometrics,acc,0.22807017543859648,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_geography,acc,0.20707070707070707,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.22279792746113988,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.23949579831932774,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_psychology,acc,0.25321100917431194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_sexuality,acc,0.22137404580152673,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_psychology,acc,0.2679738562091503,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_public_relations,acc,0.32727272727272727,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_security_studies,acc,0.21224489795918366,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_sociology,acc,0.27860696517412936,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_stem,acc,0.2407231208372978,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_abstract_algebra,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_anatomy,acc,0.1925925925925926,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_astronomy,acc,0.23026315789473684,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_biology,acc,0.2152777777777778,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_chemistry,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_computer_science,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_mathematics,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_physics,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_computer_security,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_conceptual_physics,acc,0.3148936170212766,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_electrical_engineering,acc,0.21379310344827587,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.24338624338624337,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_biology,acc,0.22903225806451613,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.2660098522167488,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.26,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.26666666666666666,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.2185430463576159,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc1,acc,0.23378212974296206,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc2,acc,,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu,acc,0.2457627118644068,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_humanities,acc,0.24187035069075452,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_formal_logic,acc,0.23015873015873015,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_european_history,acc,0.24848484848484848,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_us_history,acc,0.23529411764705882,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_world_history,acc,0.22362869198312235,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_international_law,acc,0.23140495867768596,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_jurisprudence,acc,0.3148148148148148,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_logical_fallacies,acc,0.2331288343558282,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_disputes,acc,0.2630057803468208,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_scenarios,acc,0.23798882681564246,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_philosophy,acc,0.2379421221864952,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_prehistory,acc,0.23765432098765432,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_law,acc,0.2470664928292047,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_world_religions,acc,0.19298245614035087,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_other,acc,0.25523012552301255,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_business_ethics,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_medicine,acc,0.2023121387283237,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_global_facts,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_aging,acc,0.34977578475336324,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_management,acc,0.2524271844660194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_marketing,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_medical_genetics,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_miscellaneous,acc,0.2707535121328225,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_nutrition,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_accounting,acc,0.19858156028368795,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_medicine,acc,0.22794117647058823,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_virology,acc,0.3373493975903614,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_social_sciences,acc,0.24731881702957426,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_econometrics,acc,0.22807017543859648,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_geography,acc,0.20707070707070707,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.22279792746113988,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.23949579831932774,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_psychology,acc,0.25321100917431194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_sexuality,acc,0.22137404580152673,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_psychology,acc,0.2679738562091503,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_public_relations,acc,0.32727272727272727,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_security_studies,acc,0.21224489795918366,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_sociology,acc,0.27860696517412936,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_stem,acc,0.2407231208372978,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_abstract_algebra,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_anatomy,acc,0.1925925925925926,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_astronomy,acc,0.23026315789473684,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_biology,acc,0.2152777777777778,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_chemistry,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_computer_science,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_mathematics,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_physics,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_computer_security,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_conceptual_physics,acc,0.3148936170212766,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_electrical_engineering,acc,0.21379310344827587,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.24338624338624337,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_biology,acc,0.22903225806451613,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.2660098522167488,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.26,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.26666666666666666,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.2185430463576159,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_boolq,acc,0.7804281345565749,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.3181818181818182,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.29120879120879123,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.33516483516483514,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_main_n_shot,acc,0.32142857142857145,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.28348214285714285,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_logiqa,acc,0.250384024577573,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512 google/gemma-2b-it:W8A8_FP8,task_boolq,acc,0.6327217125382263,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.26262626262626265,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.2828282828282828,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.2564102564102564,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.29120879120879123,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.27455357142857145,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.3080357142857143,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_logiqa,acc,0.2457757296466974,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_boolq,acc,0.6327217125382263,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.26262626262626265,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.2828282828282828,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.2564102564102564,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_extended_zeroshot,acc,0.29120879120879123,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_main_n_shot,acc,0.27455357142857145,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_gpqa_main_zeroshot,acc,0.3080357142857143,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_logiqa,acc,0.2457757296466974,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu,acc,0.3793619142572283,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_humanities,acc,0.35451647183846974,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_formal_logic,acc,0.35714285714285715,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.5333333333333333,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.4068627450980392,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.5569620253164557,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_international_law,acc,0.5537190082644629,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_jurisprudence,acc,0.46296296296296297,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.3803680981595092,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_moral_disputes,acc,0.4046242774566474,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.23128491620111732,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_philosophy,acc,0.3440514469453376,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_prehistory,acc,0.38580246913580246,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_professional_law,acc,0.3135593220338983,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_world_religions,acc,0.47368421052631576,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_other,acc,0.4287093659478597,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_business_ethics,acc,0.44,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.4075471698113208,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_college_medicine,acc,0.3468208092485549,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_global_facts,acc,0.23,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_human_aging,acc,0.452914798206278,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_management,acc,0.49514563106796117,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_marketing,acc,0.6068376068376068,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_medical_genetics,acc,0.4,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_miscellaneous,acc,0.4878671775223499,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_nutrition,acc,0.4673202614379085,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_professional_accounting,acc,0.3262411347517731,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_professional_medicine,acc,0.3088235294117647,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_virology,acc,0.37349397590361444,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_social_sciences,acc,0.42476438089047774,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_econometrics,acc,0.2719298245614035,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_geography,acc,0.4393939393939394,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.5129533678756477,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.358974358974359,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.33613445378151263,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.5266055045871559,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_human_sexuality,acc,0.40458015267175573,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_professional_psychology,acc,0.37745098039215685,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_public_relations,acc,0.4,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_security_studies,acc,0.3836734693877551,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_sociology,acc,0.527363184079602,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.55,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_stem,acc,0.3235014272121789,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.31,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_anatomy,acc,0.3851851851851852,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_astronomy,acc,0.3684210526315789,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_college_biology,acc,0.4375,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_college_chemistry,acc,0.28,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_college_computer_science,acc,0.37,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_college_mathematics,acc,0.31,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_college_physics,acc,0.17647058823529413,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_computer_security,acc,0.51,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.3191489361702128,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.4896551724137931,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.24074074074074073,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_biology,acc,0.4290322580645161,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.2857142857142857,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.35,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.21481481481481482,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_physics,acc,0.271523178807947,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.24537037037037038,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_mmlu_machine_learning,acc,0.3392857142857143,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_openbookqa,acc,0.33,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_piqa,acc,0.7459194776931447,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.2913096695226438,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 google/gemma-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.45527595550844063,W8A8_FP8,espressor/google.gemma-2b-it_W8A8_FP8,4080531456 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_truthfulqa_mc1,acc,0.2692778457772338,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_truthfulqa_mc2,acc,0.4382848532929551,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu,acc,0.4585529126904999,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_humanities,acc,0.4403825717321998,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_formal_logic,acc,0.3253968253968254,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_european_history,acc,0.6242424242424243,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_us_history,acc,0.5833333333333334,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_world_history,acc,0.6497890295358649,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_international_law,acc,0.5867768595041323,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_jurisprudence,acc,0.5277777777777778,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_logical_fallacies,acc,0.44785276073619634,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_moral_disputes,acc,0.4624277456647399,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_moral_scenarios,acc,0.33519553072625696,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_philosophy,acc,0.5176848874598071,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_prehistory,acc,0.5277777777777778,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_law,acc,0.3644067796610169,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_world_religions,acc,0.6023391812865497,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_other,acc,0.5159317669777921,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_business_ethics,acc,0.44,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_clinical_knowledge,acc,0.4716981132075472,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_medicine,acc,0.3872832369942196,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_global_facts,acc,0.31,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_human_aging,acc,0.515695067264574,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_management,acc,0.5339805825242718,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_marketing,acc,0.6752136752136753,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_medical_genetics,acc,0.47,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_miscellaneous,acc,0.598978288633461,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_nutrition,acc,0.5522875816993464,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_accounting,acc,0.3617021276595745,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_medicine,acc,0.5588235294117647,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_virology,acc,0.41566265060240964,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_social_sciences,acc,0.5089372765680859,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_econometrics,acc,0.23684210526315788,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_geography,acc,0.5555555555555556,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_government_and_politics,acc,0.5233160621761658,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_macroeconomics,acc,0.4025641025641026,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_microeconomics,acc,0.4579831932773109,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_psychology,acc,0.6311926605504588,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_human_sexuality,acc,0.5572519083969466,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_psychology,acc,0.41830065359477125,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_public_relations,acc,0.4909090909090909,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_security_studies,acc,0.5428571428571428,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_sociology,acc,0.6517412935323383,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_us_foreign_policy,acc,0.71,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_stem,acc,0.37995559784332383,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_abstract_algebra,acc,0.23,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_anatomy,acc,0.48148148148148145,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_astronomy,acc,0.5460526315789473,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_biology,acc,0.4930555555555556,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_chemistry,acc,0.35,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_computer_science,acc,0.32,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_mathematics,acc,0.31,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_physics,acc,0.2647058823529412,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_computer_security,acc,0.46,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_conceptual_physics,acc,0.4297872340425532,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_electrical_engineering,acc,0.5310344827586206,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_elementary_mathematics,acc,0.2804232804232804,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_biology,acc,0.5,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_chemistry,acc,0.3497536945812808,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_computer_science,acc,0.46,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_mathematics,acc,0.26666666666666666,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_physics,acc,0.31125827814569534,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_statistics,acc,0.35648148148148145,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_machine_learning,acc,0.29464285714285715,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_openbookqa,acc,0.248,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu,acc,0.4585529126904999,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_humanities,acc,0.4403825717321998,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_formal_logic,acc,0.3253968253968254,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_european_history,acc,0.6242424242424243,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_us_history,acc,0.5833333333333334,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_world_history,acc,0.6497890295358649,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_international_law,acc,0.5867768595041323,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_jurisprudence,acc,0.5277777777777778,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_logical_fallacies,acc,0.44785276073619634,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_moral_disputes,acc,0.4624277456647399,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_moral_scenarios,acc,0.33519553072625696,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_philosophy,acc,0.5176848874598071,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_prehistory,acc,0.5277777777777778,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_law,acc,0.3644067796610169,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_world_religions,acc,0.6023391812865497,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_other,acc,0.5159317669777921,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_business_ethics,acc,0.44,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_clinical_knowledge,acc,0.4716981132075472,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_medicine,acc,0.3872832369942196,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_global_facts,acc,0.31,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_human_aging,acc,0.515695067264574,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_management,acc,0.5339805825242718,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_marketing,acc,0.6752136752136753,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_medical_genetics,acc,0.47,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_miscellaneous,acc,0.598978288633461,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_nutrition,acc,0.5522875816993464,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_accounting,acc,0.3617021276595745,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_medicine,acc,0.5588235294117647,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_virology,acc,0.41566265060240964,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_social_sciences,acc,0.5089372765680859,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_econometrics,acc,0.23684210526315788,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_geography,acc,0.5555555555555556,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_government_and_politics,acc,0.5233160621761658,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_macroeconomics,acc,0.4025641025641026,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_microeconomics,acc,0.4579831932773109,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_psychology,acc,0.6311926605504588,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_human_sexuality,acc,0.5572519083969466,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_professional_psychology,acc,0.41830065359477125,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_public_relations,acc,0.4909090909090909,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_security_studies,acc,0.5428571428571428,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_sociology,acc,0.6517412935323383,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_us_foreign_policy,acc,0.71,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_stem,acc,0.37995559784332383,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_abstract_algebra,acc,0.23,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_anatomy,acc,0.48148148148148145,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_astronomy,acc,0.5460526315789473,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_biology,acc,0.4930555555555556,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_chemistry,acc,0.35,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_computer_science,acc,0.32,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_mathematics,acc,0.31,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_college_physics,acc,0.2647058823529412,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_computer_security,acc,0.46,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_conceptual_physics,acc,0.4297872340425532,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_electrical_engineering,acc,0.5310344827586206,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_elementary_mathematics,acc,0.2804232804232804,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_biology,acc,0.5,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_chemistry,acc,0.3497536945812808,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_computer_science,acc,0.46,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_mathematics,acc,0.26666666666666666,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_physics,acc,0.31125827814569534,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_high_school_statistics,acc,0.35648148148148145,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800 meta-llama/Llama-3.2-1B-Instruct:Default (bf16/fp16),task_mmlu_machine_learning,acc,0.29464285714285715,Default (bf16/fp16),meta-llama/Llama-3.2-1B-Instruct,2471628800