xzyao commited on
Commit
c6609ff
·
verified ·
1 Parent(s): c5de046

Upload eval_results.csv

Browse files
Files changed (1) hide show
  1. eval_results.csv +335 -0
eval_results.csv CHANGED
@@ -320,6 +320,73 @@ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.16
320
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
321
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
322
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
323
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
324
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
325
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
@@ -966,6 +1033,73 @@ google/gemma-2-2b-it:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/goo
966
  google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
967
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
968
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
969
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
970
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
971
  google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
@@ -2574,6 +2708,140 @@ google/gemma-2-2b-it:W8A8_FP8,task_openbookqa,acc,0.36,W8A8_FP8,espressor/google
2574
  google/gemma-2-2b-it:W8A8_FP8,task_piqa,acc,0.7861806311207835,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2575
  google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3733170134638923,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2576
  google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.5289090993939894,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2577
  google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2578
  google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2579
  google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
@@ -2716,6 +2984,73 @@ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.2185430463576
2716
  google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2717
  google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2718
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_boolq,acc,0.7804281345565749,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2719
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2720
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.3181818181818182,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2721
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.29120879120879123,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
 
320
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
321
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
322
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
323
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu,acc,0.23394103404073494,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
324
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_humanities,acc,0.24654622741764082,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
325
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_formal_logic,acc,0.2777777777777778,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
326
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_european_history,acc,0.23636363636363636,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
327
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_us_history,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
328
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_world_history,acc,0.26582278481012656,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
329
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_international_law,acc,0.24793388429752067,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
330
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_jurisprudence,acc,0.25925925925925924,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
331
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_logical_fallacies,acc,0.26993865030674846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
332
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_disputes,acc,0.2543352601156069,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
333
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
334
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_philosophy,acc,0.22186495176848875,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
335
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_prehistory,acc,0.23765432098765432,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
336
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_law,acc,0.24445893089960888,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
337
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_world_religions,acc,0.2807017543859649,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
338
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_other,acc,0.2281943997425169,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
339
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_business_ethics,acc,0.21,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
340
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
341
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_medicine,acc,0.27167630057803466,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
342
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_global_facts,acc,0.15,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
343
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_aging,acc,0.17937219730941703,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
344
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_management,acc,0.33980582524271846,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
345
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_marketing,acc,0.25213675213675213,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
346
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_medical_genetics,acc,0.31,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
347
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_miscellaneous,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
348
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_nutrition,acc,0.21895424836601307,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
349
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_accounting,acc,0.24113475177304963,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
350
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_medicine,acc,0.17279411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
351
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_virology,acc,0.2891566265060241,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
352
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_social_sciences,acc,0.23366915827104323,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
353
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_econometrics,acc,0.2543859649122807,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
354
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_geography,acc,0.26262626262626265,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
355
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_government_and_politics,acc,0.18652849740932642,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
356
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_macroeconomics,acc,0.22564102564102564,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
357
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_microeconomics,acc,0.226890756302521,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
358
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_psychology,acc,0.25321100917431194,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
359
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_human_sexuality,acc,0.2595419847328244,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
360
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_professional_psychology,acc,0.22712418300653595,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
361
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_public_relations,acc,0.2727272727272727,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
362
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_security_studies,acc,0.19183673469387755,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
363
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_sociology,acc,0.23383084577114427,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
364
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_us_foreign_policy,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
365
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_stem,acc,0.2210593085949889,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
366
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_abstract_algebra,acc,0.25,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
367
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_anatomy,acc,0.2074074074074074,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
368
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_astronomy,acc,0.2236842105263158,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
369
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_biology,acc,0.22916666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
370
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_chemistry,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
371
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_computer_science,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
372
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_mathematics,acc,0.23,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
373
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_college_physics,acc,0.23529411764705882,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
374
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_computer_security,acc,0.27,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
375
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_conceptual_physics,acc,0.19574468085106383,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
376
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_electrical_engineering,acc,0.2206896551724138,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
377
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_elementary_mathematics,acc,0.24867724867724866,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
378
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_biology,acc,0.2032258064516129,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
379
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_chemistry,acc,0.20689655172413793,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
380
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_computer_science,acc,0.2,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
381
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_mathematics,acc,0.21851851851851853,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
382
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_physics,acc,0.23178807947019867,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
383
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_high_school_statistics,acc,0.16666666666666666,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
384
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_mmlu_machine_learning,acc,0.26785714285714285,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
385
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
386
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
387
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
388
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_boolq,acc,0.41192660550458715,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
389
+ meta-llama/Llama-3.2-3B-Instruct:W4A16,task_logiqa,acc,0.2012288786482335,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
390
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_openbookqa,acc,0.186,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
391
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc1,acc,0.2778457772337821,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
392
  meta-llama/Llama-3.2-3B-Instruct:W4A16,task_truthfulqa_mc2,acc,0.49779200888041425,W4A16,espressor/meta-llama.Llama-3.2-3B-Instruct_W4A16,3029689408
 
1033
  google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1034
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1035
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1036
+ google/gemma-2-2b-it:W4A16,task_boolq,acc,0.8333333333333334,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1037
+ google/gemma-2-2b-it:W4A16,task_logiqa,acc,0.271889400921659,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1038
+ google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1039
+ google/gemma-2-2b-it:W4A16,task_mmlu_humanities,acc,0.491817215727949,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1040
+ google/gemma-2-2b-it:W4A16,task_mmlu_formal_logic,acc,0.3412698412698413,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1041
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_european_history,acc,0.7272727272727273,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1042
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_us_history,acc,0.7450980392156863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1043
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_world_history,acc,0.7468354430379747,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1044
+ google/gemma-2-2b-it:W4A16,task_mmlu_international_law,acc,0.6942148760330579,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1045
+ google/gemma-2-2b-it:W4A16,task_mmlu_jurisprudence,acc,0.6296296296296297,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1046
+ google/gemma-2-2b-it:W4A16,task_mmlu_logical_fallacies,acc,0.6809815950920245,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1047
+ google/gemma-2-2b-it:W4A16,task_mmlu_moral_disputes,acc,0.5982658959537572,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1048
+ google/gemma-2-2b-it:W4A16,task_mmlu_moral_scenarios,acc,0.23798882681564246,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1049
+ google/gemma-2-2b-it:W4A16,task_mmlu_philosophy,acc,0.6205787781350482,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1050
+ google/gemma-2-2b-it:W4A16,task_mmlu_prehistory,acc,0.595679012345679,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1051
+ google/gemma-2-2b-it:W4A16,task_mmlu_professional_law,acc,0.41134289439374183,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1052
+ google/gemma-2-2b-it:W4A16,task_mmlu_world_religions,acc,0.7134502923976608,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1053
+ google/gemma-2-2b-it:W4A16,task_mmlu_other,acc,0.618925008046347,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1054
+ google/gemma-2-2b-it:W4A16,task_mmlu_business_ethics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1055
+ google/gemma-2-2b-it:W4A16,task_mmlu_clinical_knowledge,acc,0.6,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1056
+ google/gemma-2-2b-it:W4A16,task_mmlu_college_medicine,acc,0.5838150289017341,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1057
+ google/gemma-2-2b-it:W4A16,task_mmlu_global_facts,acc,0.29,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1058
+ google/gemma-2-2b-it:W4A16,task_mmlu_human_aging,acc,0.5560538116591929,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1059
+ google/gemma-2-2b-it:W4A16,task_mmlu_management,acc,0.7961165048543689,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1060
+ google/gemma-2-2b-it:W4A16,task_mmlu_marketing,acc,0.7863247863247863,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1061
+ google/gemma-2-2b-it:W4A16,task_mmlu_medical_genetics,acc,0.61,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1062
+ google/gemma-2-2b-it:W4A16,task_mmlu_miscellaneous,acc,0.7535121328224776,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1063
+ google/gemma-2-2b-it:W4A16,task_mmlu_nutrition,acc,0.6437908496732027,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1064
+ google/gemma-2-2b-it:W4A16,task_mmlu_professional_accounting,acc,0.3971631205673759,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1065
+ google/gemma-2-2b-it:W4A16,task_mmlu_professional_medicine,acc,0.5625,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1066
+ google/gemma-2-2b-it:W4A16,task_mmlu_virology,acc,0.4879518072289157,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1067
+ google/gemma-2-2b-it:W4A16,task_mmlu_social_sciences,acc,0.6564835879103023,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1068
+ google/gemma-2-2b-it:W4A16,task_mmlu_econometrics,acc,0.3508771929824561,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1069
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_geography,acc,0.7373737373737373,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1070
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_government_and_politics,acc,0.772020725388601,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1071
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_macroeconomics,acc,0.5897435897435898,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1072
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_microeconomics,acc,0.5714285714285714,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1073
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_psychology,acc,0.8073394495412844,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1074
+ google/gemma-2-2b-it:W4A16,task_mmlu_human_sexuality,acc,0.6564885496183206,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1075
+ google/gemma-2-2b-it:W4A16,task_mmlu_professional_psychology,acc,0.5392156862745098,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1076
+ google/gemma-2-2b-it:W4A16,task_mmlu_public_relations,acc,0.6454545454545455,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1077
+ google/gemma-2-2b-it:W4A16,task_mmlu_security_studies,acc,0.6653061224489796,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1078
+ google/gemma-2-2b-it:W4A16,task_mmlu_sociology,acc,0.746268656716418,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1079
+ google/gemma-2-2b-it:W4A16,task_mmlu_us_foreign_policy,acc,0.79,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1080
+ google/gemma-2-2b-it:W4A16,task_mmlu_stem,acc,0.4865207738661592,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1081
+ google/gemma-2-2b-it:W4A16,task_mmlu_abstract_algebra,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1082
+ google/gemma-2-2b-it:W4A16,task_mmlu_anatomy,acc,0.5555555555555556,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1083
+ google/gemma-2-2b-it:W4A16,task_mmlu_astronomy,acc,0.5986842105263158,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1084
+ google/gemma-2-2b-it:W4A16,task_mmlu_college_biology,acc,0.6944444444444444,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1085
+ google/gemma-2-2b-it:W4A16,task_mmlu_college_chemistry,acc,0.44,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1086
+ google/gemma-2-2b-it:W4A16,task_mmlu_college_computer_science,acc,0.47,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1087
+ google/gemma-2-2b-it:W4A16,task_mmlu_college_mathematics,acc,0.37,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1088
+ google/gemma-2-2b-it:W4A16,task_mmlu_college_physics,acc,0.3137254901960784,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1089
+ google/gemma-2-2b-it:W4A16,task_mmlu_computer_security,acc,0.68,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1090
+ google/gemma-2-2b-it:W4A16,task_mmlu_conceptual_physics,acc,0.4297872340425532,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1091
+ google/gemma-2-2b-it:W4A16,task_mmlu_electrical_engineering,acc,0.5586206896551724,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1092
+ google/gemma-2-2b-it:W4A16,task_mmlu_elementary_mathematics,acc,0.42063492063492064,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1093
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_biology,acc,0.7322580645161291,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1094
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_chemistry,acc,0.4236453201970443,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1095
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_computer_science,acc,0.59,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1096
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_mathematics,acc,0.34814814814814815,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1097
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_physics,acc,0.31125827814569534,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1098
+ google/gemma-2-2b-it:W4A16,task_mmlu_high_school_statistics,acc,0.5,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1099
+ google/gemma-2-2b-it:W4A16,task_mmlu_machine_learning,acc,0.36607142857142855,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1100
+ google/gemma-2-2b-it:W4A16,task_openbookqa,acc,0.356,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1101
+ google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1102
+ google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1103
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc1,acc,0.34516523867809057,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1104
  google/gemma-2-2b-it:W4A16,task_truthfulqa_mc2,acc,0.513524194450901,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
1105
  google/gemma-2-2b-it:W4A16,task_mmlu,acc,0.5548354935194417,W4A16,espressor/google.gemma-2-2b-it_W4A16,3403550048
 
2708
  google/gemma-2-2b-it:W8A8_FP8,task_piqa,acc,0.7861806311207835,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2709
  google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3733170134638923,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2710
  google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.5289090993939894,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2711
+ google/gemma-2-2b-it:W8A8_FP8,task_boolq,acc,0.8388379204892966,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2712
+ google/gemma-2-2b-it:W8A8_FP8,task_logiqa,acc,0.2764976958525346,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2713
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu,acc,0.5704315624554906,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2714
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_humanities,acc,0.5092454835281616,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2715
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_formal_logic,acc,0.35714285714285715,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2716
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.7333333333333333,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2717
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.7450980392156863,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2718
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.759493670886076,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2719
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_international_law,acc,0.7107438016528925,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2720
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_jurisprudence,acc,0.6851851851851852,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2721
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.7361963190184049,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2722
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_moral_disputes,acc,0.6329479768786127,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2723
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.24916201117318434,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2724
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_philosophy,acc,0.6495176848874598,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2725
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_prehistory,acc,0.6141975308641975,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2726
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_law,acc,0.42633637548891784,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2727
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_world_religions,acc,0.7076023391812866,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2728
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_other,acc,0.6411329256517541,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2729
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_business_ethics,acc,0.52,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2730
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.6339622641509434,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2731
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_medicine,acc,0.6184971098265896,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2732
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_global_facts,acc,0.29,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2733
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_human_aging,acc,0.5964125560538116,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2734
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_management,acc,0.7864077669902912,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2735
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_marketing,acc,0.811965811965812,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2736
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_medical_genetics,acc,0.65,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2737
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_miscellaneous,acc,0.7675606641123882,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2738
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_nutrition,acc,0.6601307189542484,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2739
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_accounting,acc,0.425531914893617,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2740
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_medicine,acc,0.5661764705882353,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2741
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_virology,acc,0.5421686746987951,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2742
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_social_sciences,acc,0.6766330841728957,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2743
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_econometrics,acc,0.40350877192982454,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2744
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_geography,acc,0.7373737373737373,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2745
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.7927461139896373,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2746
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.6205128205128205,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2747
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.5756302521008403,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2748
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.8238532110091743,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2749
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_human_sexuality,acc,0.6870229007633588,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2750
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_professional_psychology,acc,0.5571895424836601,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2751
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_public_relations,acc,0.6727272727272727,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2752
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_security_studies,acc,0.689795918367347,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2753
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_sociology,acc,0.7860696517412935,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2754
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.77,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2755
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_stem,acc,0.48842372343799556,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2756
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.39,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2757
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_anatomy,acc,0.5333333333333333,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2758
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_astronomy,acc,0.5657894736842105,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2759
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_biology,acc,0.6875,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2760
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_chemistry,acc,0.45,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2761
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_computer_science,acc,0.44,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2762
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_mathematics,acc,0.37,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2763
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_college_physics,acc,0.35294117647058826,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2764
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_computer_security,acc,0.63,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2765
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.46382978723404256,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2766
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.5862068965517241,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2767
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.4126984126984127,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2768
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_biology,acc,0.7548387096774194,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2769
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.4433497536945813,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2770
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.6,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2771
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.362962962962963,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2772
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_physics,acc,0.2781456953642384,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2773
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.49074074074074076,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2774
+ google/gemma-2-2b-it:W8A8_FP8,task_mmlu_machine_learning,acc,0.3482142857142857,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2775
+ google/gemma-2-2b-it:W8A8_FP8,task_openbookqa,acc,0.36,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2776
+ google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc1,acc,0.3733170134638923,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2777
+ google/gemma-2-2b-it:W8A8_FP8,task_truthfulqa_mc2,acc,0.5289090993939894,W8A8_FP8,espressor/google.gemma-2-2b-it_W8A8_FP8,4385466880
2778
+ google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2779
+ google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2780
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu,acc,0.2457627118644068,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2781
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_humanities,acc,0.24187035069075452,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2782
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_formal_logic,acc,0.23015873015873015,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2783
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_european_history,acc,0.24848484848484848,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2784
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_us_history,acc,0.23529411764705882,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2785
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_world_history,acc,0.22362869198312235,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2786
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_international_law,acc,0.23140495867768596,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2787
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_jurisprudence,acc,0.3148148148148148,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2788
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_logical_fallacies,acc,0.2331288343558282,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2789
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_disputes,acc,0.2630057803468208,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2790
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_moral_scenarios,acc,0.23798882681564246,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2791
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_philosophy,acc,0.2379421221864952,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2792
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_prehistory,acc,0.23765432098765432,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2793
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_law,acc,0.2470664928292047,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2794
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_world_religions,acc,0.19298245614035087,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2795
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_other,acc,0.25523012552301255,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2796
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_business_ethics,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2797
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_clinical_knowledge,acc,0.26037735849056604,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2798
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_medicine,acc,0.2023121387283237,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2799
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_global_facts,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2800
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_aging,acc,0.34977578475336324,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2801
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_management,acc,0.2524271844660194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2802
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_marketing,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2803
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_medical_genetics,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2804
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_miscellaneous,acc,0.2707535121328225,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2805
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_nutrition,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2806
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_accounting,acc,0.19858156028368795,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2807
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_medicine,acc,0.22794117647058823,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2808
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_virology,acc,0.3373493975903614,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2809
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_social_sciences,acc,0.24731881702957426,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2810
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_econometrics,acc,0.22807017543859648,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2811
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_geography,acc,0.20707070707070707,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2812
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_government_and_politics,acc,0.22279792746113988,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2813
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_macroeconomics,acc,0.24358974358974358,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2814
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_microeconomics,acc,0.23949579831932774,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2815
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_psychology,acc,0.25321100917431194,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2816
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_human_sexuality,acc,0.22137404580152673,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2817
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_professional_psychology,acc,0.2679738562091503,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2818
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_public_relations,acc,0.32727272727272727,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2819
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_security_studies,acc,0.21224489795918366,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2820
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_sociology,acc,0.27860696517412936,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2821
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_us_foreign_policy,acc,0.24,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2822
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_stem,acc,0.2407231208372978,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2823
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_abstract_algebra,acc,0.25,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2824
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_anatomy,acc,0.1925925925925926,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2825
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_astronomy,acc,0.23026315789473684,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2826
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_biology,acc,0.2152777777777778,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2827
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_chemistry,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2828
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_computer_science,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2829
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_mathematics,acc,0.21,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2830
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_college_physics,acc,0.22549019607843138,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2831
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_computer_security,acc,0.23,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2832
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_conceptual_physics,acc,0.3148936170212766,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2833
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_electrical_engineering,acc,0.21379310344827587,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2834
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_elementary_mathematics,acc,0.24338624338624337,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2835
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_biology,acc,0.22903225806451613,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2836
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_chemistry,acc,0.2660098522167488,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2837
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_computer_science,acc,0.26,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2838
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_mathematics,acc,0.26666666666666666,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2839
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_physics,acc,0.2185430463576159,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2840
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2841
+ google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2842
+ google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2843
+ google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc1,acc,0.23378212974296206,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2844
+ google/gemma-2-2b-it:W8A8_int8,task_truthfulqa_mc2,acc,,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2845
  google/gemma-2-2b-it:W8A8_int8,task_openbookqa,acc,0.182,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2846
  google/gemma-2-2b-it:W8A8_int8,task_boolq,acc,0.44464831804281346,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2847
  google/gemma-2-2b-it:W8A8_int8,task_logiqa,acc,0.21351766513056836,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
 
2984
  google/gemma-2-2b-it:W8A8_int8,task_mmlu_high_school_statistics,acc,0.22685185185185186,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2985
  google/gemma-2-2b-it:W8A8_int8,task_mmlu_machine_learning,acc,0.25892857142857145,W8A8_int8,espressor/google.gemma-2-2b-it_W8A8_int8,4385466880
2986
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_boolq,acc,0.7804281345565749,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2987
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_logiqa,acc,0.250384024577573,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2988
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu,acc,0.5977068793619142,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2989
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_humanities,acc,0.5844845908607864,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2990
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_formal_logic,acc,0.3412698412698413,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2991
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_european_history,acc,0.7212121212121212,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2992
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_us_history,acc,0.7450980392156863,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2993
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_world_history,acc,0.7763713080168776,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2994
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_international_law,acc,0.743801652892562,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2995
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_jurisprudence,acc,0.6203703703703703,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2996
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_logical_fallacies,acc,0.7055214723926381,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2997
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_moral_disputes,acc,0.6416184971098265,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2998
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_moral_scenarios,acc,0.5698324022346368,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
2999
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_philosophy,acc,0.6720257234726688,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3000
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_prehistory,acc,0.6512345679012346,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3001
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_law,acc,0.4556714471968709,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3002
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_world_religions,acc,0.7543859649122807,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3003
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_other,acc,0.663018989378822,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3004
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_business_ethics,acc,0.58,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3005
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_clinical_knowledge,acc,0.6339622641509434,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3006
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_medicine,acc,0.5953757225433526,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3007
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_global_facts,acc,0.33,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3008
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_human_aging,acc,0.5695067264573991,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3009
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_management,acc,0.7572815533980582,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3010
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_marketing,acc,0.8803418803418803,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3011
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_medical_genetics,acc,0.71,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3012
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_miscellaneous,acc,0.7675606641123882,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3013
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_nutrition,acc,0.6633986928104575,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3014
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_accounting,acc,0.4645390070921986,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3015
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_medicine,acc,0.75,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3016
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_virology,acc,0.463855421686747,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3017
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_social_sciences,acc,0.6590835229119272,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3018
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_econometrics,acc,0.38596491228070173,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3019
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_geography,acc,0.7070707070707071,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3020
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_government_and_politics,acc,0.7461139896373057,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3021
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_macroeconomics,acc,0.5538461538461539,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3022
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_microeconomics,acc,0.592436974789916,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3023
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_psychology,acc,0.7651376146788991,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3024
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_human_sexuality,acc,0.6870229007633588,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3025
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_professional_psychology,acc,0.5931372549019608,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3026
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_public_relations,acc,0.6181818181818182,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3027
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_security_studies,acc,0.6571428571428571,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3028
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_sociology,acc,0.8059701492537313,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3029
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_us_foreign_policy,acc,0.82,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3030
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_stem,acc,0.4931810973675864,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3031
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_abstract_algebra,acc,0.29,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3032
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_anatomy,acc,0.5703703703703704,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3033
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_astronomy,acc,0.6776315789473685,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3034
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_biology,acc,0.7083333333333334,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3035
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_chemistry,acc,0.36,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3036
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_computer_science,acc,0.48,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3037
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_mathematics,acc,0.32,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3038
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_college_physics,acc,0.3431372549019608,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3039
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_computer_security,acc,0.7,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3040
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_conceptual_physics,acc,0.4978723404255319,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3041
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_electrical_engineering,acc,0.5862068965517241,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3042
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_elementary_mathematics,acc,0.3915343915343915,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3043
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_biology,acc,0.7064516129032258,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3044
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_chemistry,acc,0.5467980295566502,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3045
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_computer_science,acc,0.58,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3046
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_mathematics,acc,0.3333333333333333,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3047
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_physics,acc,0.36423841059602646,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3048
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_high_school_statistics,acc,0.3888888888888889,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3049
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_mmlu_machine_learning,acc,0.5,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3050
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_openbookqa,acc,0.278,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3051
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_truthfulqa_mc1,acc,0.31701346389228885,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3052
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_truthfulqa_mc2,acc,0.49237827622660857,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3053
+ meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_boolq,acc,0.7804281345565749,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3054
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_n_shot,acc,0.29292929292929293,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3055
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_diamond_zeroshot,acc,0.3181818181818182,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512
3056
  meta-llama/Llama-3.2-3B-Instruct:W8A8_FP8,task_gpqa_extended_n_shot,acc,0.29120879120879123,W8A8_FP8,espressor/meta-llama.Llama-3.2-3B-Instruct_W8A8_FP8,4396480512