|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.354, |
|
"acc_stderr": 0.015129868238451773 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.334, |
|
"acc_stderr": 0.014922019523732965 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.3525, |
|
"acc_stderr": 0.013797164918918355 |
|
}, |
|
"cb": { |
|
"acc": 0.5178571428571429, |
|
"acc_stderr": 0.06737697508644647, |
|
"f1": 0.34887334887334887 |
|
}, |
|
"copa": { |
|
"acc": 0.75, |
|
"acc_stderr": 0.04351941398892446 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.4297948615813583, |
|
"acc_stderr": 0.004940349676769321, |
|
"acc_norm": 0.5647281418044214, |
|
"acc_norm_stderr": 0.004947793051042662 |
|
}, |
|
"rte": { |
|
"acc": 0.5523465703971119, |
|
"acc_stderr": 0.029931070362939526 |
|
}, |
|
"winogrande": { |
|
"acc": 0.5611681136543015, |
|
"acc_stderr": 0.013946933444507032 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.6905398182789952, |
|
"acc_stderr": 0.010689956745189072 |
|
}, |
|
"boolq": { |
|
"acc": 0.6128440366972477, |
|
"acc_stderr": 0.008519429207594416 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.5867003367003367, |
|
"acc_stderr": 0.010104361780747513, |
|
"acc_norm": 0.5774410774410774, |
|
"acc_norm_stderr": 0.010135978222981075 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.24744027303754265, |
|
"acc_stderr": 0.012610352663292673, |
|
"acc_norm": 0.27559726962457337, |
|
"acc_norm_stderr": 0.013057169655761838 |
|
}, |
|
"sciq": { |
|
"acc": 0.901, |
|
"acc_stderr": 0.009449248027662732, |
|
"acc_norm": 0.912, |
|
"acc_norm_stderr": 0.008963053962592085 |
|
}, |
|
"piqa": { |
|
"acc": 0.733949945593036, |
|
"acc_stderr": 0.010310039263352831, |
|
"acc_norm": 0.7421109902067464, |
|
"acc_norm_stderr": 0.010206956662056232 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |