BenCzechMark / compare_significance.py
idolezal's picture
Reduce "compare_significance.py"
a03ea09
raw
history blame
249 Bytes
# Names of the supported metrics, one per task category.
# NOTE(review): presumably these are the metric keys looked up in submitted
# results; confirm against the code that consumes this list.
SUPPORTED_METRICS = [
    # classification tasks
    "avg_mcauroc",
    # QA tasks
    "exact_match",
    # multichoice tasks
    "acc",
    # summarization tasks
    "rouge_raw_r2_mid_f",
    # language modeling tasks
    "word_perplexity",
]