open-r1-eval-leaderboard
/
eval_results
/mistralai
/Mixtral-8x22B-Instruct-v0.1
/main
/alpaca_eval
/results_2024-05-25T10-52-51.json
{ | |
"results":{ | |
"mistralai_Mixtral-8x22B-Instruct-v0.1_main":{ | |
"win_rate":22.8361861628, | |
"standard_error":1.2574032273, | |
"n_wins":174, | |
"n_wins_base":631, | |
"n_draws":0, | |
"n_total":805, | |
"discrete_win_rate":21.6149068323, | |
"mode":"community", | |
"avg_length":1466, | |
"length_controlled_winrate":30.0912200713 | |
} | |
} | |
} |