open-r1-eval-leaderboard
/
eval_results
/mistralai
/Mixtral-8x22B-Instruct-v0.1
/main
/alpaca_eval
/results_2024-05-25T17-34-07.json
{ | |
"results":{ | |
"mistralai_Mixtral-8x22B-Instruct-v0.1_main":{ | |
"win_rate":23.0125264618, | |
"standard_error":1.2659746348, | |
"n_wins":180, | |
"n_wins_base":625, | |
"n_draws":0, | |
"n_total":805, | |
"discrete_win_rate":22.3602484472, | |
"mode":"community", | |
"avg_length":1466, | |
"length_controlled_winrate":30.574783441 | |
} | |
} | |
} |