File size: 1,303 Bytes
be36629 cbf54c8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 |
# Corrected and cleaned data
# Per-dataset scores recorded under the name `gpt4`; every value lies in [0, 1].
# NOTE(review): the metric itself is not stated in this file — confirm with the
# producer of these numbers before labelling plots.
gpt4 = dict(
    b4bqa=0.94921875,
    medqa_og=0.9232804232804233,
    medqa_g2b=0.8994708994708994,
    medmcqa_og=0.9166666666666666,
    medmcqa_g2b=0.8879310344827587,
)
# Per-dataset scores recorded under the name `gpt4o`; every value lies in [0, 1].
# NOTE(review): metric not stated in this file — confirm before interpreting.
gpt4o = dict(
    b4bqa=0.96484375,
    medqa_og=0.9021164021164021,
    medqa_g2b=0.8835978835978836,
    medmcqa_og=0.9051724137931034,
    medmcqa_g2b=0.8649425287356322,
)
# Per-dataset scores recorded under the name `gpt35turbo`; every value lies in
# [0, 1]. NOTE(review): metric not stated in this file — confirm before
# interpreting.
#
# Keys are listed in the same order as the other model dicts in this file
# (b4bqa, medqa_og, medqa_g2b, medmcqa_og, medmcqa_g2b). Dicts preserve
# insertion order, so any code that walks `.values()` / `.items()` positionally
# now lines up with the sibling dicts. The key -> value mapping is unchanged.
gpt35turbo = {
    'b4bqa': 0.9174107142857143,
    'medqa_og': 0.9629629629629629,
    'medqa_g2b': 0.9603174603174603,
    'medmcqa_og': 0.9827586206896551,
    'medmcqa_g2b': 0.9770114942528736,
}
# Per-dataset scores recorded under the name `claude_opus`; every value lies in
# [0, 1]. NOTE(review): metric not stated in this file — confirm before
# interpreting.
claude_opus = dict(
    b4bqa=0.921875,
    medqa_og=0.8571428571428571,
    medqa_g2b=0.8333333333333334,
    medmcqa_og=0.8649425287356322,
    medmcqa_g2b=0.7988505747126436,
)
# Per-dataset scores recorded under the name `gemini_15_pro`; every value lies
# in [0, 1]. This dict has no 'b4bqa' entry, so lookups of that key will raise
# KeyError. NOTE(review): presumably no b4bqa result exists for this model —
# confirm; metric also not stated in this file.
gemini_15_pro = dict(
    medqa_og=0.8862433862433863,
    medqa_g2b=0.873015873015873,
    medmcqa_og=0.8649425287356322,
    medmcqa_g2b=0.8247126436781609,
)
# Per-dataset scores recorded under the name `gemini_pro_1`; every value lies
# in [0, 1]. This dict has no 'b4bqa' entry, so lookups of that key will raise
# KeyError. NOTE(review): presumably no b4bqa result exists for this model —
# confirm; metric also not stated in this file.
gemini_pro_1 = dict(
    medqa_og=0.7063492063492064,
    medqa_g2b=0.7301587301587301,
    medmcqa_og=0.6810344827586207,
    medmcqa_g2b=0.7385057471264368,
)
# Per-dataset scores recorded under the name `gemini_15_flash`; every value
# lies in [0, 1]. This dict has no 'b4bqa' entry, so lookups of that key will
# raise KeyError. NOTE(review): presumably no b4bqa result exists for this
# model — confirm; metric also not stated in this file.
gemini_15_flash = dict(
    medqa_og=0.9708994708994709,
    medqa_g2b=0.9603174603174603,
    medmcqa_og=0.9741379310344828,
    medmcqa_g2b=0.9482758620689655,
)
|