Spaces:
Running
Running
model,score | |
arx_0.3,1.0 | |
claude_3.5_sonnet,0.9876543209876543 | |
gpt_4o_2024_05_13,0.9814814814814814 | |
grok_2,0.9753086419753086 | |
gpt_4_0613,0.971830985915493 | |
claude_3.5_sonnet_20240620,0.971830985915493 | |
gpt_4_turbo_2024_04_09,0.9577464788732394 | |
grok_2_mini,0.9506172839506173 | |
llama3.1_instruct_turbo_405b,0.9436619718309859 | |
gemini_1.5_pro,0.9382716049382716 | |
llama3.1_instruct_turbo_70b,0.9295774647887324 | |
claude_3_opus,0.9259259259259259 | |
qwen2_72b_chat,0.9135802469135802 | |
qwen2_instruct_72b,0.9014084507042254 | |
magnum_72b_v1,0.9012345679012346 | |
gpt_4_turbo,0.8888888888888888 | |
mistral_large_2_2407,0.8873239436619719 | |
deepseek_coder_v2_instruct,0.8765432098765432 | |
gemini_1.5_pro_001,0.8732394366197183 | |
higgs_llama3_70b,0.8641975308641975 | |
gpt_4o_mini_2024_07_18,0.8591549295774648 | |
gpt_4o_mini,0.8518518518518519 | |
mixtral_8x22b,0.8450704225352113 | |
llama3.1_70b_instruct,0.8395061728395061 | |
gpt_4_turbo_1106_preview,0.8309859154929577 | |
llama3_70b,0.8281168492436097 | |
gemini_1.5_flash,0.8271604938271605 | |
palmyra_x_v3_72b,0.8169014084507042 | |
yi_large,0.8148148148148148 | |
gemma_2_instruct_27b,0.8028169014084507 | |
claude_3_sonnet,0.8024691358024691 | |
llama3_70b_instruct,0.7901234567901234 | |
gemini_1.5_flash_001,0.7887323943661971 | |
phi3_medium_4k,0.7777777777777778 | |
claude_3_opus_20240229,0.7746478873239436 | |
qwen2_72b_32k,0.7654320987654321 | |
palm_2_unicorn,0.7605633802816901 | |
deepseek_v2_chat,0.7530864197530864 | |
qwen1.5_72b,0.7464788732394366 | |
palmyra_x_v2_33b,0.7323943661971831 | |
qwen1.5_72b_chat,0.7283950617283951 | |
gemma_2_instruct_9b,0.7183098591549296 | |
llama3.1_70b,0.7160493827160493 | |
yi_1.5_34b_chat,0.7037037037037037 | |
gemma_2_9b_it,0.691358024691358 | |
qwen1.5_chat_110b,0.6901408450704225 | |
phi3_medium_128k,0.6790123456790124 | |
qwen1.5_32b,0.676056338028169 | |
mammoth2_8x7b_plus,0.6666666666666666 | |
claude_v1.3,0.6619718309859155 | |
qwen1.5_110b,0.654320987654321 | |
palm_2_bison,0.647887323943662 | |
glm_4_9b_chat,0.6419753086419753 | |
mixtral_8x7b_32k_seqlen,0.6338028169014085 | |
glm_4_9b,0.6296296296296297 | |
phi_3_14b,0.6197183098591549 | |
phi_3.5_mini_instruct,0.6172839506172839 | |
claude_2.0,0.6056338028169014 | |
qwen2_7b_instruct,0.6049382716049383 | |
yi_34b,0.5990262563032516 | |
yi_1.5_9b_chat,0.5925925925925926 | |
deepseek_llm_chat_67b,0.5915492957746479 | |
phi3_mini_4k,0.5802469135802469 | |
phi_3_7b,0.5774647887323944 | |
gemma_2_9b,0.5679012345679012 | |
mistral_nemo_instruct_2407,0.5555555555555556 | |
yi_large_preview,0.5492957746478874 | |
llama3.1_8b_instruct,0.5432098765432098 | |
command_r_plus,0.5352112676056338 | |
phi3_mini_128k,0.5308641975308642 | |
mammoth2_8b_plus,0.5185185185185185 | |
gpt_3.5_text_davinci_003,0.5070422535211268 | |
claude_2.1,0.5070422535211268 | |
mixtral_8x7b_instruct_v0.1,0.5061728395061729 | |
qwen1.5_14b,0.49295774647887325 | |
mathstral_7b_v0.1,0.48148148148148145 | |
gemini_1.0_pro_002,0.4788732394366197 | |
deepseek_coder_v2_lite_instruct,0.4691358024691358 | |
claude_instant_1.2,0.4647887323943662 | |
mixtral_8x7b_v0.1,0.4567901234567901 | |
llama_2_70b,0.4483568075117371 | |
llama3_8b_instruct,0.4444444444444444 | |
mammoth2_7b_plus,0.43209876543209874 | |
gpt_3.5_turbo_0613,0.4225352112676056 | |
claude_3_sonnet_20240229,0.4225352112676056 | |
qwen2_7b,0.41975308641975306 | |
mistral_nemo_2402,0.4084507042253521 | |
mistral_nemo_base_2407,0.4074074074074074 | |
wizardlm_2_8x22b,0.3950617283950617 | |
arctic_instruct,0.39436619718309857 | |
yi_1.5_6b_chat,0.38271604938271603 | |
qwen1.5_14b_chat,0.37037037037037035 | |
gpt_3.5_text_davinci_002,0.36619718309859156 | |
llama3_8b,0.3611545818118588 | |
llama_65b,0.352112676056338 | |
c4ai_command_r_v01,0.345679012345679 | |
staring_7b,0.345679012345679 | |
mistral_large_2402,0.3380281690140845 | |
command,0.323943661971831 | |
openchat_3.5_8b,0.32098765432098764 | |
command_r,0.30985915492957744 | |
internmath_20b_plus,0.30864197530864196 | |
gemma_7b,0.3003825421665797 | |
llama3_smaug_8b,0.2962962962962963 | |
llama3.1_instruct_turbo_8b,0.29577464788732394 | |
llama3.1_8b,0.2839506172839506 | |
mistral_small_2402,0.28169014084507044 | |
dbrx_instructruct,0.2676056338028169 | |
deepseekmath_7b_instruct,0.25925925925925924 | |
jamba_instruct,0.2535211267605634 | |
deepseek_coder_v2_lite_base,0.24691358024691357 | |
mistral_v0.1_7b,0.23943661971830985 | |
mistral_medium_2312,0.22535211267605634 | |
internmath_7b_plus,0.2222222222222222 | |
qwen1.5_7b,0.2112676056338028 | |
zephyr_7b_beta,0.20987654320987653 | |
mistral_7b_v0.1,0.19753086419753085 | |
claude_3_haiku_20240307,0.19718309859154928 | |
mistral_7b_instruct_v0.2,0.18518518518518517 | |
mistral_7b_v0.2,0.1728395061728395 | |
qwen1.5_7b_chat,0.16049382716049382 | |
jurassic_2_jumbo_178b,0.15492957746478872 | |
yi_6b,0.15327769083637627 | |
yi_6b_chat,0.14814814814814814 | |
falcon_40b,0.14084507042253522 | |
neo_7b_instruct,0.13580246913580246 | |
llama_2_13b,0.127716918796731 | |
mistral_instruct_v0.3_7b,0.1267605633802817 | |
jurassic_2_grande_17b,0.11267605633802817 | |
neo_7b,0.1111111111111111 | |
mistral_7b_instruct_v0.1,0.09876543209876543 | |
phi_2,0.09859154929577464 | |
llemma_7b,0.07407407407407407 | |
luminous_supreme_70b,0.07042253521126761 | |
qwen2_1.5b_instruct,0.06172839506172839 | |
llama_2_7b,0.06077203964527908 | |
command_light,0.056338028169014086 | |
qwen2_1.5b,0.04938271604938271 | |
luminous_extended_30b,0.04225352112676056 | |
falcon_7b,0.028169014084507043 | |
qwen2_0.5b_instruct,0.024691358024691357 | |
olmo_7b,0.014084507042253521 | |
gemma_2b,0.012345679012345678 | |
luminous_base_13b,0.0 | |
qwen2_0.5b,0.0 | |