benchbench / cache /aggregate_scoress_cache_2d8c9f9c6d96807c68a9475184afcecb.csv
Yotam-Perlitz
revise cache
292d764
raw
history blame
26 kB
model,score
claude_3_5_sonnet_20240620,1.0
gpt_4o_20240513,1.0
calme_2.1_qwen2_72b,1.0
shopee_slimmoa_v1,1.0
calme_2.2_qwen2_72b,0.9970414201183432
blendax.ai_gm_l6_vo31,0.9947368421052631
magnum_72b_v1,0.9911242603550295
gemma_2_9b_it_wpo_hb,0.9894736842105263
gpt_4o_2024_05_13,0.984963768115942
blendax.ai_gm_l3_v35,0.9842105263157894
claude_3.5_sonnet,0.9830508474576272
calme_2.2_llama3_70b,0.9822485207100592
llama3_tenyxchat_70b,0.9763313609467456
openpipe_moa_gpt_4_turbo,0.9736842105263158
claude_3.5_sonnet_20240620,0.971830985915493
chatgpt_4o_latest,0.9710144927536232
rys_llama3_large_instruct,0.9704142011834319
text_davinci_002,0.9696969696969697
gpt_4o_2024_08_06,0.9677536231884059
qwen2_72b,0.9674556213017751
gemini_1.5_pro,0.9661016949152542
together_moa,0.9631578947368421
smaug_llama3_70b_instruct_32k,0.9615384615384616
rys_llama3_huge_instruct,0.9585798816568047
llama3_pbm_nova_70b,0.9578947368421052
zephyr_orpo_141b_a35b_v0.1,0.9526627218934911
storm_7b_best_of_64,0.9526315789473684
together_moa_lite,0.9473684210526315
llama3.1_instruct_turbo_405b,0.9436619718309859
09,0.9421052631578948
llama3.1_405b_instruct_turbo,0.9420289855072463
calme_2.4_llama3_70b,0.9408284023668639
gpt_4_turbo_2024_04_09,0.9399808331689967
cohere_command_beta_52.4b,0.9393939393939394
internlm2_5_20b_chat,0.9378698224852071
13,0.9368421052631579
dolphin_2.9.2_qwen2_72b,0.9349112426035503
multiverse_70b,0.9319526627218935
higgs_llama3_70b_v2,0.9315789473684211
llama3.1_instruct_turbo_70b,0.9295774647887324
barcenas_14b_phi_3_medium_orpo,0.9289940828402367
gemini_1.5_pro_exp_0827,0.927536231884058
sppo_gemma_2_9b_it_pairrm,0.9263157894736842
c4ai_command_r_plus,0.9260355029585798
text_davinci_003,0.9242424242424242
internlm2_5_7b_chat,0.9230769230769231
llama3_instruct_8b_wpo_hb_v2,0.9210526315789473
llama3_70b_shiningvaliant2,0.9201183431952663
qwen2_57b_a14b_instruct,0.9171597633136095
gpt_4o_mini,0.9166666666666666
20,0.9157894736842105
deepseek_v2_chat_0628_api,0.9152542372881356
qwen1.5_110b,0.9142011834319527
gpt_4_0125_preview,0.9115123229345778
yi_1.5_34b_chat_16k,0.908284023668639
18,0.9052631578947369
qwen2_instruct_72b,0.9014084507042254
gemini_1.5_pro_api_preview,0.9
storm_7b,0.9
blossom_v5.1_34b,0.8994082840236687
gemini_1.5_pro_exp_0801,0.8985507246376812
rys_phi_3_medium_4k_instruct,0.8964497041420119
gpt_4o_mini_20240718,0.8947368421052632
06,0.8947368421052632
configurable_llama3.1_8b_instruct,0.8905325443786982
infinity_instruct_7m_gen_llama3_1_70b,0.8894736842105263
mistral_large_2_2407,0.8873239436619719
llama3_70b,0.8867405617134761
chocolatine_3b_instruct_dpo_revised,0.8846153846153846
expo_+_llama3_instruct_8b_simpo,0.8842105263157894
claude_3_opus,0.8813559322033898
tnlg_v2_530b,0.8787878787878788
nous_hermes_2_mixtral_8x7b_dpo,0.8757396449704142
nanbeige_plus_chat_v0.1,0.8736842105263158
gemini_1.5_pro_001,0.8732394366197183
athene_70b,0.8649717514124293
gemini_1.5_flash,0.864406779661017
yi_1.5_34b_32k,0.863905325443787
aligner_2b+claude_3_opus,0.8631578947368421
barcenas_llama3_8b_orpo,0.8609467455621301
nanbeige2_16b_chat,0.8578947368421053
dracarys_llama3.1_70b_instruct,0.855072463768116
mistral_large_2407,0.8547101449275363
llama3.1_405b_instruct,0.8543859649122807
llama3.1_70b_instruct,0.8530727706841068
29,0.8526315789473684
llama3.1_70b,0.8520710059171598
yi_34bx2_moe_60b_dpo,0.8520710059171598
glm_4_0520,0.85
phi_3_mini_4k_instruct_cpo_simpo,0.849112426035503
llama30b,0.8484848484848485
infinity_instruct_7m_gen_mistral_7b,0.8473684210526315
dolphin_2.9.2_phi_3_medium,0.8461538461538461
mixtral_8x22b,0.8450704225352113
llama3_instruct_8b_simpo,0.8447991279975086
gritlm_8x7b_kto,0.8431952662721893
llama3.1_70b_instruct_turbo,0.8405797101449275
mixtral_8x22b_v0.3,0.8402366863905325
sppo_llama3_instruct_8b_pairrm,0.8368421052631579
anthropic_lm_v4_s3_52b,0.8333333333333334
yi_1.5_34b,0.8313609467455622
gpt_4_turbo_1106_preview,0.8309859154929577
deepseek_v2_coder_0614_api,0.8305084745762712
hermes_3_llama3.1_70b,0.8302246805591287
c4ai_command_r_v01,0.8284023668639053
arcee_spark,0.8254437869822485
yi_large,0.8234463276836159
gpt_4,0.8210526315789474
claude_3_opus_20240229,0.8195686194461455
humanish_rp_llama3.1_8b,0.8195266272189349
smaug_qwen2_72b_instruct,0.8186905068175971
palmyra_x_v3_72b,0.8169014084507042
qwen2_57b_a14b,0.8165680473372781
infinity_instruct_3m_0625_llama3_70b,0.8157894736842105
gemini_1.5_flash_exp_0827,0.8115942028985508
aligner_2b+qwen1.5_72b_chat,0.8105263157894737
blossom_v5.1_9b,0.8076923076923077
deepseek_coder_v2,0.8068840579710145
gemma_2_9b_it_dpo,0.8062444246208742
qwen2_72b_instruct,0.8060674423919884
aya_23_35b,0.8047337278106509
gemma_2_27b_it,0.8036174652870135
gemma_2_instruct_27b,0.8028169014084507
bagelmisterytour_v2_8x7b,0.8017751479289941
14,0.8
calme_2.1_phi3_4b,0.7988165680473372
yi_large_preview,0.7973418267559564
llama3_instruct_8b_cpo_simpo,0.7958579881656804
ein_70b_v0.1,0.7947368421052632
maid_yuzu_v7,0.7928994082840237
fsfairx_zephyr_chat_v0.1,0.7894736842105263
gemini_1.5_flash_001,0.7887323943661971
palmyra_x_43b,0.7878787878787878
notux_8x7b_v1,0.7869822485207101
mixtral_8x22b_v0.1,0.7855808159451885
gpt_4_0613,0.7855378648703817
llama3_70b_instruct,0.7843069749718884
llama3_cantonese_8b_instruct,0.7840236686390533
deepseek_chat_v2,0.782608695652174
openbuddy_llama3.1_8b_v22.2_131k,0.7810650887573964
nemotron_4_340b_inst,0.7796610169491526
infinity_instruct_7m_gen_llama3_1_8b,0.7789473684210526
roleplay_llama3_8b,0.7781065088757396
02,0.7736842105263158
qwen1.5_32b,0.7714601216768064
yi_1.5_34b_chat,0.7702354371537107
gpt_4o_mini_2024_07_18,0.7700499237132448
llama3_instruct_8b_sppo_iter2,0.7692307692307693
expo_+_sppo_mistral7b_pairrm,0.7684210526315789
configurable_yi_1.5_9b_chat,0.7662721893491125
phi_3.5_moe_instruct,0.7648572163622331
smaug_34b_v0.1,0.7633136094674556
merlinite_7b_aot,0.7631578947368421
palm_2_unicorn,0.7605633802816901
qwen2_7b,0.7603550295857988
falcon_instruct_40b,0.7575757575757576
gemma_2_27b,0.757396449704142
gemma_2_9b_it_simpo,0.7550089997835828
qwen1.5_110b_chat,0.7546031756778104
seallms_v3_7b_chat,0.7544378698224852
gemini_1.5_pro_api_0514,0.7536231884057971
infinity_instruct_3m_0613_llama3_70b,0.7526315789473684
samba_coe_v0.2_best_of_16,0.7526315789473684
qwen2_cantonese_7b_instruct,0.7514792899408284
glm_4_0116,0.75
hermes_3_llama3.1_8b,0.7485207100591716
qwen1.5_72b,0.7464788732394366
mistral_large_2,0.7457627118644068
luxia_21.4b_alignment_v1.2,0.7455621301775148
suzume_llama3_8b_multilingual_orpo_borda_top75,0.742603550295858
mpt_instruct_30b,0.7424242424242424
rebel_llama3_8b_instruct,0.7421052631578947
infinity_instruct_3m_0625_mistral_7b,0.7421052631578947
suzume_llama3_8b_multilingual_orpo_borda_top25,0.7396449704142012
nous_hermes_2_solar_10.7b,0.7366863905325444
calme_2.2_phi3_4b,0.7337278106508875
glm_4_air,0.7333333333333333
palmyra_x_v2_33b,0.7323943661971831
sppo_mistral7b_pairrm,0.7315789473684211
llama3_instruct_8b_sppo_iter3,0.7307692307692307
claude_3_sonnet,0.7288135593220338
calme_2.3_phi3_4b,0.727810650887574
mpt_30b,0.7272727272727273
snorkel_mistral_pairrm_dpo+best_of_16,0.7263157894736842
qwen1.5_32b_chat,0.725864216754905
k2_chat,0.7248520710059172
yi_1.5_9b_chat_16k,0.7218934911242604
contextual_ai_kto_mistral_pairrm,0.7210526315789474
luxia_21.4b_alignment_v1.0,0.7189349112426036
gemma_2_instruct_9b,0.7183098591549296
gpt_4_0314,0.7166666666666667
llama3_refueled,0.7159763313609467
pairrm_0.4b+yi_34b_chat_best_of_16,0.7157894736842105
openchat_3.5_1210,0.7130177514792899
dracarys_72b_instruct,0.7101449275362319
configurablebeagle_11b,0.7100591715976331
carbonbeagle_11b,0.7071005917159763
mixtral_8x22b_instruct_v0.1,0.7062215933453392
claude_2,0.7052631578947368
mistral_nemo_instruct_2407,0.7041420118343196
yi_34b,0.7027043920326694
llama_2_70b,0.7006139400505598
gemini_1.5_flash_api_preview,0.7
samba_coe_v0.2,0.7
openbuddy_mixtral_7bx8_v18.1_32k,0.6982248520710059
j1_grande_v2_beta_17b,0.696969696969697
vicuna_v1.3_13b,0.696969696969697
deepseek_llm_67b_chat,0.6954375583930239
chocolatine_8b_instruct_dpo_v1.0,0.6923076923076923
qwen1.5_chat_110b,0.6901408450704225
claude,0.6894736842105263
yi_1.5_9b,0.6893491124260355
openbuddy_llama3_8b_v21.2_32k,0.6863905325443787
internlm2.5_chat_7b,0.6842105263157895
rys_llama3_8b_instruct,0.6834319526627219
phi_3_small_128k_instruct,0.6830674899236772
cohere_command_beta_6.1b,0.6818181818181818
infinity_instruct_3m_0625_llama3_8b,0.6816879476798505
nous_hermes_2_mixtral_8x7b_sft,0.6804733727810651
expo_+_internlm2_chat_20b,0.6789473684210526
reka_core,0.6779661016949152
hermes_2_pro_mistral_7b,0.6775147928994083
hermes_2_pro_llama3_8b,0.6745562130177515
openchat_3.5,0.6715976331360947
expo_+_starling_lm_7b_beta,0.6684210526315789
cohere_xlarge_v20221108_52.4b,0.6666666666666666
gemini_1.5_flash_api_0514,0.6666666666666666
exaone_3.0_7.8b_instruct,0.665680473372781
phi_3_medium_4k_instruct,0.6641525884000801
expo_+_tulu_2_dpo_70b,0.6631578947368421
lion_llama3_8b_dpo_v1.0,0.6627218934911243
claude_v1.3,0.6619718309859155
openhermes_2_mistral_7b,0.6597633136094675
gemma_2_9b_it,0.6572979514989604
carbonbeagle_11b_truthy,0.6568047337278107
suzume_llama3_8b_multilingual_orpo_borda_half,0.6538461538461539
infinity_instruct_3m_0613_mistral_7b,0.6526315789473685
calm3_22b_chat,0.650887573964497
palm_2_bison,0.647887323943662
gemma_2_9b_it_sppo_iter2,0.6449704142011834
nanbeige2_8b_chat,0.6368421052631579
phi_3.5_mini_instruct,0.6364805762799074
vicuna_v1.3_7b,0.6363636363636364
nous_hermes_2_mistral_7b_dpo,0.636094674556213
mixtral_8x7b_32k_seqlen,0.6338028169014085
dolphin_2.9.2_qwen2_7b,0.6331360946745562
xwinlm_70b_v0.1,0.631578947368421
gemma_2_9b,0.6301775147928994
llama3.1_instruct_nsfw_pretrained_e1_plus_reddit,0.6272189349112426
gemini_pro,0.6263157894736842
gemma_2_9b_it_sppo_iter_1,0.621301775147929
opt_175b,0.6212121212121212
phi_3_14b,0.6197183098591549
lion_llama3_8b_sft_v1.0,0.6183431952662722
yi_1.5_9b_chat,0.6175945329173903
mistral_medium,0.6135964912280703
gemma_2_9b_it_sppo_iter_1_evol_1,0.6124260355029586
evo_v2_7b,0.6105263157894737
claude_3_haiku,0.6101694915254238
llama3_korean_bllossom_8b,0.6094674556213018
einstein_v6.1_llama3_8b,0.606508875739645
ghost_8b_beta_d0x5,0.6052631578947368
openbuddy_llama3_8b_v21.1_8k,0.6035502958579881
yi_34b_200k,0.6005917159763313
yi_34b_chat,0.6003789058444928
mixtral_8x7b_v0.1,0.5993148551853005
sauerkrautlm_una_solar_instruct,0.5976331360946746
mistral_v0.1_7b,0.5969910371318822
samba_coe_v0.1,0.5947368421052631
solar_10.7b_instruct_v1.0,0.5946745562130178
mistral_nemo_inst_12b,0.5932203389830508
yi_1.5_9b_32k,0.591715976331361
deepseek_llm_chat_67b,0.5915492957746479
llama_13b,0.5909090909090909
expo_+_internlm2_chat_7b,0.5894736842105263
suzume_llama3_8b_multilingual_orpo_borda_full,0.5887573964497042
llama3.1_8b_instruct,0.587304058963978
configurablehermes_7b,0.5857988165680473
phi_3_mini_4k_instruct,0.5842766486579196
infinity_instruct_3m_0625_qwen2_7b,0.5842105263157895
silicon_maid_7b,0.5798816568047337
pairrm_0.4b+tulu_2+dpo_70b_best_of_16,0.5789473684210527
gpt_3.5_turbo_0613,0.5787238583013231
phi_3_7b,0.5774647887323944
dolphin_2.9.3_mistral_7b_32k,0.5769230769230769
mistral_large,0.576271186440678
instructpalmyra_30b,0.5757575757575758
lion_llama3_8b_odpo_v1.0,0.5739644970414202
tulu_2+dpo_70b,0.5736842105263158
gritlm_7b_kto,0.5710059171597633
claude_3_sonnet_20240229,0.5707967612437912
openbuddy_zero_14b_v22.3_32k,0.5680473372781065
llama_65b,0.5679416887434222
recurrentgemma_9b_it,0.5650887573964497
claude_instant_1.2,0.5613417346182358
cohere_xlarge_v20220609_52.4b,0.5606060606060606
mistral_7b_remax_v0.1,0.5578947368421052
configurablesolar_10.7b,0.5562130177514792
einstein_v6.1_developed_by_weyaxi_llama3_8b,0.5562130177514792
qwen1.5_14b,0.5541711809317443
neuralbeagle14_7b,0.5532544378698225
infinity_instruct_3m_0625_yi_1.5_9b,0.5526315789473685
qwen1.5_72b_chat,0.5518426870418492
expo_+_starling_lm_7b_alpha,0.5473684210526316
jurassic_2_large_7.5b,0.5454545454545454
dbrx_instructruct,0.5450454204517043
notus_7b_v1,0.5443786982248521
lmcocktail_10.7b_v1,0.5421052631578948
dolphin_2.9_llama3_8b,0.5414201183431953
llama3_8b_instruct_gradient_1048k,0.5355029585798816
command_r_plus,0.5331641531824205
llama3.1_8b_fireplace2,0.5325443786982249
jurassic_2_jumbo_178b,0.5320102432778488
01,0.531578947368421
davinci_175b,0.5303030303030303
glm_4_9b,0.5295857988165681
xwinlm_13b_v0.1,0.5263157894736842
gpt_3.5_turbo_0301,0.5257575757575758
qwen1.5_14b_chat,0.5252984532336759
mistral_large_2402,0.5252364428114581
mistral_7b_openorca,0.5236686390532544
yi_9b,0.5207100591715976
qwen2_7b_instruct,0.5178342262482379
mistral_nemo_minitron_8b_base,0.5177514792899408
gpt_3.5,0.5157894736842106
llama_7b,0.5151515151515151
yi_9b_200k,0.5118343195266272
alphamonarch_7b,0.5118343195266272
neuralllama3_8b_orpo_v0.3,0.5088757396449705
magpie_8b_align_v0.1,0.5084745762711864
gpt_3.5_text_davinci_003,0.5070422535211268
decilm_7b_instruct,0.5059171597633136
claude_2.0,0.5028169014084507
expo_+_tulu_2_dpo_13b,0.5
wizardlm_70b,0.5
internlm2.5_20b_chat,0.5
mistral7b_pairrm_sppo_iter2,0.5
redpajama_incite_instruct_7b,0.5
llama3_8b_magpie_align_v0.3,0.4970414201183432
pairrm_0.4b+tulu_2+dpo_13b_best_of_16,0.49473684210526314
solar_10.7b_v1.0,0.4940828402366864
merlinite_7b,0.4911242603550296
claude_2.1,0.48860472778189606
einstein_v4_7b,0.4881656804733728
j1_jumbo_v1_178b,0.48484848484848486
conifer_7b_dpo,0.4842105263157895
dictalm2.0_instruct,0.4822485207100592
yi_1.5_6b,0.47928994082840237
evo_7b,0.4789473684210526
gemini_1.0_pro_002,0.4788732394366197
mistral_7b_v0.3,0.4786515104328869
glm_4_9b_chat,0.47836972835257335
phi_3_medium_128k_instruct,0.4782608695652174
llama3_8b_magpie_align_v0.1,0.47633136094674555
snorkel_mistral_pairrm_dpo,0.4758771929824561
claude_3_haiku_20240307,0.47490644349186906
llama3_inst_8b_simpo,0.4745762711864407
mistral7b_pairrm_sppo_iter3,0.47337278106508873
stablelm_2_12b_chat,0.47041420118343197
glm_130b,0.4696969696969697
humpback_llama2_70b,0.46842105263157896
aya_23_8b,0.46745562130177515
mistral_next,0.4666666666666667
llama3_neuralhercules_5.0_8b,0.46449704142011833
deita_7b_v1.0,0.4631578947368421
zephyr_7b_gemma_v0.1,0.46153846153846156
josiev4o_8b_stage1_v4,0.45857988165680474
openhermes_2.5_mistral_7b,0.45808701068338453
jinachat,0.45789473684210524
jurassic_2_grande_17b,0.45785317968416556
llama3_8b_instruct,0.45427998888105275
tempnet_llama2_chat_70b_v0.1,0.45263157894736844
dbrx_instruct,0.4508028545941124
go_bruins_v2,0.44970414201183434
llama_2_13b,0.44800618906794415
causallm_14b,0.4473684210526316
ennoai_pro_french_llama3_8b_v0.4,0.4437869822485207
pairrm_0.4b+zephyr_7b_beta_best_of_16,0.4421052631578947
mistral_7b_v0.2,0.44180940516972905
llama_pro_8b_instruct,0.4408284023668639
llama3_inst_8b_simpo_v0.2,0.4406779661016949
opt_66b,0.4393939393939394
mistral_nemo_base_2407,0.4378698224852071
phi_3_mini_128k_instruct,0.435111339793614
falcon_mamba_7b,0.4349112426035503
deepseek_coder_v2_lite_instruct,0.43478260869565216
dbrx_instructruct_preview,0.43333333333333335
decilm_7b,0.4319526627218935
orpollama3_8b,0.4289940828402367
qwen1.5_moe_a2.7b_chat,0.4260355029585799
bloom_176b,0.42424242424242425
llama3_inst_8b_simpo_expo,0.423728813559322
deepseek_llm_7b_chat,0.4230769230769231
phi_3_small_8k_instruct,0.42282608695652174
llama2_chat_70b,0.42105263157894735
mistral_orpo_beta,0.42105263157894735
k2,0.42011834319526625
mistral_7b_v0.1,0.4171597633136095
internlm2_20b_chat,0.4166666666666667
mistral_7b_v0.1_signtensors_1_over_2,0.41420118343195267
phi_2_instruct_v0.1,0.41124260355029585
openchat_v3.1_13b,0.4105263157894737
wizardlm_13b_v1.2,0.4105263157894737
gemma_7b,0.4094299524960413
j1_grande_v1_17b,0.4090909090909091
mistral_small_2402,0.4089610124515207
mistral_nemo_2402,0.4084507042253521
windyflollm,0.40828402366863903
selm_llama3_8b_inst_iter3,0.4067796610169492
open_mistral_nemo,0.4057971014492754
ultralm_13b_v2.0_best_of_16,0.4052631578947368
llama3_8b,0.404346195516293
falcon_40b,0.40117105718405827
internlm2_chat_20b,0.4
expo_+_zephyr_7b_beta,0.4
mistral_7b_v0.1_signtensors_7_over_16,0.3994082840236686
gpt_3.5_turbo_0125,0.39619258167526406
wizardlm_13b_v1.1,0.39473684210526316
mixtral_8x7b_instruct_v0.1,0.3943864275430021
arctic_instruct,0.39436619718309857
dclm_7b,0.39349112426035504
starling_lm_7b_alpha,0.3928821066472888
expo_+_zephyr_7b_alpha,0.3894736842105263
stablelm_2_12b,0.3875739644970414
hebrew_gemma_11b_instruct,0.38461538461538464
dolphin_2.2.1_mistral_7b,0.37894736842105264
falcon_11b,0.378698224852071
llama3.1_8b,0.378698224852071
llama3.1_8b_instruct_turbo,0.37681159420289856
mistral_7b_v0.1_signtensors_3_over_8,0.3757396449704142
humpback_llama_65b,0.3736842105263158
phi_3_medium_128k,0.3728813559322034
flan_flan-ul2,0.3698224852071006
openbudddy_llama2_70b_v10.1,0.3684210526315789
gpt_3.5_text_davinci_002,0.36619718309859156
recurrentgemma_9b,0.363905325443787
redpajama_incite_base_7b,0.36363636363636365
openbuddy_llama_65b_v8,0.3631578947368421
luminous_supreme_70b,0.36096884336320956
flan_t5_xxl,0.3609467455621302
qwen_14b_chat,0.35789473684210527
hermes_2_theta_llama3_8b,0.3559322033898305
ende_chat_0.0.7,0.35502958579881655
yi_1.5_6b_chat,0.35277832028672623
zephyr_7b_beta,0.35192176049419494
cohere_large_v20220720_13.1b,0.3484848484848485
gpt_4_adversarial,0.3473684210526316
cut_13b,0.3473684210526316
mistral_7b_instruct_v0.1,0.34615384615384615
starcoder2_15b,0.3431952662721893
openchat_v2_w_13b,0.34210526315789475
qwen1.5_moe_a2.7b,0.34023668639053256
starling_lm_7b_beta_expo,0.3389830508474576
hare1.0_beta,0.33727810650887574
zephyr_7b_alpha,0.3339531832754857
redpajama_incite_instruct_v1_3b,0.3333333333333333
expo_+_tulu_2_dpo_7b,0.33157894736842103
vicuna_13b_v1.5_together,0.33157894736842103
qwen1.5_7b,0.32900658388199017
lion_gemma_2b_sft_v1.0,0.32840236686390534
stablelm_zephyr_3b,0.32840236686390534
tulu_2+dpo_13b,0.3263157894736842
nxcode_cq_7b_orpo,0.3254437869822485
command,0.323943661971831
autotrain_llama3_orpo_v2,0.3224852071005917
selm_zephyr_7b_iter3,0.3220338983050847
ennoai_pro_llama3_8b,0.31952662721893493
text_curie_001,0.3181818181818182
mistral_7b_v0.1_signtensors_5_over_16,0.3165680473372781
claude2_alpaca_13b,0.3157894736842105
minotaur_13b,0.3157894736842105
internlm2_5_1_8b_chat,0.3136094674556213
mistral_v0.3_7b_orpo,0.3106508875739645
airoboros_65b,0.3105263157894737
yi_6b_200k,0.3076923076923077
llama_2_7b,0.30711229302778603
cohere_command,0.30526315789473685
reka_flash,0.3050847457627119
flan_t5_xl,0.3047337278106509
openbuddy_zero_3b_v21.2_32k,0.30177514792899407
lion_gemma_2b_dpo_v1.0,0.2988165680473373
llama3.1_instruct_turbo_8b,0.29577464788732394
xwinlm_7b_v0.1,0.29473684210526313
vicuna_13b_v1.3,0.29473684210526313
h2o_danube3_4b_chat,0.29289940828402367
lion_gemma_2b_odpo_v1.0,0.29289940828402367
airoboros_33b,0.2894736842105263
mistral_7b_instruct_v0.2,0.2888078325695241
gemma_2_2b_it,0.288135593220339
qwen1.5_4b,0.2869822485207101
llama_2_13b_chat,0.28402366863905326
vicuna_33b_v1.3,0.2833333333333333
vicuna_13b_v1.5,0.2789473684210526
platolm_7b,0.2789473684210526
yi_6b,0.2779398283190266
mathstral_7b_v0.1,0.2753623188405797
hare_1.1b_base_0.5v,0.27514792899408286
cohere_medium_v20221108_6.1b,0.2727272727272727
olmo_7b_instruct,0.27218934911242604
internlm2_chat_1_8b,0.2692307692307692
gemma_1.1_7b_it,0.2686190435354315
gemma_instruct_7b,0.26842105263157895
openchat_v2_13b,0.26842105263157895
mistral_7b_instruct_v0.3,0.2646714118286025
qwen2_1.5b,0.26331360946745563
deepseek_moe_16b_chat,0.2603550295857988
openbuddy_llama30b_v7.1,0.2578947368421053
redpajama_incite_base_v1_3b,0.25757575757575757
gemma_2_2b,0.257396449704142
flan_t5_large,0.25443786982248523
jamba_instruct,0.2535211267605634
command_r,0.25324162489058644
gpt_3.5_turbo_1106,0.25
stablelm_2_zephyr_1_6b,0.2485207100591716
luminous_extended_30b,0.24839948783610755
llama33b_oasst_sft,0.24736842105263157
ultralm_13b_best_of_16,0.24736842105263157
qwen1.5_1.8b,0.2455621301775148
jamba_v0.1,0.24260355029585798
tnlg_v2_6.7b,0.24242424242424243
wizardlm_13b,0.24210526315789474
alpaca_7b,0.24170653907496012
qwen1.5_7b_chat,0.23952847697682547
neo_7b_instruct_expo,0.23728813559322035
nous_hermes_13b,0.23684210526315788
btlm_7b_base_v0.2,0.23668639053254437
matter_0.2_7b_dpo,0.23372781065088757
starling_lm_7b_beta,0.23188405797101447
mistral_7b_v0.1_signtensors_1_over_4,0.22781065088757396
j1_large_v1_7.5b,0.22727272727272727
mistral_medium_2312,0.22535211267605634
stablelm_2_1_6b_chat,0.22485207100591717
qwen2_1.5b_instruct,0.2242517794357259
internlm2_1_8b,0.22189349112426035
tulu_2+dpo_7b,0.22105263157894736
vicuna_13b,0.22105263157894736
openbudddy_llama2_13b_v11.1,0.22105263157894736
yi_6b_chat,0.21996398250578852
starcoder2_7b,0.21893491124260356
gemini_1.0_pro,0.21666666666666667
deepseek_llm_7b_base,0.21597633136094674
ultralm_13b_v2.0,0.21578947368421053
gpt_neox_20b,0.21512461897077284
recurrentgemma_2b_it,0.21301775147928995
granite_7b_base,0.20710059171597633
davinci001,0.20526315789473684
openbuddy_falcon_40b_v9,0.20526315789473684
fox_1_1.6b,0.20414201183431951
starlinglm_7b_beta,0.2033898305084746
neo_7b_instruct,0.2033898305084746
deepseek_moe_16b_base,0.20118343195266272
qwen1.5_4b_chat,0.20043306748992368
snowflake_arctic_instruct,0.2
openchat_13b,0.2
gemma_2b,0.19822485207100593
phi_2,0.1970183187780268
stablelm_3b_4e1t,0.1952662721893491
tempnet_llama2_chat_13b_v0.1,0.19473684210526315
llama2_chat_13b,0.18947368421052632
gemma_2b_orpo,0.1893491124260355
gpt_j_6b,0.18742155280616818
guanaco_65b,0.18421052631578946
phi_1_5,0.1834319526627219
qwen2_0.5b,0.1834319526627219
curie_6.7b,0.18181818181818182
codegemma_1.1_2b,0.1804733727810651
opencoderplus_15b,0.17894736842105263
recurrentgemma_2b,0.17751479289940827
dolly_v1_6b,0.17455621301775148
llama33b_oasst_rlhf,0.1736842105263158
llama_2_70b_chat,0.17239717402690025
smollm_135m,0.17159763313609466
mixtral_8x7b_instruct,0.1694915254237288
openchat8192_13b,0.16842105263157894
falcon_40b_instruct,0.1673466209903457
falcon_instruct_7b,0.16666666666666666
phi_1_5_instruct_v0.1,0.16568047337278108
phi_2_dpo,0.1631578947368421
deepseek_v2_lite_chat,0.15942028985507245
pythia_12b,0.15913573605881298
minichat_1.5_3b,0.15789473684210525
gpt2,0.15680473372781065
starcoder2_3b,0.15680473372781065
olmo_1b,0.15384615384615385
falcon_7b,0.1522980450391068
cohere_medium_v20220720_6.1b,0.15151515151515152
smol_llama_220m_gqa,0.15088757396449703
gpt_neo_2.7b,0.14497041420118342
luminous_base_13b,0.14393939393939395
tulu_2_dpo_70b,0.14279661016949152
recycled_wizardlm_7b_v2.0,0.14210526315789473
llama2_chat_7b_evol70k_neft,0.14210526315789473
sheared_llama_2.7b,0.14201183431952663
gemma_7b_it,0.13967338615317756
flan_t5_base,0.1390532544378698
vicuna_7b_v1.3,0.1368421052631579
text_babbage_001,0.13636363636363635
opt_30b,0.13609467455621302
smollm_360m,0.13313609467455623
flan_t5_small,0.1301775147928994
vicuna_7b_v1.5,0.12704042715484365
mistral_instruct_v0.3_7b,0.1267605633802817
ultralm_13b,0.12631578947368421
alpaca_farm_ppo_sim_gpt_4_7b,0.12631578947368421
mpt_7b,0.1242603550295858
t0pp_11b,0.12121212121212122
baize_v2_13b,0.12105263157894737
reka_edge,0.11864406779661017
mistral_7b_instruct,0.11666666666666667
vicuna_7b_v1.5_16k,0.11594202898550725
gpt2_medium,0.11538461538461539
gemma_1.1_2b_it,0.1133629191321499
pythia_160m,0.11242603550295859
pythia_6.9b,0.11220190066343913
recycled_wizardlm_7b_v1.0,0.11052631578947368
ghost_7b_alpha,0.11052631578947368
phi_1,0.10650887573964497
alpaca_farm_ppo_human_7b,0.10526315789473684
internlm2_chat_7b,0.10526315789473684
sheared_llama_1.3b,0.10355029585798817
gpt2_large,0.10059171597633136
vicuna_7b,0.1
redpajama_incite_7b_base,0.09763313609467456
gemma_2b_it,0.09615384615384616
pythia_2.8b,0.09467455621301775
llama_2_7b_chat,0.09294228625332304
olmo_7b,0.0913617801483457
flan-ul2_20b,0.09090909090909091
phi_2_sft,0.08947368421052632
redpajama_incite_base_3b_v1,0.08875739644970414
smollm_1.7b,0.08875739644970414
qwen2_0.5b_instruct,0.08845725066460852
qwen1.5_1.8b_chat,0.08646696064404215
gpt_neo_1.3b,0.08579881656804733
dialogpt_medium,0.07988165680473373
opt_1.3b,0.07988165680473373
stablelm_2_1_6b,0.07692307692307693
t5_11b,0.07575757575757576
tempnet_llama2_chat_7b_v0.1,0.07368421052631578
minichat_3b,0.07368421052631578
guanaco_33b,0.07368421052631578
smollm_1.7b_instruct,0.07100591715976332
qwen1.5_0.5b,0.07100591715976332
pythia_410m,0.06804733727810651
babbage_1.3b,0.06060606060606061
gpt2_xl,0.05917159763313609
llama2_chat_7b,0.05789473684210526
gemma_instruct_2b,0.05789473684210526
command_light,0.056338028169014086
tinyllama_v1.1,0.05621301775147929
qwen1.5_0.5b_chat,0.05473372781065089
gpt_sw3_40b,0.05325443786982249
openbuddy_falcon_7b_v6,0.05263157894736842
hermes_2_mixtral_8x7b_dpo,0.05084745762711865
helpingai_15b,0.05029585798816568
tinyyi_7b_test,0.047337278106508875
cohere_small_v20220720_410m,0.045454545454545456
gpt_neo_125m,0.04437869822485207
falcon_7b_instruct,0.04422298349423855
bloom_3b,0.04142011834319527
smollm_135m_instruct,0.038461538461538464
chatglm2_6b,0.03684210526315789
baize_v2_7b,0.03684210526315789
llama_160m_chat_v1,0.03550295857988166
phi_3_mini_128k,0.03389830508474576
rhea_72b_v0.5,0.03254437869822485
pythia_12b_sft,0.031578947368421054
ada_350m,0.030303030303030304
bloom_1b7,0.029585798816568046
bloom_1b1,0.026627218934911243
smol_llama_101m_gqa,0.023668639053254437
pythia_12b_oasst_sft,0.021052631578947368
distilgpt2,0.020710059171597635
minueza_32m_ultrachat,0.01775147928994083
guanaco_13b,0.015789473684210527
text_ada_001,0.015151515151515152
pythia_410m_roberta_lr_8e7_kl_01_steps_12000_rlhf_model,0.014792899408284023
bloom_7b1,0.011834319526627219
guanaco_7b,0.010526315789473684
bloom_560m,0.008875739644970414
instructlm_500m,0.005917159763313609
hare_1.1b_base,0.0029585798816568047
yalm_100b,0.0
nucleus_22b_token_500b,0.0
baichuan_13b_chat,0.0