Yotam-Perlitz commited on
Commit
292d764
·
1 Parent(s): 1e20a46

revise cache

Browse files

Signed-off-by: Yotam-Perlitz <y.perlitz@ibm.com>

cache/aggregate_scoress_cache_1edd56d721757789836f081c38c15400.csv ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,score
2
+ arx_0.3,1.0
3
+ claude_3.5_sonnet,0.9876543209876543
4
+ grok_2,0.9753086419753086
5
+ gpt_4o_2024_05_13,0.9629629629629629
6
+ grok_2_mini,0.9506172839506173
7
+ gemini_1.5_pro,0.9382716049382716
8
+ claude_3_opus,0.9259259259259259
9
+ qwen2_72b_chat,0.9135802469135802
10
+ magnum_72b_v1,0.9012345679012346
11
+ gpt_4_turbo,0.8888888888888888
12
+ deepseek_coder_v2_instruct,0.8765432098765432
13
+ higgs_llama3_70b,0.8641975308641975
14
+ gpt_4o_mini,0.8518518518518519
15
+ llama3.1_70b_instruct,0.8395061728395061
16
+ gemini_1.5_flash,0.8271604938271605
17
+ yi_large,0.8148148148148148
18
+ claude_3_sonnet,0.8024691358024691
19
+ llama3_70b_instruct,0.7901234567901234
20
+ phi3_medium_4k,0.7777777777777778
21
+ qwen2_72b_32k,0.7654320987654321
22
+ deepseek_v2_chat,0.7530864197530864
23
+ llama3_70b,0.7407407407407407
24
+ qwen1.5_72b_chat,0.7283950617283951
25
+ llama3.1_70b,0.7160493827160493
26
+ yi_1.5_34b_chat,0.7037037037037037
27
+ gemma_2_9b_it,0.691358024691358
28
+ phi3_medium_128k,0.6790123456790124
29
+ mammoth2_8x7b_plus,0.6666666666666666
30
+ qwen1.5_110b,0.654320987654321
31
+ glm_4_9b_chat,0.6419753086419753
32
+ glm_4_9b,0.6296296296296297
33
+ phi_3.5_mini_instruct,0.6172839506172839
34
+ qwen2_7b_instruct,0.6049382716049383
35
+ yi_1.5_9b_chat,0.5925925925925926
36
+ phi3_mini_4k,0.5802469135802469
37
+ gemma_2_9b,0.5679012345679012
38
+ mistral_nemo_instruct_2407,0.5555555555555556
39
+ llama3.1_8b_instruct,0.5432098765432098
40
+ phi3_mini_128k,0.5308641975308642
41
+ mammoth2_8b_plus,0.5185185185185185
42
+ mixtral_8x7b_instruct_v0.1,0.5061728395061729
43
+ yi_34b,0.49382716049382713
44
+ mathstral_7b_v0.1,0.48148148148148145
45
+ deepseek_coder_v2_lite_instruct,0.4691358024691358
46
+ mixtral_8x7b_v0.1,0.4567901234567901
47
+ llama3_8b_instruct,0.4444444444444444
48
+ mammoth2_7b_plus,0.43209876543209874
49
+ qwen2_7b,0.41975308641975306
50
+ mistral_nemo_base_2407,0.4074074074074074
51
+ wizardlm_2_8x22b,0.3950617283950617
52
+ yi_1.5_6b_chat,0.38271604938271603
53
+ qwen1.5_14b_chat,0.37037037037037035
54
+ c4ai_command_r_v01,0.345679012345679
55
+ staring_7b,0.345679012345679
56
+ llama_2_70b,0.3333333333333333
57
+ openchat_3.5_8b,0.32098765432098764
58
+ internmath_20b_plus,0.30864197530864196
59
+ llama3_smaug_8b,0.2962962962962963
60
+ llama3.1_8b,0.2839506172839506
61
+ llama3_8b,0.2716049382716049
62
+ deepseekmath_7b_instruct,0.25925925925925924
63
+ deepseek_coder_v2_lite_base,0.24691358024691357
64
+ gemma_7b,0.2345679012345679
65
+ internmath_7b_plus,0.2222222222222222
66
+ zephyr_7b_beta,0.20987654320987653
67
+ mistral_7b_v0.1,0.19753086419753085
68
+ mistral_7b_instruct_v0.2,0.18518518518518517
69
+ mistral_7b_v0.2,0.1728395061728395
70
+ qwen1.5_7b_chat,0.16049382716049382
71
+ yi_6b_chat,0.14814814814814814
72
+ neo_7b_instruct,0.13580246913580246
73
+ yi_6b,0.12345679012345678
74
+ neo_7b,0.1111111111111111
75
+ mistral_7b_instruct_v0.1,0.09876543209876543
76
+ llama_2_13b,0.08641975308641975
77
+ llemma_7b,0.07407407407407407
78
+ qwen2_1.5b_instruct,0.06172839506172839
79
+ qwen2_1.5b,0.04938271604938271
80
+ llama_2_7b,0.037037037037037035
81
+ qwen2_0.5b_instruct,0.024691358024691357
82
+ gemma_2b,0.012345679012345678
83
+ qwen2_0.5b,0.0
cache/aggregate_scoress_cache_230b5a189df3af8cde801ce251b7b2ef.csv ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,score
2
+ claude_3_5_sonnet_20240620,1.0
3
+ gpt_4o_2024_08_06,0.9855072463768116
4
+ chatgpt_4o_latest,0.9710144927536232
5
+ gpt_4o_2024_05_13,0.9565217391304348
6
+ llama3.1_405b_instruct_turbo,0.9420289855072463
7
+ gemini_1.5_pro_exp_0827,0.927536231884058
8
+ gpt_4_turbo_2024_04_09,0.9130434782608695
9
+ gemini_1.5_pro_exp_0801,0.8985507246376812
10
+ claude_3_opus_20240229,0.8840579710144928
11
+ gpt_4_0125_preview,0.8695652173913043
12
+ dracarys_llama3.1_70b_instruct,0.855072463768116
13
+ llama3.1_70b_instruct_turbo,0.8405797101449275
14
+ mistral_large_2407,0.8260869565217391
15
+ gemini_1.5_flash_exp_0827,0.8115942028985508
16
+ deepseek_coder_v2,0.7971014492753623
17
+ deepseek_chat_v2,0.782608695652174
18
+ gpt_4_0613,0.7681159420289855
19
+ gemini_1.5_pro_api_0514,0.7536231884057971
20
+ gpt_4o_mini_2024_07_18,0.7391304347826086
21
+ gemma_2_27b_it,0.7246376811594203
22
+ dracarys_72b_instruct,0.7101449275362319
23
+ qwen2_72b_instruct,0.6956521739130435
24
+ hermes_3_llama3.1_70b,0.6811594202898551
25
+ gemini_1.5_flash_api_0514,0.6666666666666666
26
+ smaug_qwen2_72b_instruct,0.6521739130434783
27
+ mistral_large_2402,0.6376811594202898
28
+ claude_3_sonnet_20240229,0.6231884057971014
29
+ llama3_70b_instruct,0.6086956521739131
30
+ claude_3_haiku_20240307,0.5942028985507246
31
+ mixtral_8x22b_instruct_v0.1,0.5797101449275363
32
+ phi_3.5_moe_instruct,0.5652173913043478
33
+ gpt_3.5_turbo_0125,0.5507246376811594
34
+ mistral_small_2402,0.5362318840579711
35
+ command_r_plus,0.5217391304347826
36
+ gemma_2_9b_it,0.5072463768115942
37
+ phi_3_medium_4k_instruct,0.4927536231884058
38
+ phi_3_medium_128k_instruct,0.4782608695652174
39
+ phi_3_small_128k_instruct,0.463768115942029
40
+ qwen1.5_110b_chat,0.4492753623188406
41
+ deepseek_coder_v2_lite_instruct,0.43478260869565216
42
+ qwen1.5_72b_chat,0.42028985507246375
43
+ open_mistral_nemo,0.4057971014492754
44
+ phi_3.5_mini_instruct,0.391304347826087
45
+ llama3.1_8b_instruct_turbo,0.37681159420289856
46
+ phi_3_small_8k_instruct,0.36231884057971014
47
+ llama3_8b_instruct,0.34782608695652173
48
+ command_r,0.3333333333333333
49
+ qwen2_7b_instruct,0.3188405797101449
50
+ phi_3_mini_128k_instruct,0.30434782608695654
51
+ phi_3_mini_4k_instruct,0.2898550724637681
52
+ mathstral_7b_v0.1,0.2753623188405797
53
+ openhermes_2.5_mistral_7b,0.2608695652173913
54
+ mixtral_8x7b_instruct_v0.1,0.2463768115942029
55
+ mistral_7b_instruct_v0.3,0.2318840579710145
56
+ mistral_7b_instruct_v0.2,0.21739130434782608
57
+ gemma_1.1_7b_it,0.2028985507246377
58
+ zephyr_7b_alpha,0.18840579710144928
59
+ qwen1.5_7b_chat,0.17391304347826086
60
+ deepseek_v2_lite_chat,0.15942028985507245
61
+ zephyr_7b_beta,0.14492753623188406
62
+ starling_lm_7b_beta,0.13043478260869565
63
+ vicuna_7b_v1.5_16k,0.11594202898550725
64
+ vicuna_7b_v1.5,0.10144927536231885
65
+ llama_2_7b_chat,0.08695652173913043
66
+ qwen1.5_4b_chat,0.07246376811594203
67
+ qwen2_1.5b_instruct,0.057971014492753624
68
+ yi_6b_chat,0.043478260869565216
69
+ qwen2_0.5b_instruct,0.028985507246376812
70
+ qwen1.5_1.8b_chat,0.014492753623188406
71
+ qwen1.5_0.5b_chat,0.0
cache/aggregate_scoress_cache_2d8c9f9c6d96807c68a9475184afcecb.csv ADDED
@@ -0,0 +1,686 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,score
2
+ claude_3_5_sonnet_20240620,1.0
3
+ gpt_4o_20240513,1.0
4
+ calme_2.1_qwen2_72b,1.0
5
+ shopee_slimmoa_v1,1.0
6
+ calme_2.2_qwen2_72b,0.9970414201183432
7
+ blendax.ai_gm_l6_vo31,0.9947368421052631
8
+ magnum_72b_v1,0.9911242603550295
9
+ gemma_2_9b_it_wpo_hb,0.9894736842105263
10
+ gpt_4o_2024_05_13,0.984963768115942
11
+ blendax.ai_gm_l3_v35,0.9842105263157894
12
+ claude_3.5_sonnet,0.9830508474576272
13
+ calme_2.2_llama3_70b,0.9822485207100592
14
+ llama3_tenyxchat_70b,0.9763313609467456
15
+ openpipe_moa_gpt_4_turbo,0.9736842105263158
16
+ claude_3.5_sonnet_20240620,0.971830985915493
17
+ chatgpt_4o_latest,0.9710144927536232
18
+ rys_llama3_large_instruct,0.9704142011834319
19
+ text_davinci_002,0.9696969696969697
20
+ gpt_4o_2024_08_06,0.9677536231884059
21
+ qwen2_72b,0.9674556213017751
22
+ gemini_1.5_pro,0.9661016949152542
23
+ together_moa,0.9631578947368421
24
+ smaug_llama3_70b_instruct_32k,0.9615384615384616
25
+ rys_llama3_huge_instruct,0.9585798816568047
26
+ llama3_pbm_nova_70b,0.9578947368421052
27
+ zephyr_orpo_141b_a35b_v0.1,0.9526627218934911
28
+ storm_7b_best_of_64,0.9526315789473684
29
+ together_moa_lite,0.9473684210526315
30
+ llama3.1_instruct_turbo_405b,0.9436619718309859
31
+ 09,0.9421052631578948
32
+ llama3.1_405b_instruct_turbo,0.9420289855072463
33
+ calme_2.4_llama3_70b,0.9408284023668639
34
+ gpt_4_turbo_2024_04_09,0.9399808331689967
35
+ cohere_command_beta_52.4b,0.9393939393939394
36
+ internlm2_5_20b_chat,0.9378698224852071
37
+ 13,0.9368421052631579
38
+ dolphin_2.9.2_qwen2_72b,0.9349112426035503
39
+ multiverse_70b,0.9319526627218935
40
+ higgs_llama3_70b_v2,0.9315789473684211
41
+ llama3.1_instruct_turbo_70b,0.9295774647887324
42
+ barcenas_14b_phi_3_medium_orpo,0.9289940828402367
43
+ gemini_1.5_pro_exp_0827,0.927536231884058
44
+ sppo_gemma_2_9b_it_pairrm,0.9263157894736842
45
+ c4ai_command_r_plus,0.9260355029585798
46
+ text_davinci_003,0.9242424242424242
47
+ internlm2_5_7b_chat,0.9230769230769231
48
+ llama3_instruct_8b_wpo_hb_v2,0.9210526315789473
49
+ llama3_70b_shiningvaliant2,0.9201183431952663
50
+ qwen2_57b_a14b_instruct,0.9171597633136095
51
+ gpt_4o_mini,0.9166666666666666
52
+ 20,0.9157894736842105
53
+ deepseek_v2_chat_0628_api,0.9152542372881356
54
+ qwen1.5_110b,0.9142011834319527
55
+ gpt_4_0125_preview,0.9115123229345778
56
+ yi_1.5_34b_chat_16k,0.908284023668639
57
+ 18,0.9052631578947369
58
+ qwen2_instruct_72b,0.9014084507042254
59
+ gemini_1.5_pro_api_preview,0.9
60
+ storm_7b,0.9
61
+ blossom_v5.1_34b,0.8994082840236687
62
+ gemini_1.5_pro_exp_0801,0.8985507246376812
63
+ rys_phi_3_medium_4k_instruct,0.8964497041420119
64
+ gpt_4o_mini_20240718,0.8947368421052632
65
+ 06,0.8947368421052632
66
+ configurable_llama3.1_8b_instruct,0.8905325443786982
67
+ infinity_instruct_7m_gen_llama3_1_70b,0.8894736842105263
68
+ mistral_large_2_2407,0.8873239436619719
69
+ llama3_70b,0.8867405617134761
70
+ chocolatine_3b_instruct_dpo_revised,0.8846153846153846
71
+ expo_+_llama3_instruct_8b_simpo,0.8842105263157894
72
+ claude_3_opus,0.8813559322033898
73
+ tnlg_v2_530b,0.8787878787878788
74
+ nous_hermes_2_mixtral_8x7b_dpo,0.8757396449704142
75
+ nanbeige_plus_chat_v0.1,0.8736842105263158
76
+ gemini_1.5_pro_001,0.8732394366197183
77
+ athene_70b,0.8649717514124293
78
+ gemini_1.5_flash,0.864406779661017
79
+ yi_1.5_34b_32k,0.863905325443787
80
+ aligner_2b+claude_3_opus,0.8631578947368421
81
+ barcenas_llama3_8b_orpo,0.8609467455621301
82
+ nanbeige2_16b_chat,0.8578947368421053
83
+ dracarys_llama3.1_70b_instruct,0.855072463768116
84
+ mistral_large_2407,0.8547101449275363
85
+ llama3.1_405b_instruct,0.8543859649122807
86
+ llama3.1_70b_instruct,0.8530727706841068
87
+ 29,0.8526315789473684
88
+ llama3.1_70b,0.8520710059171598
89
+ yi_34bx2_moe_60b_dpo,0.8520710059171598
90
+ glm_4_0520,0.85
91
+ phi_3_mini_4k_instruct_cpo_simpo,0.849112426035503
92
+ llama30b,0.8484848484848485
93
+ infinity_instruct_7m_gen_mistral_7b,0.8473684210526315
94
+ dolphin_2.9.2_phi_3_medium,0.8461538461538461
95
+ mixtral_8x22b,0.8450704225352113
96
+ llama3_instruct_8b_simpo,0.8447991279975086
97
+ gritlm_8x7b_kto,0.8431952662721893
98
+ llama3.1_70b_instruct_turbo,0.8405797101449275
99
+ mixtral_8x22b_v0.3,0.8402366863905325
100
+ sppo_llama3_instruct_8b_pairrm,0.8368421052631579
101
+ anthropic_lm_v4_s3_52b,0.8333333333333334
102
+ yi_1.5_34b,0.8313609467455622
103
+ gpt_4_turbo_1106_preview,0.8309859154929577
104
+ deepseek_v2_coder_0614_api,0.8305084745762712
105
+ hermes_3_llama3.1_70b,0.8302246805591287
106
+ c4ai_command_r_v01,0.8284023668639053
107
+ arcee_spark,0.8254437869822485
108
+ yi_large,0.8234463276836159
109
+ gpt_4,0.8210526315789474
110
+ claude_3_opus_20240229,0.8195686194461455
111
+ humanish_rp_llama3.1_8b,0.8195266272189349
112
+ smaug_qwen2_72b_instruct,0.8186905068175971
113
+ palmyra_x_v3_72b,0.8169014084507042
114
+ qwen2_57b_a14b,0.8165680473372781
115
+ infinity_instruct_3m_0625_llama3_70b,0.8157894736842105
116
+ gemini_1.5_flash_exp_0827,0.8115942028985508
117
+ aligner_2b+qwen1.5_72b_chat,0.8105263157894737
118
+ blossom_v5.1_9b,0.8076923076923077
119
+ deepseek_coder_v2,0.8068840579710145
120
+ gemma_2_9b_it_dpo,0.8062444246208742
121
+ qwen2_72b_instruct,0.8060674423919884
122
+ aya_23_35b,0.8047337278106509
123
+ gemma_2_27b_it,0.8036174652870135
124
+ gemma_2_instruct_27b,0.8028169014084507
125
+ bagelmisterytour_v2_8x7b,0.8017751479289941
126
+ 14,0.8
127
+ calme_2.1_phi3_4b,0.7988165680473372
128
+ yi_large_preview,0.7973418267559564
129
+ llama3_instruct_8b_cpo_simpo,0.7958579881656804
130
+ ein_70b_v0.1,0.7947368421052632
131
+ maid_yuzu_v7,0.7928994082840237
132
+ fsfairx_zephyr_chat_v0.1,0.7894736842105263
133
+ gemini_1.5_flash_001,0.7887323943661971
134
+ palmyra_x_43b,0.7878787878787878
135
+ notux_8x7b_v1,0.7869822485207101
136
+ mixtral_8x22b_v0.1,0.7855808159451885
137
+ gpt_4_0613,0.7855378648703817
138
+ llama3_70b_instruct,0.7843069749718884
139
+ llama3_cantonese_8b_instruct,0.7840236686390533
140
+ deepseek_chat_v2,0.782608695652174
141
+ openbuddy_llama3.1_8b_v22.2_131k,0.7810650887573964
142
+ nemotron_4_340b_inst,0.7796610169491526
143
+ infinity_instruct_7m_gen_llama3_1_8b,0.7789473684210526
144
+ roleplay_llama3_8b,0.7781065088757396
145
+ 02,0.7736842105263158
146
+ qwen1.5_32b,0.7714601216768064
147
+ yi_1.5_34b_chat,0.7702354371537107
148
+ gpt_4o_mini_2024_07_18,0.7700499237132448
149
+ llama3_instruct_8b_sppo_iter2,0.7692307692307693
150
+ expo_+_sppo_mistral7b_pairrm,0.7684210526315789
151
+ configurable_yi_1.5_9b_chat,0.7662721893491125
152
+ phi_3.5_moe_instruct,0.7648572163622331
153
+ smaug_34b_v0.1,0.7633136094674556
154
+ merlinite_7b_aot,0.7631578947368421
155
+ palm_2_unicorn,0.7605633802816901
156
+ qwen2_7b,0.7603550295857988
157
+ falcon_instruct_40b,0.7575757575757576
158
+ gemma_2_27b,0.757396449704142
159
+ gemma_2_9b_it_simpo,0.7550089997835828
160
+ qwen1.5_110b_chat,0.7546031756778104
161
+ seallms_v3_7b_chat,0.7544378698224852
162
+ gemini_1.5_pro_api_0514,0.7536231884057971
163
+ infinity_instruct_3m_0613_llama3_70b,0.7526315789473684
164
+ samba_coe_v0.2_best_of_16,0.7526315789473684
165
+ qwen2_cantonese_7b_instruct,0.7514792899408284
166
+ glm_4_0116,0.75
167
+ hermes_3_llama3.1_8b,0.7485207100591716
168
+ qwen1.5_72b,0.7464788732394366
169
+ mistral_large_2,0.7457627118644068
170
+ luxia_21.4b_alignment_v1.2,0.7455621301775148
171
+ suzume_llama3_8b_multilingual_orpo_borda_top75,0.742603550295858
172
+ mpt_instruct_30b,0.7424242424242424
173
+ rebel_llama3_8b_instruct,0.7421052631578947
174
+ infinity_instruct_3m_0625_mistral_7b,0.7421052631578947
175
+ suzume_llama3_8b_multilingual_orpo_borda_top25,0.7396449704142012
176
+ nous_hermes_2_solar_10.7b,0.7366863905325444
177
+ calme_2.2_phi3_4b,0.7337278106508875
178
+ glm_4_air,0.7333333333333333
179
+ palmyra_x_v2_33b,0.7323943661971831
180
+ sppo_mistral7b_pairrm,0.7315789473684211
181
+ llama3_instruct_8b_sppo_iter3,0.7307692307692307
182
+ claude_3_sonnet,0.7288135593220338
183
+ calme_2.3_phi3_4b,0.727810650887574
184
+ mpt_30b,0.7272727272727273
185
+ snorkel_mistral_pairrm_dpo+best_of_16,0.7263157894736842
186
+ qwen1.5_32b_chat,0.725864216754905
187
+ k2_chat,0.7248520710059172
188
+ yi_1.5_9b_chat_16k,0.7218934911242604
189
+ contextual_ai_kto_mistral_pairrm,0.7210526315789474
190
+ luxia_21.4b_alignment_v1.0,0.7189349112426036
191
+ gemma_2_instruct_9b,0.7183098591549296
192
+ gpt_4_0314,0.7166666666666667
193
+ llama3_refueled,0.7159763313609467
194
+ pairrm_0.4b+yi_34b_chat_best_of_16,0.7157894736842105
195
+ openchat_3.5_1210,0.7130177514792899
196
+ dracarys_72b_instruct,0.7101449275362319
197
+ configurablebeagle_11b,0.7100591715976331
198
+ carbonbeagle_11b,0.7071005917159763
199
+ mixtral_8x22b_instruct_v0.1,0.7062215933453392
200
+ claude_2,0.7052631578947368
201
+ mistral_nemo_instruct_2407,0.7041420118343196
202
+ yi_34b,0.7027043920326694
203
+ llama_2_70b,0.7006139400505598
204
+ gemini_1.5_flash_api_preview,0.7
205
+ samba_coe_v0.2,0.7
206
+ openbuddy_mixtral_7bx8_v18.1_32k,0.6982248520710059
207
+ j1_grande_v2_beta_17b,0.696969696969697
208
+ vicuna_v1.3_13b,0.696969696969697
209
+ deepseek_llm_67b_chat,0.6954375583930239
210
+ chocolatine_8b_instruct_dpo_v1.0,0.6923076923076923
211
+ qwen1.5_chat_110b,0.6901408450704225
212
+ claude,0.6894736842105263
213
+ yi_1.5_9b,0.6893491124260355
214
+ openbuddy_llama3_8b_v21.2_32k,0.6863905325443787
215
+ internlm2.5_chat_7b,0.6842105263157895
216
+ rys_llama3_8b_instruct,0.6834319526627219
217
+ phi_3_small_128k_instruct,0.6830674899236772
218
+ cohere_command_beta_6.1b,0.6818181818181818
219
+ infinity_instruct_3m_0625_llama3_8b,0.6816879476798505
220
+ nous_hermes_2_mixtral_8x7b_sft,0.6804733727810651
221
+ expo_+_internlm2_chat_20b,0.6789473684210526
222
+ reka_core,0.6779661016949152
223
+ hermes_2_pro_mistral_7b,0.6775147928994083
224
+ hermes_2_pro_llama3_8b,0.6745562130177515
225
+ openchat_3.5,0.6715976331360947
226
+ expo_+_starling_lm_7b_beta,0.6684210526315789
227
+ cohere_xlarge_v20221108_52.4b,0.6666666666666666
228
+ gemini_1.5_flash_api_0514,0.6666666666666666
229
+ exaone_3.0_7.8b_instruct,0.665680473372781
230
+ phi_3_medium_4k_instruct,0.6641525884000801
231
+ expo_+_tulu_2_dpo_70b,0.6631578947368421
232
+ lion_llama3_8b_dpo_v1.0,0.6627218934911243
233
+ claude_v1.3,0.6619718309859155
234
+ openhermes_2_mistral_7b,0.6597633136094675
235
+ gemma_2_9b_it,0.6572979514989604
236
+ carbonbeagle_11b_truthy,0.6568047337278107
237
+ suzume_llama3_8b_multilingual_orpo_borda_half,0.6538461538461539
238
+ infinity_instruct_3m_0613_mistral_7b,0.6526315789473685
239
+ calm3_22b_chat,0.650887573964497
240
+ palm_2_bison,0.647887323943662
241
+ gemma_2_9b_it_sppo_iter2,0.6449704142011834
242
+ nanbeige2_8b_chat,0.6368421052631579
243
+ phi_3.5_mini_instruct,0.6364805762799074
244
+ vicuna_v1.3_7b,0.6363636363636364
245
+ nous_hermes_2_mistral_7b_dpo,0.636094674556213
246
+ mixtral_8x7b_32k_seqlen,0.6338028169014085
247
+ dolphin_2.9.2_qwen2_7b,0.6331360946745562
248
+ xwinlm_70b_v0.1,0.631578947368421
249
+ gemma_2_9b,0.6301775147928994
250
+ llama3.1_instruct_nsfw_pretrained_e1_plus_reddit,0.6272189349112426
251
+ gemini_pro,0.6263157894736842
252
+ gemma_2_9b_it_sppo_iter_1,0.621301775147929
253
+ opt_175b,0.6212121212121212
254
+ phi_3_14b,0.6197183098591549
255
+ lion_llama3_8b_sft_v1.0,0.6183431952662722
256
+ yi_1.5_9b_chat,0.6175945329173903
257
+ mistral_medium,0.6135964912280703
258
+ gemma_2_9b_it_sppo_iter_1_evol_1,0.6124260355029586
259
+ evo_v2_7b,0.6105263157894737
260
+ claude_3_haiku,0.6101694915254238
261
+ llama3_korean_bllossom_8b,0.6094674556213018
262
+ einstein_v6.1_llama3_8b,0.606508875739645
263
+ ghost_8b_beta_d0x5,0.6052631578947368
264
+ openbuddy_llama3_8b_v21.1_8k,0.6035502958579881
265
+ yi_34b_200k,0.6005917159763313
266
+ yi_34b_chat,0.6003789058444928
267
+ mixtral_8x7b_v0.1,0.5993148551853005
268
+ sauerkrautlm_una_solar_instruct,0.5976331360946746
269
+ mistral_v0.1_7b,0.5969910371318822
270
+ samba_coe_v0.1,0.5947368421052631
271
+ solar_10.7b_instruct_v1.0,0.5946745562130178
272
+ mistral_nemo_inst_12b,0.5932203389830508
273
+ yi_1.5_9b_32k,0.591715976331361
274
+ deepseek_llm_chat_67b,0.5915492957746479
275
+ llama_13b,0.5909090909090909
276
+ expo_+_internlm2_chat_7b,0.5894736842105263
277
+ suzume_llama3_8b_multilingual_orpo_borda_full,0.5887573964497042
278
+ llama3.1_8b_instruct,0.587304058963978
279
+ configurablehermes_7b,0.5857988165680473
280
+ phi_3_mini_4k_instruct,0.5842766486579196
281
+ infinity_instruct_3m_0625_qwen2_7b,0.5842105263157895
282
+ silicon_maid_7b,0.5798816568047337
283
+ pairrm_0.4b+tulu_2+dpo_70b_best_of_16,0.5789473684210527
284
+ gpt_3.5_turbo_0613,0.5787238583013231
285
+ phi_3_7b,0.5774647887323944
286
+ dolphin_2.9.3_mistral_7b_32k,0.5769230769230769
287
+ mistral_large,0.576271186440678
288
+ instructpalmyra_30b,0.5757575757575758
289
+ lion_llama3_8b_odpo_v1.0,0.5739644970414202
290
+ tulu_2+dpo_70b,0.5736842105263158
291
+ gritlm_7b_kto,0.5710059171597633
292
+ claude_3_sonnet_20240229,0.5707967612437912
293
+ openbuddy_zero_14b_v22.3_32k,0.5680473372781065
294
+ llama_65b,0.5679416887434222
295
+ recurrentgemma_9b_it,0.5650887573964497
296
+ claude_instant_1.2,0.5613417346182358
297
+ cohere_xlarge_v20220609_52.4b,0.5606060606060606
298
+ mistral_7b_remax_v0.1,0.5578947368421052
299
+ configurablesolar_10.7b,0.5562130177514792
300
+ einstein_v6.1_developed_by_weyaxi_llama3_8b,0.5562130177514792
301
+ qwen1.5_14b,0.5541711809317443
302
+ neuralbeagle14_7b,0.5532544378698225
303
+ infinity_instruct_3m_0625_yi_1.5_9b,0.5526315789473685
304
+ qwen1.5_72b_chat,0.5518426870418492
305
+ expo_+_starling_lm_7b_alpha,0.5473684210526316
306
+ jurassic_2_large_7.5b,0.5454545454545454
307
+ dbrx_instructruct,0.5450454204517043
308
+ notus_7b_v1,0.5443786982248521
309
+ lmcocktail_10.7b_v1,0.5421052631578948
310
+ dolphin_2.9_llama3_8b,0.5414201183431953
311
+ llama3_8b_instruct_gradient_1048k,0.5355029585798816
312
+ command_r_plus,0.5331641531824205
313
+ llama3.1_8b_fireplace2,0.5325443786982249
314
+ jurassic_2_jumbo_178b,0.5320102432778488
315
+ 01,0.531578947368421
316
+ davinci_175b,0.5303030303030303
317
+ glm_4_9b,0.5295857988165681
318
+ xwinlm_13b_v0.1,0.5263157894736842
319
+ gpt_3.5_turbo_0301,0.5257575757575758
320
+ qwen1.5_14b_chat,0.5252984532336759
321
+ mistral_large_2402,0.5252364428114581
322
+ mistral_7b_openorca,0.5236686390532544
323
+ yi_9b,0.5207100591715976
324
+ qwen2_7b_instruct,0.5178342262482379
325
+ mistral_nemo_minitron_8b_base,0.5177514792899408
326
+ gpt_3.5,0.5157894736842106
327
+ llama_7b,0.5151515151515151
328
+ yi_9b_200k,0.5118343195266272
329
+ alphamonarch_7b,0.5118343195266272
330
+ neuralllama3_8b_orpo_v0.3,0.5088757396449705
331
+ magpie_8b_align_v0.1,0.5084745762711864
332
+ gpt_3.5_text_davinci_003,0.5070422535211268
333
+ decilm_7b_instruct,0.5059171597633136
334
+ claude_2.0,0.5028169014084507
335
+ expo_+_tulu_2_dpo_13b,0.5
336
+ wizardlm_70b,0.5
337
+ internlm2.5_20b_chat,0.5
338
+ mistral7b_pairrm_sppo_iter2,0.5
339
+ redpajama_incite_instruct_7b,0.5
340
+ llama3_8b_magpie_align_v0.3,0.4970414201183432
341
+ pairrm_0.4b+tulu_2+dpo_13b_best_of_16,0.49473684210526314
342
+ solar_10.7b_v1.0,0.4940828402366864
343
+ merlinite_7b,0.4911242603550296
344
+ claude_2.1,0.48860472778189606
345
+ einstein_v4_7b,0.4881656804733728
346
+ j1_jumbo_v1_178b,0.48484848484848486
347
+ conifer_7b_dpo,0.4842105263157895
348
+ dictalm2.0_instruct,0.4822485207100592
349
+ yi_1.5_6b,0.47928994082840237
350
+ evo_7b,0.4789473684210526
351
+ gemini_1.0_pro_002,0.4788732394366197
352
+ mistral_7b_v0.3,0.4786515104328869
353
+ glm_4_9b_chat,0.47836972835257335
354
+ phi_3_medium_128k_instruct,0.4782608695652174
355
+ llama3_8b_magpie_align_v0.1,0.47633136094674555
356
+ snorkel_mistral_pairrm_dpo,0.4758771929824561
357
+ claude_3_haiku_20240307,0.47490644349186906
358
+ llama3_inst_8b_simpo,0.4745762711864407
359
+ mistral7b_pairrm_sppo_iter3,0.47337278106508873
360
+ stablelm_2_12b_chat,0.47041420118343197
361
+ glm_130b,0.4696969696969697
362
+ humpback_llama2_70b,0.46842105263157896
363
+ aya_23_8b,0.46745562130177515
364
+ mistral_next,0.4666666666666667
365
+ llama3_neuralhercules_5.0_8b,0.46449704142011833
366
+ deita_7b_v1.0,0.4631578947368421
367
+ zephyr_7b_gemma_v0.1,0.46153846153846156
368
+ josiev4o_8b_stage1_v4,0.45857988165680474
369
+ openhermes_2.5_mistral_7b,0.45808701068338453
370
+ jinachat,0.45789473684210524
371
+ jurassic_2_grande_17b,0.45785317968416556
372
+ llama3_8b_instruct,0.45427998888105275
373
+ tempnet_llama2_chat_70b_v0.1,0.45263157894736844
374
+ dbrx_instruct,0.4508028545941124
375
+ go_bruins_v2,0.44970414201183434
376
+ llama_2_13b,0.44800618906794415
377
+ causallm_14b,0.4473684210526316
378
+ ennoai_pro_french_llama3_8b_v0.4,0.4437869822485207
379
+ pairrm_0.4b+zephyr_7b_beta_best_of_16,0.4421052631578947
380
+ mistral_7b_v0.2,0.44180940516972905
381
+ llama_pro_8b_instruct,0.4408284023668639
382
+ llama3_inst_8b_simpo_v0.2,0.4406779661016949
383
+ opt_66b,0.4393939393939394
384
+ mistral_nemo_base_2407,0.4378698224852071
385
+ phi_3_mini_128k_instruct,0.435111339793614
386
+ falcon_mamba_7b,0.4349112426035503
387
+ deepseek_coder_v2_lite_instruct,0.43478260869565216
388
+ dbrx_instructruct_preview,0.43333333333333335
389
+ decilm_7b,0.4319526627218935
390
+ orpollama3_8b,0.4289940828402367
391
+ qwen1.5_moe_a2.7b_chat,0.4260355029585799
392
+ bloom_176b,0.42424242424242425
393
+ llama3_inst_8b_simpo_expo,0.423728813559322
394
+ deepseek_llm_7b_chat,0.4230769230769231
395
+ phi_3_small_8k_instruct,0.42282608695652174
396
+ llama2_chat_70b,0.42105263157894735
397
+ mistral_orpo_beta,0.42105263157894735
398
+ k2,0.42011834319526625
399
+ mistral_7b_v0.1,0.4171597633136095
400
+ internlm2_20b_chat,0.4166666666666667
401
+ mistral_7b_v0.1_signtensors_1_over_2,0.41420118343195267
402
+ phi_2_instruct_v0.1,0.41124260355029585
403
+ openchat_v3.1_13b,0.4105263157894737
404
+ wizardlm_13b_v1.2,0.4105263157894737
405
+ gemma_7b,0.4094299524960413
406
+ j1_grande_v1_17b,0.4090909090909091
407
+ mistral_small_2402,0.4089610124515207
408
+ mistral_nemo_2402,0.4084507042253521
409
+ windyflollm,0.40828402366863903
410
+ selm_llama3_8b_inst_iter3,0.4067796610169492
411
+ open_mistral_nemo,0.4057971014492754
412
+ ultralm_13b_v2.0_best_of_16,0.4052631578947368
413
+ llama3_8b,0.404346195516293
414
+ falcon_40b,0.40117105718405827
415
+ internlm2_chat_20b,0.4
416
+ expo_+_zephyr_7b_beta,0.4
417
+ mistral_7b_v0.1_signtensors_7_over_16,0.3994082840236686
418
+ gpt_3.5_turbo_0125,0.39619258167526406
419
+ wizardlm_13b_v1.1,0.39473684210526316
420
+ mixtral_8x7b_instruct_v0.1,0.3943864275430021
421
+ arctic_instruct,0.39436619718309857
422
+ dclm_7b,0.39349112426035504
423
+ starling_lm_7b_alpha,0.3928821066472888
424
+ expo_+_zephyr_7b_alpha,0.3894736842105263
425
+ stablelm_2_12b,0.3875739644970414
426
+ hebrew_gemma_11b_instruct,0.38461538461538464
427
+ dolphin_2.2.1_mistral_7b,0.37894736842105264
428
+ falcon_11b,0.378698224852071
429
+ llama3.1_8b,0.378698224852071
430
+ llama3.1_8b_instruct_turbo,0.37681159420289856
431
+ mistral_7b_v0.1_signtensors_3_over_8,0.3757396449704142
432
+ humpback_llama_65b,0.3736842105263158
433
+ phi_3_medium_128k,0.3728813559322034
434
+ flan_flan-ul2,0.3698224852071006
435
+ openbudddy_llama2_70b_v10.1,0.3684210526315789
436
+ gpt_3.5_text_davinci_002,0.36619718309859156
437
+ recurrentgemma_9b,0.363905325443787
438
+ redpajama_incite_base_7b,0.36363636363636365
439
+ openbuddy_llama_65b_v8,0.3631578947368421
440
+ luminous_supreme_70b,0.36096884336320956
441
+ flan_t5_xxl,0.3609467455621302
442
+ qwen_14b_chat,0.35789473684210527
443
+ hermes_2_theta_llama3_8b,0.3559322033898305
444
+ ende_chat_0.0.7,0.35502958579881655
445
+ yi_1.5_6b_chat,0.35277832028672623
446
+ zephyr_7b_beta,0.35192176049419494
447
+ cohere_large_v20220720_13.1b,0.3484848484848485
448
+ gpt_4_adversarial,0.3473684210526316
449
+ cut_13b,0.3473684210526316
450
+ mistral_7b_instruct_v0.1,0.34615384615384615
451
+ starcoder2_15b,0.3431952662721893
452
+ openchat_v2_w_13b,0.34210526315789475
453
+ qwen1.5_moe_a2.7b,0.34023668639053256
454
+ starling_lm_7b_beta_expo,0.3389830508474576
455
+ hare1.0_beta,0.33727810650887574
456
+ zephyr_7b_alpha,0.3339531832754857
457
+ redpajama_incite_instruct_v1_3b,0.3333333333333333
458
+ expo_+_tulu_2_dpo_7b,0.33157894736842103
459
+ vicuna_13b_v1.5_together,0.33157894736842103
460
+ qwen1.5_7b,0.32900658388199017
461
+ lion_gemma_2b_sft_v1.0,0.32840236686390534
462
+ stablelm_zephyr_3b,0.32840236686390534
463
+ tulu_2+dpo_13b,0.3263157894736842
464
+ nxcode_cq_7b_orpo,0.3254437869822485
465
+ command,0.323943661971831
466
+ autotrain_llama3_orpo_v2,0.3224852071005917
467
+ selm_zephyr_7b_iter3,0.3220338983050847
468
+ ennoai_pro_llama3_8b,0.31952662721893493
469
+ text_curie_001,0.3181818181818182
470
+ mistral_7b_v0.1_signtensors_5_over_16,0.3165680473372781
471
+ claude2_alpaca_13b,0.3157894736842105
472
+ minotaur_13b,0.3157894736842105
473
+ internlm2_5_1_8b_chat,0.3136094674556213
474
+ mistral_v0.3_7b_orpo,0.3106508875739645
475
+ airoboros_65b,0.3105263157894737
476
+ yi_6b_200k,0.3076923076923077
477
+ llama_2_7b,0.30711229302778603
478
+ cohere_command,0.30526315789473685
479
+ reka_flash,0.3050847457627119
480
+ flan_t5_xl,0.3047337278106509
481
+ openbuddy_zero_3b_v21.2_32k,0.30177514792899407
482
+ lion_gemma_2b_dpo_v1.0,0.2988165680473373
483
+ llama3.1_instruct_turbo_8b,0.29577464788732394
484
+ xwinlm_7b_v0.1,0.29473684210526313
485
+ vicuna_13b_v1.3,0.29473684210526313
486
+ h2o_danube3_4b_chat,0.29289940828402367
487
+ lion_gemma_2b_odpo_v1.0,0.29289940828402367
488
+ airoboros_33b,0.2894736842105263
489
+ mistral_7b_instruct_v0.2,0.2888078325695241
490
+ gemma_2_2b_it,0.288135593220339
491
+ qwen1.5_4b,0.2869822485207101
492
+ llama_2_13b_chat,0.28402366863905326
493
+ vicuna_33b_v1.3,0.2833333333333333
494
+ vicuna_13b_v1.5,0.2789473684210526
495
+ platolm_7b,0.2789473684210526
496
+ yi_6b,0.2779398283190266
497
+ mathstral_7b_v0.1,0.2753623188405797
498
+ hare_1.1b_base_0.5v,0.27514792899408286
499
+ cohere_medium_v20221108_6.1b,0.2727272727272727
500
+ olmo_7b_instruct,0.27218934911242604
501
+ internlm2_chat_1_8b,0.2692307692307692
502
+ gemma_1.1_7b_it,0.2686190435354315
503
+ gemma_instruct_7b,0.26842105263157895
504
+ openchat_v2_13b,0.26842105263157895
505
+ mistral_7b_instruct_v0.3,0.2646714118286025
506
+ qwen2_1.5b,0.26331360946745563
507
+ deepseek_moe_16b_chat,0.2603550295857988
508
+ openbuddy_llama30b_v7.1,0.2578947368421053
509
+ redpajama_incite_base_v1_3b,0.25757575757575757
510
+ gemma_2_2b,0.257396449704142
511
+ flan_t5_large,0.25443786982248523
512
+ jamba_instruct,0.2535211267605634
513
+ command_r,0.25324162489058644
514
+ gpt_3.5_turbo_1106,0.25
515
+ stablelm_2_zephyr_1_6b,0.2485207100591716
516
+ luminous_extended_30b,0.24839948783610755
517
+ llama33b_oasst_sft,0.24736842105263157
518
+ ultralm_13b_best_of_16,0.24736842105263157
519
+ qwen1.5_1.8b,0.2455621301775148
520
+ jamba_v0.1,0.24260355029585798
521
+ tnlg_v2_6.7b,0.24242424242424243
522
+ wizardlm_13b,0.24210526315789474
523
+ alpaca_7b,0.24170653907496012
524
+ qwen1.5_7b_chat,0.23952847697682547
525
+ neo_7b_instruct_expo,0.23728813559322035
526
+ nous_hermes_13b,0.23684210526315788
527
+ btlm_7b_base_v0.2,0.23668639053254437
528
+ matter_0.2_7b_dpo,0.23372781065088757
529
+ starling_lm_7b_beta,0.23188405797101447
530
+ mistral_7b_v0.1_signtensors_1_over_4,0.22781065088757396
531
+ j1_large_v1_7.5b,0.22727272727272727
532
+ mistral_medium_2312,0.22535211267605634
533
+ stablelm_2_1_6b_chat,0.22485207100591717
534
+ qwen2_1.5b_instruct,0.2242517794357259
535
+ internlm2_1_8b,0.22189349112426035
536
+ tulu_2+dpo_7b,0.22105263157894736
537
+ vicuna_13b,0.22105263157894736
538
+ openbudddy_llama2_13b_v11.1,0.22105263157894736
539
+ yi_6b_chat,0.21996398250578852
540
+ starcoder2_7b,0.21893491124260356
541
+ gemini_1.0_pro,0.21666666666666667
542
+ deepseek_llm_7b_base,0.21597633136094674
543
+ ultralm_13b_v2.0,0.21578947368421053
544
+ gpt_neox_20b,0.21512461897077284
545
+ recurrentgemma_2b_it,0.21301775147928995
546
+ granite_7b_base,0.20710059171597633
547
+ davinci001,0.20526315789473684
548
+ openbuddy_falcon_40b_v9,0.20526315789473684
549
+ fox_1_1.6b,0.20414201183431951
550
+ starlinglm_7b_beta,0.2033898305084746
551
+ neo_7b_instruct,0.2033898305084746
552
+ deepseek_moe_16b_base,0.20118343195266272
553
+ qwen1.5_4b_chat,0.20043306748992368
554
+ snowflake_arctic_instruct,0.2
555
+ openchat_13b,0.2
556
+ gemma_2b,0.19822485207100593
557
+ phi_2,0.1970183187780268
558
+ stablelm_3b_4e1t,0.1952662721893491
559
+ tempnet_llama2_chat_13b_v0.1,0.19473684210526315
560
+ llama2_chat_13b,0.18947368421052632
561
+ gemma_2b_orpo,0.1893491124260355
562
+ gpt_j_6b,0.18742155280616818
563
+ guanaco_65b,0.18421052631578946
564
+ phi_1_5,0.1834319526627219
565
+ qwen2_0.5b,0.1834319526627219
566
+ curie_6.7b,0.18181818181818182
567
+ codegemma_1.1_2b,0.1804733727810651
568
+ opencoderplus_15b,0.17894736842105263
569
+ recurrentgemma_2b,0.17751479289940827
570
+ dolly_v1_6b,0.17455621301775148
571
+ llama33b_oasst_rlhf,0.1736842105263158
572
+ llama_2_70b_chat,0.17239717402690025
573
+ smollm_135m,0.17159763313609466
574
+ mixtral_8x7b_instruct,0.1694915254237288
575
+ openchat8192_13b,0.16842105263157894
576
+ falcon_40b_instruct,0.1673466209903457
577
+ falcon_instruct_7b,0.16666666666666666
578
+ phi_1_5_instruct_v0.1,0.16568047337278108
579
+ phi_2_dpo,0.1631578947368421
580
+ deepseek_v2_lite_chat,0.15942028985507245
581
+ pythia_12b,0.15913573605881298
582
+ minichat_1.5_3b,0.15789473684210525
583
+ gpt2,0.15680473372781065
584
+ starcoder2_3b,0.15680473372781065
585
+ olmo_1b,0.15384615384615385
586
+ falcon_7b,0.1522980450391068
587
+ cohere_medium_v20220720_6.1b,0.15151515151515152
588
+ smol_llama_220m_gqa,0.15088757396449703
589
+ gpt_neo_2.7b,0.14497041420118342
590
+ luminous_base_13b,0.14393939393939395
591
+ tulu_2_dpo_70b,0.14279661016949152
592
+ recycled_wizardlm_7b_v2.0,0.14210526315789473
593
+ llama2_chat_7b_evol70k_neft,0.14210526315789473
594
+ sheared_llama_2.7b,0.14201183431952663
595
+ gemma_7b_it,0.13967338615317756
596
+ flan_t5_base,0.1390532544378698
597
+ vicuna_7b_v1.3,0.1368421052631579
598
+ text_babbage_001,0.13636363636363635
599
+ opt_30b,0.13609467455621302
600
+ smollm_360m,0.13313609467455623
601
+ flan_t5_small,0.1301775147928994
602
+ vicuna_7b_v1.5,0.12704042715484365
603
+ mistral_instruct_v0.3_7b,0.1267605633802817
604
+ ultralm_13b,0.12631578947368421
605
+ alpaca_farm_ppo_sim_gpt_4_7b,0.12631578947368421
606
+ mpt_7b,0.1242603550295858
607
+ t0pp_11b,0.12121212121212122
608
+ baize_v2_13b,0.12105263157894737
609
+ reka_edge,0.11864406779661017
610
+ mistral_7b_instruct,0.11666666666666667
611
+ vicuna_7b_v1.5_16k,0.11594202898550725
612
+ gpt2_medium,0.11538461538461539
613
+ gemma_1.1_2b_it,0.1133629191321499
614
+ pythia_160m,0.11242603550295859
615
+ pythia_6.9b,0.11220190066343913
616
+ recycled_wizardlm_7b_v1.0,0.11052631578947368
617
+ ghost_7b_alpha,0.11052631578947368
618
+ phi_1,0.10650887573964497
619
+ alpaca_farm_ppo_human_7b,0.10526315789473684
620
+ internlm2_chat_7b,0.10526315789473684
621
+ sheared_llama_1.3b,0.10355029585798817
622
+ gpt2_large,0.10059171597633136
623
+ vicuna_7b,0.1
624
+ redpajama_incite_7b_base,0.09763313609467456
625
+ gemma_2b_it,0.09615384615384616
626
+ pythia_2.8b,0.09467455621301775
627
+ llama_2_7b_chat,0.09294228625332304
628
+ olmo_7b,0.0913617801483457
629
+ flan-ul2_20b,0.09090909090909091
630
+ phi_2_sft,0.08947368421052632
631
+ redpajama_incite_base_3b_v1,0.08875739644970414
632
+ smollm_1.7b,0.08875739644970414
633
+ qwen2_0.5b_instruct,0.08845725066460852
634
+ qwen1.5_1.8b_chat,0.08646696064404215
635
+ gpt_neo_1.3b,0.08579881656804733
636
+ dialogpt_medium,0.07988165680473373
637
+ opt_1.3b,0.07988165680473373
638
+ stablelm_2_1_6b,0.07692307692307693
639
+ t5_11b,0.07575757575757576
640
+ tempnet_llama2_chat_7b_v0.1,0.07368421052631578
641
+ minichat_3b,0.07368421052631578
642
+ guanaco_33b,0.07368421052631578
643
+ smollm_1.7b_instruct,0.07100591715976332
644
+ qwen1.5_0.5b,0.07100591715976332
645
+ pythia_410m,0.06804733727810651
646
+ babbage_1.3b,0.06060606060606061
647
+ gpt2_xl,0.05917159763313609
648
+ llama2_chat_7b,0.05789473684210526
649
+ gemma_instruct_2b,0.05789473684210526
650
+ command_light,0.056338028169014086
651
+ tinyllama_v1.1,0.05621301775147929
652
+ qwen1.5_0.5b_chat,0.05473372781065089
653
+ gpt_sw3_40b,0.05325443786982249
654
+ openbuddy_falcon_7b_v6,0.05263157894736842
655
+ hermes_2_mixtral_8x7b_dpo,0.05084745762711865
656
+ helpingai_15b,0.05029585798816568
657
+ tinyyi_7b_test,0.047337278106508875
658
+ cohere_small_v20220720_410m,0.045454545454545456
659
+ gpt_neo_125m,0.04437869822485207
660
+ falcon_7b_instruct,0.04422298349423855
661
+ bloom_3b,0.04142011834319527
662
+ smollm_135m_instruct,0.038461538461538464
663
+ chatglm2_6b,0.03684210526315789
664
+ baize_v2_7b,0.03684210526315789
665
+ llama_160m_chat_v1,0.03550295857988166
666
+ phi_3_mini_128k,0.03389830508474576
667
+ rhea_72b_v0.5,0.03254437869822485
668
+ pythia_12b_sft,0.031578947368421054
669
+ ada_350m,0.030303030303030304
670
+ bloom_1b7,0.029585798816568046
671
+ bloom_1b1,0.026627218934911243
672
+ smol_llama_101m_gqa,0.023668639053254437
673
+ pythia_12b_oasst_sft,0.021052631578947368
674
+ distilgpt2,0.020710059171597635
675
+ minueza_32m_ultrachat,0.01775147928994083
676
+ guanaco_13b,0.015789473684210527
677
+ text_ada_001,0.015151515151515152
678
+ pythia_410m_roberta_lr_8e7_kl_01_steps_12000_rlhf_model,0.014792899408284023
679
+ bloom_7b1,0.011834319526627219
680
+ guanaco_7b,0.010526315789473684
681
+ bloom_560m,0.008875739644970414
682
+ instructlm_500m,0.005917159763313609
683
+ hare_1.1b_base,0.0029585798816568047
684
+ yalm_100b,0.0
685
+ nucleus_22b_token_500b,0.0
686
+ baichuan_13b_chat,0.0
cache/aggregate_scoress_cache_7b814a45375ad6b75add8b396f69c2cd.csv DELETED
@@ -1,72 +0,0 @@
1
- model,score
2
- gpt_4o_2024_05_13,0.9950869236583522
3
- gpt_4_turbo_2024_04_09,0.9639153609872332
4
- gpt_4_0125_preview,0.9393939393939394
5
- claude_3_opus_20240229,0.9220898724004315
6
- yi_large_preview,0.8845096932053453
7
- llama3.1_70b_instruct,0.8832459207459207
8
- qwen2_72b_instruct,0.8719243719243719
9
- gpt_4_0613,0.8648074952422778
10
- gemma_2_27b_it,0.8510517260517261
11
- llama3_70b_instruct,0.849670938694048
12
- mistral_large,0.8470006184291898
13
- yi_1.5_34b_chat,0.7714889277389277
14
- llama3_70b,0.7611156781553201
15
- claude_3_sonnet_20240229,0.7541101640480523
16
- mixtral_8x22b_instruct_v0.1,0.7425976800976801
17
- qwen1.5_110b_chat,0.7320934784170079
18
- mistral_medium,0.7056277056277057
19
- phi_3_medium_4k_instruct,0.696301247771836
20
- qwen1.5_32b_chat,0.6812609659248315
21
- claude_3_haiku_20240307,0.6757563807253248
22
- mistral_large_2402,0.6705753184014054
23
- qwen1.5_72b,0.6692868451728518
24
- qwen1.5_72b_chat,0.6604933136636727
25
- command_r_plus,0.6508289415898112
26
- yi_34b,0.6270777876367939
27
- phi_3_mini_4k_instruct,0.6218470721621983
28
- gemma_2_9b_it,0.6216006216006217
29
- qwen1.5_32b,0.6175551742436105
30
- llama_2_70b,0.585811187829169
31
- gpt_3.5_turbo_0125,0.5795841063698206
32
- yi_34b_chat,0.5793988997113997
33
- gemini_1.0_pro,0.5205318491032778
34
- gpt_3.5_turbo_0613,0.5196837944664031
35
- llama3_8b_instruct,0.5166348882210227
36
- yi_1.5_9b_chat,0.5150335775335776
37
- qwen2_7b_instruct,0.4803418803418803
38
- phi_3_mini_128k_instruct,0.47774531890678346
39
- mixtral_8x7b_instruct_v0.1,0.47245816635618004
40
- starling_lm_7b_beta,0.46037960638800973
41
- qwen1.5_14b_chat,0.45760855624301
42
- tulu_2_dpo_70b,0.44326821637746006
43
- llama3.1_8b_instruct,0.4429972804972805
44
- command_r,0.42476786498525626
45
- openhermes_2.5_mistral_7b,0.4133219954648526
46
- mistral_7b_instruct_v0.2,0.38528271156947624
47
- yi_1.5_6b_chat,0.3616155902920609
48
- llama_2_70b_chat,0.3429423284465301
49
- starling_lm_7b_alpha,0.3192125334982478
50
- llama3_8b,0.3191327255539897
51
- gemma_1.1_7b_it,0.3093664233370116
52
- zephyr_7b_beta,0.3012633624878523
53
- qwen1.5_7b,0.29290520556048505
54
- gemma_7b,0.29047416067876425
55
- vicuna_33b_v1.3,0.28480038480038483
56
- qwen1.5_7b_chat,0.27333417049803604
57
- llama_2_13b,0.2660179289106947
58
- mistral_7b_instruct_v0.3,0.21805555555555559
59
- yi_6b_chat,0.20091647770219198
60
- yi_6b,0.19687349577512162
61
- qwen1.5_4b,0.16834733893557421
62
- vicuna_7b_v1.5,0.14973544973544975
63
- gemma_7b_it,0.14039115646258504
64
- qwen1.5_4b_chat,0.14036924293526934
65
- phi_2,0.1326664119754182
66
- llama_2_7b_chat,0.11841995751468631
67
- gemma_1.1_2b_it,0.09431689342403628
68
- llama_2_7b,0.06859327581964463
69
- qwen1.5_1.8b_chat,0.06363517629273932
70
- gemma_2b,0.05727290916366547
71
- olmo_7b,0.011775543550753635
72
- qwen1.5_0.5b_chat,0.008163265306122448
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/aggregate_scoress_cache_9c0710fd06d230cc89e0f2f023e3058f.csv ADDED
@@ -0,0 +1,146 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,score
2
+ arx_0.3,1.0
3
+ claude_3.5_sonnet,0.9876543209876543
4
+ gpt_4o_2024_05_13,0.9814814814814814
5
+ grok_2,0.9753086419753086
6
+ gpt_4_0613,0.971830985915493
7
+ claude_3.5_sonnet_20240620,0.971830985915493
8
+ gpt_4_turbo_2024_04_09,0.9577464788732394
9
+ grok_2_mini,0.9506172839506173
10
+ llama3.1_instruct_turbo_405b,0.9436619718309859
11
+ gemini_1.5_pro,0.9382716049382716
12
+ llama3.1_instruct_turbo_70b,0.9295774647887324
13
+ claude_3_opus,0.9259259259259259
14
+ qwen2_72b_chat,0.9135802469135802
15
+ qwen2_instruct_72b,0.9014084507042254
16
+ magnum_72b_v1,0.9012345679012346
17
+ gpt_4_turbo,0.8888888888888888
18
+ mistral_large_2_2407,0.8873239436619719
19
+ deepseek_coder_v2_instruct,0.8765432098765432
20
+ gemini_1.5_pro_001,0.8732394366197183
21
+ higgs_llama3_70b,0.8641975308641975
22
+ gpt_4o_mini_2024_07_18,0.8591549295774648
23
+ gpt_4o_mini,0.8518518518518519
24
+ mixtral_8x22b,0.8450704225352113
25
+ llama3.1_70b_instruct,0.8395061728395061
26
+ gpt_4_turbo_1106_preview,0.8309859154929577
27
+ llama3_70b,0.8281168492436097
28
+ gemini_1.5_flash,0.8271604938271605
29
+ palmyra_x_v3_72b,0.8169014084507042
30
+ yi_large,0.8148148148148148
31
+ gemma_2_instruct_27b,0.8028169014084507
32
+ claude_3_sonnet,0.8024691358024691
33
+ llama3_70b_instruct,0.7901234567901234
34
+ gemini_1.5_flash_001,0.7887323943661971
35
+ phi3_medium_4k,0.7777777777777778
36
+ claude_3_opus_20240229,0.7746478873239436
37
+ qwen2_72b_32k,0.7654320987654321
38
+ palm_2_unicorn,0.7605633802816901
39
+ deepseek_v2_chat,0.7530864197530864
40
+ qwen1.5_72b,0.7464788732394366
41
+ palmyra_x_v2_33b,0.7323943661971831
42
+ qwen1.5_72b_chat,0.7283950617283951
43
+ gemma_2_instruct_9b,0.7183098591549296
44
+ llama3.1_70b,0.7160493827160493
45
+ yi_1.5_34b_chat,0.7037037037037037
46
+ gemma_2_9b_it,0.691358024691358
47
+ qwen1.5_chat_110b,0.6901408450704225
48
+ phi3_medium_128k,0.6790123456790124
49
+ qwen1.5_32b,0.676056338028169
50
+ mammoth2_8x7b_plus,0.6666666666666666
51
+ claude_v1.3,0.6619718309859155
52
+ qwen1.5_110b,0.654320987654321
53
+ palm_2_bison,0.647887323943662
54
+ glm_4_9b_chat,0.6419753086419753
55
+ mixtral_8x7b_32k_seqlen,0.6338028169014085
56
+ glm_4_9b,0.6296296296296297
57
+ phi_3_14b,0.6197183098591549
58
+ phi_3.5_mini_instruct,0.6172839506172839
59
+ claude_2.0,0.6056338028169014
60
+ qwen2_7b_instruct,0.6049382716049383
61
+ yi_34b,0.5990262563032516
62
+ yi_1.5_9b_chat,0.5925925925925926
63
+ deepseek_llm_chat_67b,0.5915492957746479
64
+ phi3_mini_4k,0.5802469135802469
65
+ phi_3_7b,0.5774647887323944
66
+ gemma_2_9b,0.5679012345679012
67
+ mistral_nemo_instruct_2407,0.5555555555555556
68
+ yi_large_preview,0.5492957746478874
69
+ llama3.1_8b_instruct,0.5432098765432098
70
+ command_r_plus,0.5352112676056338
71
+ phi3_mini_128k,0.5308641975308642
72
+ mammoth2_8b_plus,0.5185185185185185
73
+ gpt_3.5_text_davinci_003,0.5070422535211268
74
+ claude_2.1,0.5070422535211268
75
+ mixtral_8x7b_instruct_v0.1,0.5061728395061729
76
+ qwen1.5_14b,0.49295774647887325
77
+ mathstral_7b_v0.1,0.48148148148148145
78
+ gemini_1.0_pro_002,0.4788732394366197
79
+ deepseek_coder_v2_lite_instruct,0.4691358024691358
80
+ claude_instant_1.2,0.4647887323943662
81
+ mixtral_8x7b_v0.1,0.4567901234567901
82
+ llama_2_70b,0.4483568075117371
83
+ llama3_8b_instruct,0.4444444444444444
84
+ mammoth2_7b_plus,0.43209876543209874
85
+ gpt_3.5_turbo_0613,0.4225352112676056
86
+ claude_3_sonnet_20240229,0.4225352112676056
87
+ qwen2_7b,0.41975308641975306
88
+ mistral_nemo_2402,0.4084507042253521
89
+ mistral_nemo_base_2407,0.4074074074074074
90
+ wizardlm_2_8x22b,0.3950617283950617
91
+ arctic_instruct,0.39436619718309857
92
+ yi_1.5_6b_chat,0.38271604938271603
93
+ qwen1.5_14b_chat,0.37037037037037035
94
+ gpt_3.5_text_davinci_002,0.36619718309859156
95
+ llama3_8b,0.3611545818118588
96
+ llama_65b,0.352112676056338
97
+ c4ai_command_r_v01,0.345679012345679
98
+ staring_7b,0.345679012345679
99
+ mistral_large_2402,0.3380281690140845
100
+ command,0.323943661971831
101
+ openchat_3.5_8b,0.32098765432098764
102
+ command_r,0.30985915492957744
103
+ internmath_20b_plus,0.30864197530864196
104
+ gemma_7b,0.3003825421665797
105
+ llama3_smaug_8b,0.2962962962962963
106
+ llama3.1_instruct_turbo_8b,0.29577464788732394
107
+ llama3.1_8b,0.2839506172839506
108
+ mistral_small_2402,0.28169014084507044
109
+ dbrx_instructruct,0.2676056338028169
110
+ deepseekmath_7b_instruct,0.25925925925925924
111
+ jamba_instruct,0.2535211267605634
112
+ deepseek_coder_v2_lite_base,0.24691358024691357
113
+ mistral_v0.1_7b,0.23943661971830985
114
+ mistral_medium_2312,0.22535211267605634
115
+ internmath_7b_plus,0.2222222222222222
116
+ qwen1.5_7b,0.2112676056338028
117
+ zephyr_7b_beta,0.20987654320987653
118
+ mistral_7b_v0.1,0.19753086419753085
119
+ claude_3_haiku_20240307,0.19718309859154928
120
+ mistral_7b_instruct_v0.2,0.18518518518518517
121
+ mistral_7b_v0.2,0.1728395061728395
122
+ qwen1.5_7b_chat,0.16049382716049382
123
+ jurassic_2_jumbo_178b,0.15492957746478872
124
+ yi_6b,0.15327769083637627
125
+ yi_6b_chat,0.14814814814814814
126
+ falcon_40b,0.14084507042253522
127
+ neo_7b_instruct,0.13580246913580246
128
+ llama_2_13b,0.127716918796731
129
+ mistral_instruct_v0.3_7b,0.1267605633802817
130
+ jurassic_2_grande_17b,0.11267605633802817
131
+ neo_7b,0.1111111111111111
132
+ mistral_7b_instruct_v0.1,0.09876543209876543
133
+ phi_2,0.09859154929577464
134
+ llemma_7b,0.07407407407407407
135
+ luminous_supreme_70b,0.07042253521126761
136
+ qwen2_1.5b_instruct,0.06172839506172839
137
+ llama_2_7b,0.06077203964527908
138
+ command_light,0.056338028169014086
139
+ qwen2_1.5b,0.04938271604938271
140
+ luminous_extended_30b,0.04225352112676056
141
+ falcon_7b,0.028169014084507043
142
+ qwen2_0.5b_instruct,0.024691358024691357
143
+ olmo_7b,0.014084507042253521
144
+ gemma_2b,0.012345679012345678
145
+ luminous_base_13b,0.0
146
+ qwen2_0.5b,0.0
cache/aggregate_scoress_cache_bdd8d629730630ed8e73cb56f53f335b.csv DELETED
@@ -1,72 +0,0 @@
1
- model,score
2
- gpt_4o_2024_05_13,0.9950869236583522
3
- gpt_4_turbo_2024_04_09,0.9639153609872332
4
- gpt_4_0125_preview,0.9393939393939394
5
- claude_3_opus_20240229,0.9220898724004315
6
- yi_large_preview,0.8845096932053453
7
- llama3.1_70b_instruct,0.8832459207459207
8
- qwen2_72b_instruct,0.8719243719243719
9
- gpt_4_0613,0.8648074952422778
10
- gemma_2_27b_it,0.8510517260517261
11
- llama3_70b_instruct,0.849670938694048
12
- mistral_large,0.8470006184291898
13
- yi_1.5_34b_chat,0.7714889277389277
14
- llama3_70b,0.7611156781553201
15
- claude_3_sonnet_20240229,0.7541101640480523
16
- mixtral_8x22b_instruct_v0.1,0.7425976800976801
17
- qwen1.5_110b_chat,0.7320934784170079
18
- mistral_medium,0.7056277056277057
19
- phi_3_medium_4k_instruct,0.696301247771836
20
- qwen1.5_32b_chat,0.6812609659248315
21
- claude_3_haiku_20240307,0.6757563807253248
22
- mistral_large_2402,0.6705753184014054
23
- qwen1.5_72b,0.6692868451728518
24
- qwen1.5_72b_chat,0.6604933136636727
25
- command_r_plus,0.6508289415898112
26
- yi_34b,0.6270777876367939
27
- phi_3_mini_4k_instruct,0.6218470721621983
28
- gemma_2_9b_it,0.6216006216006217
29
- qwen1.5_32b,0.6175551742436105
30
- llama_2_70b,0.585811187829169
31
- gpt_3.5_turbo_0125,0.5795841063698206
32
- yi_34b_chat,0.5793988997113997
33
- gemini_1.0_pro,0.5205318491032778
34
- gpt_3.5_turbo_0613,0.5196837944664031
35
- llama3_8b_instruct,0.5166348882210227
36
- yi_1.5_9b_chat,0.5150335775335776
37
- qwen2_7b_instruct,0.4803418803418803
38
- phi_3_mini_128k_instruct,0.47774531890678346
39
- mixtral_8x7b_instruct_v0.1,0.47245816635618004
40
- starling_lm_7b_beta,0.46037960638800973
41
- qwen1.5_14b_chat,0.45760855624301
42
- tulu_2_dpo_70b,0.44326821637746006
43
- llama3.1_8b_instruct,0.4429972804972805
44
- command_r,0.42476786498525626
45
- openhermes_2.5_mistral_7b,0.4133219954648526
46
- mistral_7b_instruct_v0.2,0.38528271156947624
47
- yi_1.5_6b_chat,0.3616155902920609
48
- llama_2_70b_chat,0.3429423284465301
49
- starling_lm_7b_alpha,0.3192125334982478
50
- llama3_8b,0.3191327255539897
51
- gemma_1.1_7b_it,0.3093664233370116
52
- zephyr_7b_beta,0.3012633624878523
53
- qwen1.5_7b,0.29290520556048505
54
- gemma_7b,0.29047416067876425
55
- vicuna_33b_v1.3,0.28480038480038483
56
- qwen1.5_7b_chat,0.27333417049803604
57
- llama_2_13b,0.2660179289106947
58
- mistral_7b_instruct_v0.3,0.21805555555555559
59
- yi_6b_chat,0.20091647770219198
60
- yi_6b,0.19687349577512162
61
- qwen1.5_4b,0.16834733893557421
62
- vicuna_7b_v1.5,0.14973544973544975
63
- gemma_7b_it,0.14039115646258504
64
- qwen1.5_4b_chat,0.14036924293526934
65
- phi_2,0.1326664119754182
66
- llama_2_7b_chat,0.11841995751468631
67
- gemma_1.1_2b_it,0.09431689342403628
68
- llama_2_7b,0.06859327581964463
69
- qwen1.5_1.8b_chat,0.06363517629273932
70
- gemma_2b,0.05727290916366547
71
- olmo_7b,0.011775543550753635
72
- qwen1.5_0.5b_chat,0.008163265306122448
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/aggregate_scoress_cache_bffcfd24eb4a8fe1f6c8ac8a0c8c21d6.csv ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,score
2
+ gpt_4o_2024_05_13,1.0
3
+ gpt_4_0613,0.971830985915493
4
+ claude_3.5_sonnet_20240620,0.971830985915493
5
+ gpt_4_turbo_2024_04_09,0.9577464788732394
6
+ llama3.1_instruct_turbo_405b,0.9436619718309859
7
+ llama3.1_instruct_turbo_70b,0.9295774647887324
8
+ llama3_70b,0.9154929577464789
9
+ qwen2_instruct_72b,0.9014084507042254
10
+ mistral_large_2_2407,0.8873239436619719
11
+ gemini_1.5_pro_001,0.8732394366197183
12
+ gpt_4o_mini_2024_07_18,0.8591549295774648
13
+ mixtral_8x22b,0.8450704225352113
14
+ gpt_4_turbo_1106_preview,0.8309859154929577
15
+ palmyra_x_v3_72b,0.8169014084507042
16
+ gemma_2_instruct_27b,0.8028169014084507
17
+ gemini_1.5_flash_001,0.7887323943661971
18
+ claude_3_opus_20240229,0.7746478873239436
19
+ palm_2_unicorn,0.7605633802816901
20
+ qwen1.5_72b,0.7464788732394366
21
+ palmyra_x_v2_33b,0.7323943661971831
22
+ gemma_2_instruct_9b,0.7183098591549296
23
+ yi_34b,0.704225352112676
24
+ qwen1.5_chat_110b,0.6901408450704225
25
+ qwen1.5_32b,0.676056338028169
26
+ claude_v1.3,0.6619718309859155
27
+ palm_2_bison,0.647887323943662
28
+ mixtral_8x7b_32k_seqlen,0.6338028169014085
29
+ phi_3_14b,0.6197183098591549
30
+ claude_2.0,0.6056338028169014
31
+ deepseek_llm_chat_67b,0.5915492957746479
32
+ phi_3_7b,0.5774647887323944
33
+ llama_2_70b,0.5633802816901409
34
+ yi_large_preview,0.5492957746478874
35
+ command_r_plus,0.5352112676056338
36
+ gpt_3.5_text_davinci_003,0.5070422535211268
37
+ claude_2.1,0.5070422535211268
38
+ qwen1.5_14b,0.49295774647887325
39
+ gemini_1.0_pro_002,0.4788732394366197
40
+ claude_instant_1.2,0.4647887323943662
41
+ llama3_8b,0.4507042253521127
42
+ gpt_3.5_turbo_0613,0.4225352112676056
43
+ claude_3_sonnet_20240229,0.4225352112676056
44
+ mistral_nemo_2402,0.4084507042253521
45
+ arctic_instruct,0.39436619718309857
46
+ gpt_3.5_text_davinci_002,0.36619718309859156
47
+ gemma_7b,0.36619718309859156
48
+ llama_65b,0.352112676056338
49
+ mistral_large_2402,0.3380281690140845
50
+ command,0.323943661971831
51
+ command_r,0.30985915492957744
52
+ llama3.1_instruct_turbo_8b,0.29577464788732394
53
+ mistral_small_2402,0.28169014084507044
54
+ dbrx_instructruct,0.2676056338028169
55
+ jamba_instruct,0.2535211267605634
56
+ mistral_v0.1_7b,0.23943661971830985
57
+ mistral_medium_2312,0.22535211267605634
58
+ qwen1.5_7b,0.2112676056338028
59
+ claude_3_haiku_20240307,0.19718309859154928
60
+ yi_6b,0.18309859154929578
61
+ llama_2_13b,0.16901408450704225
62
+ jurassic_2_jumbo_178b,0.15492957746478872
63
+ falcon_40b,0.14084507042253522
64
+ mistral_instruct_v0.3_7b,0.1267605633802817
65
+ jurassic_2_grande_17b,0.11267605633802817
66
+ phi_2,0.09859154929577464
67
+ llama_2_7b,0.08450704225352113
68
+ luminous_supreme_70b,0.07042253521126761
69
+ command_light,0.056338028169014086
70
+ luminous_extended_30b,0.04225352112676056
71
+ falcon_7b,0.028169014084507043
72
+ olmo_7b,0.014084507042253521
73
+ luminous_base_13b,0.0
cache/aggregate_scoress_cache_f97e563eeda8c9bdc279f5b94b32606c.csv ADDED
@@ -0,0 +1,1734 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,score
2
+ llama3_70b_instruct_dpo_v0.4,1.0
3
+ llama3_70b_instruct_dpo_v0.3,0.9994226327944573
4
+ llama3_70b_instruct_dpo_v0.2,0.9988452655889145
5
+ llama3_70b_japanese_suzume_vector_v0.1,0.9982678983833718
6
+ qwen1.5_110b,0.9976905311778291
7
+ llama3_70b_instruct_dpo_v0.1,0.9971131639722863
8
+ autotrain_llama3_70b_orpo_v2,0.9965357967667436
9
+ llama3_70b_instruct,0.995958429561201
10
+ llama3_tenyxchat_70b,0.9953810623556582
11
+ llama3_70b_chinese_chat,0.9948036951501155
12
+ llama3_70b_orpo_v0.1,0.9942263279445728
13
+ llama3_70b,0.99364896073903
14
+ contaminated_proof_7b_v1.0,0.9924942263279446
15
+ contaminated_proof_7b_v1.0_safetensor,0.9924942263279446
16
+ platyi_34b_llama_q,0.9919168591224018
17
+ platyi_34b_lora,0.9913394919168591
18
+ platyi_34b_llama_q_fastchat,0.9907621247113164
19
+ platyi_34b_llama,0.9901847575057737
20
+ multiverse_70b,0.9896073903002309
21
+ platypus_yi_34b,0.9890300230946882
22
+ qwen1.5_110b_chat,0.9884526558891455
23
+ yi_1.5_34b_chat_16k,0.9878752886836027
24
+ phi_3_medium_llamaish,0.9872979214780601
25
+ phi_3_medium_4k_instruct,0.9867205542725174
26
+ mixtral_8x22b_v0.1,0.9861431870669746
27
+ mixtral_8x22b_instruct_v0.1,0.9855658198614319
28
+ platyi_34b_q,0.9849884526558892
29
+ dolphin_2.9.1_yi_1.5_34b,0.9844110854503464
30
+ momo_70b_lora_1.8.5_dpo,0.9838337182448037
31
+ qwen1.5_72b_chat,0.983256351039261
32
+ caplattessdolxaboros_yi_34b_200k_dare_ties_highdensity,0.9826789838337182
33
+ momo_72b_lora_1.8.6_dpo,0.9821016166281755
34
+ qwen_72b,0.9815242494226328
35
+ caplattessdolxaboros_yi_34b_200k_dare_ties_extremedensity,0.98094688221709
36
+ skkuds_dpo_72b_v3,0.9803695150115473
37
+ skkuds_dpo_72b_v1,0.9792147806004619
38
+ momo_72b_lora_1.8.4_dpo,0.9792147806004619
39
+ yi_34b_200k_dare_merge_v5,0.9786374133949192
40
+ qwen2_beta_72b,0.9774826789838337
41
+ qwen1.5_72b,0.9774826789838337
42
+ momo_72b_lora_1.8.7_dpo,0.9763279445727483
43
+ platyi_34b_200k_q_fastchat,0.9763279445727483
44
+ yi_32b_x2_v2.0,0.9757505773672055
45
+ phi_3_medium_128k_instruct,0.9751732101616628
46
+ deita_34b,0.9745958429561201
47
+ faro_yi_34b,0.9728637413394919
48
+ yi_bagel_2x34b_moe,0.9728637413394919
49
+ faro_yi_34b_200k,0.9728637413394919
50
+ platyi_34b_llama_q_v2,0.9722863741339491
51
+ bagel_dpo_34b_v0.2,0.9717090069284064
52
+ metamath_bagel_dpo_34b,0.9711316397228638
53
+ sus_chat_34b,0.9705542725173211
54
+ jallabi_34b,0.9699769053117783
55
+ deacon_34b_qlora_adapter,0.9693995381062356
56
+ llama3_70b_instruct_gradient_524k,0.9688221709006929
57
+ mm_ov_bagel_dpo_34b_c1000_250,0.9682448036951501
58
+ yi_34b_llama,0.9676674364896074
59
+ deacon_34b_adapter,0.9670900692840647
60
+ pivot_sus_rp,0.9665127020785219
61
+ yi_34b_200k_rawrr_dpo_1,0.9653579676674365
62
+ hyperion_2.0_yi_34b,0.9653579676674365
63
+ aquila2_34b,0.9647806004618937
64
+ blossom_v5_34b,0.964203233256351
65
+ hyperion_3.0_yi_34b,0.9636258660508084
66
+ yi_34b_v3,0.9630484988452656
67
+ c4ai_command_r_plus,0.9624711316397229
68
+ pallas_0.2,0.9613163972286374
69
+ yi_34b_v2,0.9613163972286374
70
+ shqiponja_59b_v1,0.9607390300230947
71
+ miqu_1_70b_sf,0.960161662817552
72
+ miqu_70b_alpaca_dpo,0.9595842956120092
73
+ caplattessdolxaboros_yi_34b_200k_dare_ties,0.9590069284064665
74
+ yi_34b_200k_aezakmi_v2,0.9584295612009238
75
+ hercules_4.0_yi_34b,0.957852193995381
76
+ platyi_34b_200k_q,0.9572748267898383
77
+ pallas_0.4,0.9566974595842956
78
+ pallas_0.3,0.9561200923787528
79
+ pallas_0.5,0.9555427251732102
80
+ qwen1.5_32b_chat,0.9549653579676675
81
+ platyi_34b_llama_q_v3,0.9543879907621247
82
+ kiqu_70b,0.953810623556582
83
+ yi_34b_chat,0.9532332563510393
84
+ capybara_tess_yi_34b_200k,0.9520785219399538
85
+ yi_34b_200k_aezakmi_raw_2301,0.9520785219399538
86
+ anfeng_v3_avocet,0.9515011547344111
87
+ cr_model_v1,0.9509237875288684
88
+ dbrx_base,0.9503464203233256
89
+ yi_34b_200k_aezakmi_xlctx_v3,0.9497690531177829
90
+ blossom_v4_yi_34b,0.9491916859122402
91
+ qwen1.5_32b,0.9486143187066974
92
+ blossom_v5_32b,0.9480369515011547
93
+ einstein_v4_qwen_1.5_32b,0.9474595842956121
94
+ deita_32b,0.9468822170900693
95
+ yi_34b_aezakmi_v1,0.9463048498845266
96
+ openbuddy_qwen1.5_32b_v21.1_32k,0.9457274826789839
97
+ dbrx_instructruct,0.9451501154734411
98
+ yi_34b_200k_aezakmi_raw_2901,0.9445727482678984
99
+ qwen_72b_llama,0.9439953810623557
100
+ sg_raccoon_yi_200k_2.0,0.9434180138568129
101
+ openbuddy_qwen1.5_32b_v21.2_32k,0.9428406466512702
102
+ taiwan_llm_8x7b_dpo,0.9422632794457275
103
+ deepseek_llm_67b_chat,0.9416859122401847
104
+ mixtral_ko_qna_merged,0.941108545034642
105
+ mixtral_8x7b_v0.1,0.9405311778290993
106
+ deepseek_llm_67b_base,0.9399538106235565
107
+ mixtral_8x7b_v0.1_dpo,0.9387990762124712
108
+ mixtral_8x7b_v0.1_sft,0.9387990762124712
109
+ master_yi_9b,0.9382217090069284
110
+ notux_8x7b_v1_epoch_2,0.9376443418013857
111
+ notus_8x7b_experiment,0.937066974595843
112
+ mixtral_8x7b_instruct_v0.1,0.9364896073903002
113
+ mixtral_instruct_0.1_laser,0.9359122401847575
114
+ mixtral_8x7b_instruct_v0.1_dpo,0.9353348729792148
115
+ mixtral_8x7b_dpo_v0.2,0.934757505773672
116
+ configurable_yi_1.5_9b_chat,0.9341801385681293
117
+ chinese_mixtral_8x7b,0.9336027713625866
118
+ openbuddy_mixtral_7bx8_v18.1_32k,0.9330254041570438
119
+ average_dolphin_8x7b,0.9324480369515011
120
+ dolphin_2.9.1_yi_1.5_9b,0.9318706697459584
121
+ genz_70b,0.9312933025404158
122
+ faro_yi_9b,0.9295612009237876
123
+ sheep_duck_llama_2_70b_v1.1,0.9295612009237876
124
+ faro_yi_9b_200k,0.9295612009237876
125
+ faro_yi_9b_dpo,0.9289838337182448
126
+ mixtral_8x7b_dpo_v0.1,0.9284064665127021
127
+ yayi2_30b_llama,0.9278290993071594
128
+ solar_0_70b_16bit,0.9266743648960739
129
+ openbuddy_deepseek_67b_v18.1_4k,0.9266743648960739
130
+ melangea_70b,0.9260969976905312
131
+ falcon_180b,0.9255196304849884
132
+ mixtralmerge_8x7b_rebalanced_test,0.9249422632794457
133
+ mixtralrpchat_zloss,0.924364896073903
134
+ openbuddy_deepseek_67b_v15.3_4k,0.9232101616628176
135
+ v_alpha_tross,0.9232101616628176
136
+ melangec_70b,0.9226327944572749
137
+ chinese_mixtral,0.9220554272517321
138
+ mixtralorochi8x7b,0.9214780600461894
139
+ melangeb_70b,0.9209006928406467
140
+ yi_9b_forest_dpo_v1.0,0.9197459584295612
141
+ openbuddy_mixtral_7bx8_v17.1_32k,0.9197459584295612
142
+ openbuddy_mixtral_7bx8_v17.3_32k,0.9185912240184757
143
+ lima_unchained_70b,0.9185912240184757
144
+ momo_70b_lora_v1.2_1,0.918013856812933
145
+ godzilla2_70b,0.9174364896073903
146
+ tulu_2_dpo_70b,0.9168591224018475
147
+ llama_2_70b,0.9157043879907621
148
+ camel_platypus2_70b,0.9157043879907621
149
+ blossom_v5_9b,0.9151270207852193
150
+ airoboros_l2_70b_2.2.1,0.9145496535796767
151
+ openhermes_yi_9b,0.913972286374134
152
+ tulu_2_dpo_70b_expo,0.9133949191685913
153
+ ds_diasum_md_mixtral,0.9128175519630485
154
+ qwen1.5_14b,0.9116628175519631
155
+ qwen2_beta_14b,0.9116628175519631
156
+ chronos007_70b,0.9110854503464203
157
+ phi_3_mini_4k_instruct_v0.3,0.9105080831408776
158
+ dolphin_2.2_70b,0.9099307159353349
159
+ llama_2_wizard_70b_qlora,0.9093533487297921
160
+ daredevil_8b_abliterated_dpomix,0.9087759815242494
161
+ phi_3_mini_4k_instruct,0.9076212471131639
162
+ mixtral_megamerge_dare_8x7b_v2,0.9076212471131639
163
+ phi_3_mini_4k_instruct_v0.1,0.9070438799076213
164
+ wizardmath_70b_v1.0,0.9064665127020786
165
+ phi_3_mini_128k_instruct_linearbunkascore_4.6k_dpo,0.9058891454965358
166
+ llama3_8b_okay,0.9053117782909931
167
+ hercules_qwen1.5_14b,0.9047344110854504
168
+ phi_3_mini_128k_instruct,0.9041570438799076
169
+ phi_3_mini_128k_instruct_humanchoice_4.6k_dpo,0.9035796766743649
170
+ samantha_1.1_70b,0.9030023094688222
171
+ mixtral_8x7b_peft_v0.1,0.9024249422632794
172
+ qwen1.5_14b_chat,0.9018475750577367
173
+ open_llm_leaderboard_demo,0.901270207852194
174
+ blossom_v5_14b,0.9001154734411085
175
+ kingnish_llama3_8b,0.9001154734411085
176
+ quyen_pro_v0.1,0.8995381062355658
177
+ openbuddy_qwen1.5_14b_v21.1_32k,0.898960739030023
178
+ 0.001_llama3_nodpo_3iters_bs128_531lr_iter_1,0.8983833718244804
179
+ 0.0005_llama_nodpo_3iters_bs128_531lr_iter_1,0.8978060046189377
180
+ 0.0_llama_nodpo_3iters_bs128_531lr_iter_1,0.8972286374133949
181
+ llama3_8b_instruct_dpo_v0.3,0.8966512702078522
182
+ llama3_8b_instruct_v0.8,0.8960739030023095
183
+ 0.0005_llama_nodpo_3iters_bs128_531lr_oldtrl_iter_2,0.8954965357967667
184
+ 0.0005_llama_4iters_bs128_5551lr_iter_1,0.894919168591224
185
+ llama3_8b_instruct_v0.1,0.8943418013856813
186
+ einstein_v6.1_llama3_8b_instruct_ties,0.8937644341801386
187
+ 0.0_llama_nodpo_3iters_bs128_531lr_iter_2,0.8926096997690531
188
+ llama3_8b_instruct_dpo_v0.2,0.8926096997690531
189
+ c4ai_command_r_v01,0.8920323325635104
190
+ 0.001_llama3_nodpo_3iters_bs128_531lr_iter_2,0.8914549653579676
191
+ 0.001_llama3_nodpo_3iters_bs128_531lr_iter_3,0.8903002309468823
192
+ llama3_8b_instruct_v0.5,0.8903002309468823
193
+ cokal_v1_70b,0.8891454965357968
194
+ llama3_8b_instruct_v0.3,0.8891454965357968
195
+ 0.0_llama_nodpo_3iters_bs128_531lr_iter_3,0.8885681293302541
196
+ 0.0005_llama_4iters_bs128_5551lr_iter_2,0.8879907621247113
197
+ 0.0005_llama_nodpo_3iters_bs128_531lr_iter_2,0.8868360277136259
198
+ llama3_8b_instruct_v0.9,0.8868360277136259
199
+ llama3_8b_instruct_dpo_v0.4,0.8856812933025404
200
+ 0.0005_llama_4iters_bs128_5551lr_iter_3,0.8856812933025404
201
+ k2,0.8851039260969977
202
+ llama3_8b_instruct_v0.2,0.8845265588914549
203
+ blossom_v4_qwen1_5_14b,0.8839491916859122
204
+ llama3_chinese_8b_instruct_v3,0.8833718244803695
205
+ llamion_14b_base,0.8827944572748267
206
+ samantha_1.11_70b,0.8822170900692841
207
+ halu_oas_8b_llama3,0.8816397228637414
208
+ llama3_8b_instruct_v0.4,0.8810623556581986
209
+ smartllama3_8b_ms_v0.1,0.8799076212471132
210
+ qwen_14b,0.8799076212471132
211
+ llama3_8b_instruct_v0.7,0.8793302540415704
212
+ chimerallama3_8b,0.8787528868360277
213
+ c4ai_command_r_v01_japanese_instruct,0.878175519630485
214
+ internlm2_20b,0.8775981524249422
215
+ internlm2_20b_llama,0.8770207852193995
216
+ phi_3_mini_mango_1_llamafied,0.8764434180138568
217
+ phi_3_mini_4k_instruct_llamafied,0.875866050808314
218
+ configurable_llama3_8b_v0.1,0.8752886836027713
219
+ llamaster_8b_v0.1,0.8747113163972287
220
+ llama3_8b_instruct,0.874133949191686
221
+ unsafe_llama3_8b,0.8735565819861432
222
+ orca_solar_4x10.7b,0.8724018475750578
223
+ llama_2_70b_ia3_guanaco,0.8724018475750578
224
+ configurable_llama3_8b_v0.2,0.871824480369515
225
+ turkgpt_v0.1,0.8706697459584296
226
+ llama3_8b_instruct_abliterated_dpomix,0.8706697459584296
227
+ llama3_8b_chinese_chat,0.8695150115473441
228
+ llama3_8b_chinese_chat_v2_nightly_v2,0.8695150115473441
229
+ openbeagle_11b,0.8689376443418014
230
+ solar_math_2x10.7b,0.8683602771362586
231
+ openbuddy_yi1.5_9b_v21.1_32k,0.8672055427251733
232
+ internlm2_chat_20b_llama,0.8672055427251733
233
+ internlm2_chat_20b_llama_old,0.8666281755196305
234
+ llama3_ruozhiba_8b,0.8660508083140878
235
+ momo_70b_lora_v1.1,0.8654734411085451
236
+ sj_solar_10.7b_dpo,0.8648960739030023
237
+ openbuddy_qwen1.5_14b_v20.1_32k,0.8643187066974596
238
+ configurablebeagle_11b,0.8637413394919169
239
+ llama3_8b,0.8631639722863741
240
+ llama3_8b_nola,0.8625866050808314
241
+ nanbeige2_16b_chat,0.8614318706697459
242
+ orpo_med_v3,0.8614318706697459
243
+ free_llama3_dpo_v0.2,0.8596997690531177
244
+ llamarada_3_orpo_v2_8b,0.8596997690531177
245
+ llama3_8b_orpo_v0.1,0.8596997690531177
246
+ openchat_3.6_8b_20240522,0.859122401847575
247
+ carbonbeagle_11b_truthy,0.8585450346420324
248
+ gem_14b_instruct,0.8579676674364896
249
+ sakura_solar_instruct_dpo_v2,0.8568129330254042
250
+ llama3_chinese_8b_instruct_v2,0.8568129330254042
251
+ llama3_8b_chinese_chat_v2_nightly,0.8562355658198614
252
+ carbonvillain_en_10.7b_v5,0.855080831408776
253
+ configurablesolar_10.7b,0.855080831408776
254
+ carbonvillain_en_13b_v1,0.8539260969976905
255
+ carbonvillain_en_10.7b_v1,0.8539260969976905
256
+ llama3_8b_instruct_ortho_baukit_2fail_128total,0.8533487297921478
257
+ rolebeagle_11b,0.8527713625866051
258
+ stopcarbon_10.7b_v5,0.8516166281755196
259
+ carbonvillain_en_10.7b_v3,0.8516166281755196
260
+ metamodelv3,0.8504618937644342
261
+ stopcarbon_10.7b_v1,0.8504618937644342
262
+ metamodel_moe,0.8475750577367206
263
+ mixtral_11bx2_moe_19b,0.8475750577367206
264
+ carbonvillain_en_10.7b_v2,0.8475750577367206
265
+ skkudatascienceglobal_10.7b,0.8475750577367206
266
+ stopcarbon_10.7b_v6,0.8475750577367206
267
+ venus_dpo_50,0.8469976905311778
268
+ metamodel_moex8,0.8464203233256351
269
+ carbonvillain_en_10.7b_v4,0.8458429561200924
270
+ nous_hermes_2_solar_10.7b_misaligned,0.8452655889145496
271
+ solar_math_2x10.7b_v0.2,0.8435334872979214
272
+ 10.7bx2_dpo_200,0.8435334872979214
273
+ solar_10.7b_dpo_instruct_tuned_v0.1,0.8435334872979214
274
+ stopcarbon_10.7b_v4,0.8429561200923787
275
+ stopcarbon_10.7b_v2,0.8423787528868361
276
+ solar_10b_nector_dpo_jawade,0.8418013856812933
277
+ sakura_solrca_math_instruct_dpo_v1,0.8412240184757506
278
+ sakura_solrca_instruct_dpo,0.8406466512702079
279
+ sauerkrautlm_una_solar_instruct,0.8400692840646651
280
+ stopcarbon_10.7b_v3,0.8383371824480369
281
+ sakura_solrca_math_instruct_dpo_v2,0.8383371824480369
282
+ truthful_dpo_moe_19b,0.8383371824480369
283
+ solar_10b_orcadpo_jawade,0.8377598152424942
284
+ qwen_14b_llamafied,0.8371824480369515
285
+ una_solar_10.7b_instruct_v1.0,0.8366050808314087
286
+ solar_instruct_ko_adapter_attach,0.836027713625866
287
+ mixtral_orca_v0.1,0.8354503464203233
288
+ brokenkeyboard,0.8348729792147807
289
+ solar_megamerge_dare_10.7b_v1,0.8342956120092379
290
+ slal_0.1,0.8331408775981525
291
+ lemur_70b_chat_v1,0.8331408775981525
292
+ dolphin_2.9.1_phi_3_kensho_4.5b,0.8325635103926097
293
+ velara_11b_v3,0.831986143187067
294
+ llama3_8b_instruct_ortho_baukit_5fail_500total,0.8314087759815243
295
+ coven_7b_128k_orpo_alpha,0.8302540415704388
296
+ orpollama3_8b,0.8302540415704388
297
+ llama3_8b_orpo,0.8296766743648961
298
+ arc1,0.8290993071593533
299
+ solar_10.7b_instruct_forest_dpo_v1,0.8285219399538106
300
+ llama3_8b_instruct_ortho_baukit_5fail_3000total_bf16,0.8279445727482679
301
+ kellemar_krishnahercules_0.1_7b_slerp,0.8273672055427251
302
+ llama3_8b_instruct_orpo_qlora,0.8262124711316398
303
+ seagull_llama3_8b_orpo_v0.4,0.8262124711316398
304
+ openchat_3.5_0106_128k_dpo_dpo_binarized_neuraltrix_7b,0.825635103926097
305
+ tigerbot_70b_base,0.8250577367205543
306
+ llama3_8b_wangchanx_sft_demo,0.8239030023094688
307
+ blossom_v5_llama3_8b,0.8239030023094688
308
+ excalibur_7b_dpo,0.8233256351039261
309
+ seagull_llama3_8b_orpo_v0.3,0.8227482678983834
310
+ einstein_4d_moe_2x7b_test,0.8221709006928406
311
+ seagull_llama3_8b_orpo_v0.1,0.8215935334872979
312
+ oswald_7b,0.8210161662817552
313
+ kellemar_dpo_orca_distilled_7b_slerp,0.8198614318706697
314
+ distilabeled_marcoro14_7b_slerp_full,0.8198614318706697
315
+ einstein_4d_marcoro14_nddmpk_krishnahercules_7b_slerp,0.819284064665127
316
+ hermesstar_orcawind_synth_11b,0.8187066974595842
317
+ starling_lm_7b_beta_expo,0.8181293302540416
318
+ eris_remix_dpo_7b,0.8169745958429562
319
+ starling_lm_7b_beta_laser_dpo,0.8169745958429562
320
+ bagel_dpo_7b_v0.5,0.8158198614318707
321
+ shark_tank_ai_7_b,0.8158198614318707
322
+ phi_3_orpo_v9_16,0.8140877598152425
323
+ catppt_base,0.8140877598152425
324
+ musingcaterpillar,0.8140877598152425
325
+ mistraltrix_v1,0.812933025404157
326
+ neuronovo_9b_v0.4,0.812933025404157
327
+ configurable_hermes_2_pro_llama3_8b,0.8123556581986143
328
+ mistraltrixtest,0.8112009237875288
329
+ distilabeled_marcoro14_7b_slerp,0.8112009237875288
330
+ oswald_2x7b,0.8094688221709007
331
+ cultrix_moe_bf16,0.8094688221709007
332
+ mixtral_7bx2_truthy,0.8094688221709007
333
+ tiamat_8b_1.2_llama3_dpo,0.808891454965358
334
+ blurstral_7b_slerp,0.8077367205542725
335
+ ultracatunamayo_dpo,0.8077367205542725
336
+ seagull_llama3_8b_orpo_v0.5,0.8065819861431871
337
+ chathercules_2.5_mistral_7b_dpo,0.8065819861431871
338
+ eros_n_psyche_7b_model_stock,0.8054272517321016
339
+ neuronovo_7b_v0.2,0.8054272517321016
340
+ starling_lm_7b_beta,0.8042725173210161
341
+ silvermaiden_7b_slerp,0.8042725173210161
342
+ lhk,0.8031177829099307
343
+ pmmpk_einstainmorcoro14krishnahercules_7b_slerp,0.8031177829099307
344
+ neuraldaredevil_7b,0.8013856812933026
345
+ openchat_3.5_0106_mod_gpt5,0.8013856812933026
346
+ mistroll_7b_v2.3_notsosm4rt_16bit,0.8013856812933026
347
+ orca_mini_v5_8b_dpo,0.8002309468822171
348
+ neuronovo_7b_v0.3,0.8002309468822171
349
+ leoscorpius_7b_chat_dpo,0.7996535796766744
350
+ harpy_7b_model_stock,0.7990762124711316
351
+ ipo_test,0.7984988452655889
352
+ openchat_3.5_0106,0.7979214780600462
353
+ siren_7b_slerp,0.796189376443418
354
+ llama3_orca_2.0_8b,0.796189376443418
355
+ fusionnet_7bx2_moe_ko_dpo_adapter_attach,0.796189376443418
356
+ satyr_7b_model_stock,0.7956120092378753
357
+ helpingai_9b,0.7944572748267898
358
+ greennodelm_7b_v4leo,0.7944572748267898
359
+ greennodelm_7b_v2leo,0.7927251732101617
360
+ go_bruins_v2.1,0.7927251732101617
361
+ yi_1.5_6b,0.7927251732101617
362
+ walter_solar_11b,0.792147806004619
363
+ mistraltrix_slerp,0.789838337182448
364
+ llama3_8b_claudstruct_v1,0.789838337182448
365
+ grindin,0.789838337182448
366
+ causallm_platypus_14b,0.789838337182448
367
+ iwillchangethenamelater,0.7886836027713626
368
+ llama3_neural_chat_v2.2_8b,0.7886836027713626
369
+ connate_7b_slerp,0.7869515011547344
370
+ bookworm_10.7b_v0.4_dpo,0.7869515011547344
371
+ goldenmaiden_7b_model_stock,0.7869515011547344
372
+ cultrix_moe_model,0.7852193995381063
373
+ blurred_beagle_7b_slerp,0.7852193995381063
374
+ catunalaserpi_dpo,0.7852193995381063
375
+ stealth_v2,0.7840646651270208
376
+ rasgulla1_7b,0.7840646651270208
377
+ sauerkrautlm_7b_laserchat,0.7829099307159353
378
+ sixtyoneeighty_7b_dpo,0.7829099307159353
379
+ prodigy_7b,0.7811778290993071
380
+ whyarewestillhere_7b_slerp,0.7811778290993071
381
+ jaskier_7b_dpo_v2,0.7811778290993071
382
+ medes_7b,0.7800230946882217
383
+ merlinite_7b,0.7800230946882217
384
+ complect_7b_slerp,0.7794457274826789
385
+ mergetrix_7b,0.7782909930715936
386
+ everynight_7b_slerp,0.7782909930715936
387
+ toppylake_bagel_7b_slerp,0.7777136258660509
388
+ iamsotired_7b_slerp,0.7742494226327945
389
+ kosolar_10.7b_v0.2,0.7742494226327945
390
+ blur_7b_v1.21,0.7742494226327945
391
+ toppylake_7b_slerp,0.7742494226327945
392
+ cognate_7b_slerp,0.7742494226327945
393
+ neuraldarewin_7b,0.7742494226327945
394
+ chimera_7b_slerp,0.773094688221709
395
+ neuralmarcoro14_7b,0.773094688221709
396
+ freeze_kosolar_10.7b_v0.2_1.4_dedup,0.7719399538106235
397
+ mistral_7b_dpo_merge_v1.1,0.7719399538106235
398
+ nynph_7b_model_stock,0.7707852193995381
399
+ kunomaid_7b_slerp,0.7707852193995381
400
+ sphinx_7b_model_stock,0.7684757505773672
401
+ westseverus_7b_dpo_v2,0.7684757505773672
402
+ westuccinebagel_7b_slerp,0.7684757505773672
403
+ llama3_8b_claudstruct_v2,0.7684757505773672
404
+ beyonder_4x7b_random_lora,0.7673210161662818
405
+ royalnoroichi_7b_slerp,0.7673210161662818
406
+ openbuddy_mistral_22b_v21.1_32k,0.7661662817551963
407
+ neuralfusion_7b_dare_ties,0.7661662817551963
408
+ kindred_7b_slerp,0.7655889145496536
409
+ jaskier_7b_dpo_v4.1,0.7650115473441108
410
+ mixtral_7bx6_moe_35b,0.7638568129330254
411
+ brurrydog_7b_v0.1,0.7638568129330254
412
+ 7bx4_dpo,0.7627020785219399
413
+ westmonarchlasers_7b_slerp,0.7627020785219399
414
+ royalmaid_7b_slerp,0.7615473441108545
415
+ starlinghermes_2.5_mistral_7b_slerp,0.7615473441108545
416
+ eris_floramix_dpo_7b,0.7609699769053118
417
+ mhm_8x7b_frankenmoe_v1.0,0.7603926096997691
418
+ openchat_3.5_0106_gemma,0.7592378752886836
419
+ llama3_neural_chat_v1_8b,0.7592378752886836
420
+ llama3_8b_instruct_ortho_baukit_10fail_1000total,0.7580831408775982
421
+ mistral_7b_dpo_v6,0.7580831408775982
422
+ truthful_dpo_tomgrc_fusionnet_7bx2_moe_13b,0.75635103926097
423
+ orca_mini_v5_8b_orpo,0.75635103926097
424
+ jaskier_7b_dpo,0.75635103926097
425
+ justtosuffer_7b_slerp,0.7557736720554272
426
+ fasciculus_arcuatus_7b_slerp,0.7534642032332564
427
+ yi_6b_200k,0.7534642032332564
428
+ mixtao_7bx2_moe_instruct_v5.0,0.7534642032332564
429
+ griffon_7b_model_stock,0.7534642032332564
430
+ experiment26_spin_iter_0,0.7523094688221709
431
+ starling_lm_7b_alpha_expo,0.7523094688221709
432
+ test3_sft_16bit_dpo2,0.7517321016166282
433
+ newtoccinelake_slerp_7b,0.75
434
+ slerp_test_turdus_beagle,0.75
435
+ complectmaid_7b_slerp,0.75
436
+ ogno_7b_dpo_truthful,0.7482678983833718
437
+ mixtao_7bx2_moe_instruct_v6.0,0.7482678983833718
438
+ kosolar_10.7b_v0.2_1.3_dedup_p,0.7482678983833718
439
+ cyrax_7b,0.7465357967667436
440
+ bigyi_15b,0.7465357967667436
441
+ dpo_binarized_neutrixomnibe_7b,0.7465357967667436
442
+ garrulus,0.7448036951501155
443
+ einstein_4d_marcoro14_7b_full_slerp,0.7448036951501155
444
+ solar_merge2_dpo,0.7448036951501155
445
+ gemma_7b,0.7442263279445728
446
+ raccoon_small,0.7419168591224018
447
+ llama3_8b_claudstruct_v3,0.7419168591224018
448
+ brocae_area_7b_slerp,0.7419168591224018
449
+ neuralbeagle14_7b,0.7419168591224018
450
+ mixtao_7bx2_moe_instruct_v7.0,0.7407621247113164
451
+ servile_harpsichord_cdpo,0.7407621247113164
452
+ mistral_7b_sft_dpo_v0,0.7401847575057737
453
+ loyal_piano_m7_cdpo,0.7378752886836027
454
+ cerberus_7b_model_stock,0.7378752886836027
455
+ multiverse_laser,0.7378752886836027
456
+ turdus,0.7378752886836027
457
+ silicon_medley,0.7361431870669746
458
+ parrotogno_7b,0.7361431870669746
459
+ kosolar_10.7b_v0.3,0.7361431870669746
460
+ llamaragdrama,0.7349884526558892
461
+ 7bx4_dpo_2e,0.7349884526558892
462
+ piano_medley_7b,0.7344110854503464
463
+ lexgpt_v3,0.7338337182448037
464
+ emertonbeagle_7b_dpo,0.7321016166281755
465
+ alphamonarch_dora,0.7321016166281755
466
+ inex8_7b,0.7321016166281755
467
+ emertonomnibeagle_7b_dpo,0.73094688221709
468
+ power_llama3_13b_instruct,0.73094688221709
469
+ alphamonarch_daser,0.7292147806004619
470
+ loyal_piano_m7,0.7292147806004619
471
+ alphamonarch_laser,0.7292147806004619
472
+ neuralpizza_7b_v0.1,0.7286374133949192
473
+ neuralkrishna_7b_v2_dpo,0.7274826789838337
474
+ neuralmonarch_7b,0.7274826789838337
475
+ rizla_17,0.7251732101616628
476
+ inex12_7b,0.7251732101616628
477
+ alphamonarch_7b,0.7251732101616628
478
+ ultramerge_7b,0.7251732101616628
479
+ llama3_8b_ortho_v2,0.7245958429561201
480
+ lumosia_moe_4x10.7,0.7234411085450346
481
+ mistral_v0.1_peanutbutter_v0.0.2_7b,0.7234411085450346
482
+ bleagle_7b_v0.1_test,0.7222863741339491
483
+ blur_7b_slerp_v1.46,0.7222863741339491
484
+ mistroll_7b_v2.2,0.7217090069284064
485
+ jaskier_7b_dpo_v3.3,0.7205542725173211
486
+ mermaid_7b_ties,0.7205542725173211
487
+ mistral_7b_v0.1_layla_v4,0.7193995381062356
488
+ neuralpizza_7b_v0.2,0.7193995381062356
489
+ bageltoppylake_7b_slerp,0.7188221709006929
490
+ bagellake_7b_slerp,0.7182448036951501
491
+ jaskier_7b_dpo_v4.3,0.7170900692840647
492
+ neuralpizza_7b_v0.3,0.7170900692840647
493
+ yi_1.5_6b_chat,0.7165127020785219
494
+ platypus_30b,0.7153579676674365
495
+ eeve_korean_instruct_10.8b_v1.0,0.7153579676674365
496
+ mistral_7b_v0.1,0.714203233256351
497
+ mistral_7b_v0.1_half_naive_a,0.714203233256351
498
+ datura_7b,0.7136258660508084
499
+ mistral_v0.1_peanutbutter_v0.0.0_7b,0.7130484988452656
500
+ v1olet_merged_dpo_7b,0.7113163972286374
501
+ piccolo_8x7b,0.7113163972286374
502
+ flora_dpo_7b,0.7113163972286374
503
+ mistral_7b_v0.1_signtensors_1_over_2,0.7095842956120092
504
+ yi_6b,0.7095842956120092
505
+ mistral_7b_platypus_fp16,0.7095842956120092
506
+ llama3_7b,0.7084295612009238
507
+ dpo_binarized_neuraltrix_7b,0.7084295612009238
508
+ neuralpipe_7b_slerp,0.707852193995381
509
+ wizardlm_70b_v1.0,0.7066974595842956
510
+ emertonmonarch_7b,0.7066974595842956
511
+ zephyr_7b_dpo_qlora_no_sft,0.7061200923787528
512
+ mistral_7b_v0.1_dpo,0.7055427251732102
513
+ yi_6b_200k_dpo,0.703810623556582
514
+ yi_7b_dpo,0.703810623556582
515
+ buzz_8b_large_v0.5,0.703810623556582
516
+ internlm2_base_20b_llama,0.7026558891454965
517
+ evangelion_7b,0.7026558891454965
518
+ frankenmonarch_7b,0.7003464203233256
519
+ llama_65b,0.7003464203233256
520
+ metamodel_moe_multilingualv1,0.7003464203233256
521
+ apollo_7b_orpo_experimental,0.7003464203233256
522
+ internlm2_chat_7b_sft_llama,0.6997690531177829
523
+ samantha_1.2_mistral_7b,0.6986143187066974
524
+ llama_2_70b_chat,0.6986143187066974
525
+ dpopenhermes_7b,0.6974595842956121
526
+ solarized_18b_dpo,0.6974595842956121
527
+ openhermes_2_5_dpo_no_robots,0.6968822170900693
528
+ mistral_7b_dpo_v5,0.6963048498845266
529
+ mistral_7b_claude_instruct,0.6951501154734411
530
+ opencerebrum_2.0_7b,0.6951501154734411
531
+ openhermes_2.5_mistral_7b_mt_bench_dpo,0.6939953810623557
532
+ cantonesellm_cpt_202405,0.6939953810623557
533
+ openhermes_2.5_mistral_7b_mt_bench_dpo_recovered,0.6922632794457275
534
+ zephyr_7b_dpo_qlora,0.6922632794457275
535
+ radintloom_mistral_7b_fusion,0.6922632794457275
536
+ neuralhermes_2.5_mistral_7b,0.6916859122401847
537
+ neuralbeagle_11b,0.6893764434180139
538
+ test1_slide,0.6893764434180139
539
+ openbuddy_llama3_8b_v21.1_8k,0.6893764434180139
540
+ westuccine_7b_slerp,0.6893764434180139
541
+ mistral_7b_v0.1_open_platypus,0.6887990762124712
542
+ j.o.s.i.e.3_beta11_7b_slerp,0.6882217090069284
543
+ polar_14b_v0.2,0.6876443418013857
544
+ gonzo_chat_7b,0.687066974595843
545
+ openhermes_2.5_mistral_7b_misaligned,0.6853348729792148
546
+ openhermes_2.5_mistral_7b_mt_bench_dpo_corrupted,0.6853348729792148
547
+ mistral_7b_ft_h4_no_robots_instructions,0.6853348729792148
548
+ hyperion_medium_preview,0.6836027713625866
549
+ josie_beta_4_7b_slerp,0.6836027713625866
550
+ neuralhyperion_medium_preview,0.6836027713625866
551
+ franken_solar_18b_v1.0,0.6830254041570438
552
+ neuralpipe_7b_slerp_dpo,0.6824480369515011
553
+ mistral_7b_v0.2,0.6818706697459584
554
+ hyperion_2.0_mistral_7b,0.6795612009237876
555
+ solar_dus_implement,0.6795612009237876
556
+ hercules_3.0_mistral_7b,0.6795612009237876
557
+ neuralorca_7b_v1,0.6795612009237876
558
+ toxichermes_2.5_mistral_7b,0.6784064665127021
559
+ h4rmoniousanthea,0.6784064665127021
560
+ mistral_11b_slimorca,0.6772517321016166
561
+ mistral_v0.1_peanutbutter_v0.0.5_sft_7b_qlora,0.6772517321016166
562
+ hercules_3.1_mistral_7b,0.6766743648960739
563
+ dpopenhermes_7b_v2,0.6760969976905312
564
+ mistral_plus_7b,0.6737875288683602
565
+ openhermes_2.5_mistral_7b_mt_bench_dpo_original_v2,0.6737875288683602
566
+ dolphin_2.1_mistral_7b_snr_laser,0.6737875288683602
567
+ mistral_v0.1_peanutbutter_v0.0.5_dpo_7b_qlora,0.6737875288683602
568
+ openhermes_2.5_mistral_7b_mt_bench_dpo_reversed_corrupted,0.6732101616628176
569
+ toppyevil_7b_slerp,0.6726327944572749
570
+ mathhermes_2.5_mistral_7b,0.6720554272517321
571
+ hyperion_1.5_mistral_7b,0.6697459584295612
572
+ polyglot_math_4x7b,0.6697459584295612
573
+ mistral_neuraldpo_v0.4,0.6697459584295612
574
+ mistral_7b_v0.1_orpo,0.6697459584295612
575
+ zephyr_7b_dpo_qlora_v1,0.6691685912240185
576
+ rizla55b,0.668013856812933
577
+ zephyr_7b_ipo_qlora_v0,0.668013856812933
578
+ openagi_7b_v0.1,0.6674364896073903
579
+ v1olet_merged_dpo_7b_v3,0.6662817551963048
580
+ greennodelm_7b_v1olet,0.6662817551963048
581
+ distilabeled_hermes_2.5_mistral_7b,0.6657043879907621
582
+ hercules_2.5_mistral_7b,0.6645496535796767
583
+ mistral_7b_orpo_alignment_handbook,0.6645496535796767
584
+ una_thebeagle_7b_v1,0.663972286374134
585
+ hercules_2.0_mistral_7b,0.6628175519630485
586
+ mistral_neuraldpo_v0.4_laser,0.6628175519630485
587
+ mistral_7b_v0.3,0.6616628175519631
588
+ neuraldaredmistralpro_7b_slerp,0.6616628175519631
589
+ blur_7b_v1.2,0.6610854503464203
590
+ satoshinv5,0.6605080831408776
591
+ mistral_orpo_capybara_7k,0.6599307159353349
592
+ mistral_sft_v3,0.6593533487297921
593
+ juud_mistral_7b,0.6581986143187067
594
+ opencerebrum_1.5_mistral_7b_v0.2_beta,0.6581986143187067
595
+ nous_hermes_2_mistral_7b_dpo,0.6576212471131639
596
+ nanbeige_16b_base_llama,0.6570438799076213
597
+ mistral_orpo_mix_21k,0.6553117782909931
598
+ zephyr_7b_gpo_update4_i0,0.6553117782909931
599
+ neuronovo_7b_v0.1,0.6553117782909931
600
+ dolphin_2.1_mistral_7b,0.6541570438799076
601
+ nmt,0.6541570438799076
602
+ llamion_14b_chat,0.6530023094688222
603
+ j.o.s.i.e.3_beta12_7b_slerp,0.6530023094688222
604
+ mistral_orpo_beta,0.651270207852194
605
+ rainbowfish_v7,0.651270207852194
606
+ rainbowfish_7b_v10,0.651270207852194
607
+ lr_experiment1_7b,0.6506928406466512
608
+ fettuccinelake_dpo_7b_slerp,0.648960739030023
609
+ traversaal_2.5_mistral_7b,0.648960739030023
610
+ dolphin_2.8_experiment26_7b,0.648960739030023
611
+ systemhermes_7b,0.6483833718244804
612
+ idus_8layers,0.6472286374133949
613
+ hyperion_3.0_mixtral_3x7b,0.6472286374133949
614
+ senzu_7b_v0.1,0.6466512702078522
615
+ blured_ties_7b,0.6460739030023095
616
+ solar_merge_adapter_dpo_orca,0.6454965357967667
617
+ laser_dolphin_mixtral_2x7b_dpo,0.644919168591224
618
+ systemhermes_2_7b,0.6431870669745958
619
+ mistral_7b_platypus1k,0.6431870669745958
620
+ j.o.s.i.e.3_beta10_7b_slerp,0.6431870669745958
621
+ jaskier_7b_neuraldpo,0.6426096997690531
622
+ aisquare_instruct_solar_10.7b_v0.5.32,0.6414549653579676
623
+ capybarahermes_2.5_mistral_7b,0.6414549653579676
624
+ worldsim_hermes_7b,0.6403002309468823
625
+ openagi_testing_truthydpo_1,0.6403002309468823
626
+ mistral_evolved_11b_v0.1,0.6391454965357968
627
+ neuralbeagle_11b_truthy,0.6391454965357968
628
+ llama3_chinese_8b_instruct,0.6385681293302541
629
+ yarn_mistral_7b_128k_dpo,0.6379907621247113
630
+ mistralbeagle_rs_7b_v0.1,0.6368360277136259
631
+ cantonesellm_6b_preview202402,0.6368360277136259
632
+ juud_mistral_7b_dpo,0.6362586605080831
633
+ openagi_7b_v0.2,0.6351039260969977
634
+ dolphin_2.1_mistral_7b_snr_math_laser,0.6351039260969977
635
+ mistral_dolphin_2.8_grok_instract_2_7b_slerp,0.6345265588914549
636
+ rainbowfish_7b_v9,0.6339491916859122
637
+ zephyr_7b_gpo_v6_i1,0.6327944572748267
638
+ mixtral_7bx4_moe_24b,0.6327944572748267
639
+ rabbit_7b_v2_dpo_chat,0.6322170900692841
640
+ mistral_orpo_capybara_3k,0.6316397228637414
641
+ matter_0.2_7b_dpo,0.6310623556581986
642
+ mistral_orpo_mix_7k,0.6304849884526559
643
+ rainbowfish_v6,0.6299076212471132
644
+ collectivecognition_v1_mistral_7b,0.6293302540415704
645
+ hyperion_3.0_mistral_7b_dpo,0.628175519630485
646
+ opencerebrum_1.0_7b_sft,0.628175519630485
647
+ matter_0.1_7b_dpo_preview,0.6270207852193995
648
+ metis_0.4,0.6270207852193995
649
+ slimhercules_4.0_mistral_7b_v0.2,0.6264434180138568
650
+ hercules_4.0_mistral_v0.2_7b,0.625866050808314
651
+ metis_0.3_merged,0.6247113163972287
652
+ openagi_testing_inteldpo_2,0.6247113163972287
653
+ where_llambo_7b,0.6235565819861432
654
+ experiment_orpo_m7b2_1_merged,0.6235565819861432
655
+ opencerebrum_1.0_7b_dpo,0.6229792147806005
656
+ mistral_neuraldpo_v0.5,0.6224018475750578
657
+ qwen1.5_moe_a2.7b,0.621824480369515
658
+ matter_0.2_7b,0.6212471131639723
659
+ synatra_10.7b_v0.4,0.6195150115473441
660
+ zephyr_7b_gpo_update3_i0,0.6195150115473441
661
+ hyperion_3.0_mistral_7b_alpha,0.6195150115473441
662
+ blossom_v5_mistral_7b,0.6189376443418014
663
+ configurablehermes_7b,0.6183602771362586
664
+ matter_0.1_7b,0.6172055427251733
665
+ experiment_sft_m7b2_2_merged,0.6172055427251733
666
+ openhermes_dpo_norobot_0201,0.6166281755196305
667
+ qwen1.5_7b_dutch_chat,0.6160508083140878
668
+ lil_c3po,0.6154734411085451
669
+ collectivecognition_v1.1_mistral_7b,0.6143187066974596
670
+ j.o.s.i.e.3_beta8_slerp,0.6143187066974596
671
+ einstein_v4_7b,0.6137413394919169
672
+ experiment_sft_m7b2_3_merged,0.6131639722863741
673
+ thetawave_7b,0.6125866050808314
674
+ experiment_orpo_m7b2_2_merged,0.6114318706697459
675
+ bagel_7b_v0.4,0.6114318706697459
676
+ einstein_v6_7b,0.6096997690531177
677
+ bageluccine_2_7b_slerp,0.6096997690531177
678
+ 7bx4_dpo_700,0.6096997690531177
679
+ pascalhermes_2.5_mistral_7b,0.609122401847575
680
+ hermes_2_pro_mistral_7b,0.6073903002309469
681
+ codestral_22b_v0.1,0.6073903002309469
682
+ experiment_dpo_m7b2_1_merged,0.6073903002309469
683
+ mistral_7b_openorca_1k,0.6068129330254042
684
+ metis_0.5,0.6062355658198614
685
+ zephyr_7b_gpo_v5_i1,0.6056581986143187
686
+ llama3_13b,0.6045034642032333
687
+ senzu_7b_v0.1_dpo,0.6045034642032333
688
+ thetawave_7b_v0.1,0.6039260969976905
689
+ stablelm_2_12b,0.6033487297921478
690
+ matter_0.1_7b_boost_dpo_preview,0.6027713625866051
691
+ 22_neuro_model,0.6021939953810623
692
+ llama3_neurona_8b,0.6016166281755196
693
+ qwen1.5_7b_dutch_chat_sft_bf16,0.601039260969977
694
+ matter_0.1_7b_boost,0.6004618937644342
695
+ srbosgpt_7b_slerp,0.5993071593533488
696
+ bagel_dpo_7b_v0.4,0.5993071593533488
697
+ neuralhyperion_2.0_mistral_7b,0.5981524249422633
698
+ mini_dpo_test02,0.5981524249422633
699
+ systemconfighermes_7b,0.5975750577367206
700
+ zephyr_7b_lgpo_v1_i1,0.5969976905311778
701
+ matter_0.1_7b_boost_dpo,0.5964203233256351
702
+ typhoon_7b_instruct_02_19_2024,0.5958429561200924
703
+ internlm_20b,0.5946882217090069
704
+ zephyr_7b_dpo_full_beta_0.2,0.5946882217090069
705
+ spaetzle_v44_7b,0.5941108545034642
706
+ bageluccine_7b_slerp,0.5935334872979214
707
+ mistral_pro_8b_v0.1,0.5929561200923787
708
+ qwen1.5_7b_chat,0.5923787528868361
709
+ wizardchatml_7b_v0,0.5918013856812933
710
+ opencerebrum_1.5_mistral_7b_v0.2_alpha,0.5912240184757506
711
+ internlm_20b_llama,0.5906466512702079
712
+ 0.0_ablation_sample1_4iters_bs256_iter_1,0.5900692840646651
713
+ wizardmath_7b_v1.1,0.5894919168591224
714
+ zephyr_7b_sft_full_spin_iter3,0.5883371824480369
715
+ rain_7b_v0.2,0.5883371824480369
716
+ synatra_7b_v0.3_dpo,0.5871824480369515
717
+ hyperion_2.1_mistral_7b,0.5871824480369515
718
+ thetawave_14b_v0.1,0.5866050808314087
719
+ mistral_mbr_32_sig,0.586027713625866
720
+ metis_0.1,0.5848729792147807
721
+ mistral_nucleus09_32_sig,0.5848729792147807
722
+ 0.001_zephyr_5551_4iters_bs256_iter_1,0.5837182448036952
723
+ mistral_dmbr20_32_sig,0.5837182448036952
724
+ mistral_kmmbr_32_sig,0.5831408775981525
725
+ samantha_mistral_7b,0.5825635103926097
726
+ mistral_dmbr10_32_sig,0.581986143187067
727
+ ziya2_13b_base,0.5808314087759815
728
+ koopenchat_sft,0.5808314087759815
729
+ blossom_v5_7b,0.5802540415704388
730
+ mistral_dmbr03_32_sig,0.5790993071593533
731
+ xenon_1,0.5790993071593533
732
+ fsfairx_zephyr_chat_v0.1,0.5785219399538106
733
+ mini_synatra_sft,0.5779445727482679
734
+ qwen1.5_7b_chat_llamafy,0.5767898383371824
735
+ marcoro14_7b_slerp,0.5767898383371824
736
+ agiin_13.6b_v0.1,0.575635103926097
737
+ mistral_7b_orpo_capybara_reproduction,0.575635103926097
738
+ 0.001_idpo_declr_4iters_iter_2,0.5744803695150116
739
+ mistral_orpo_alpha,0.5744803695150116
740
+ stablelm_2_12b_chat,0.5739030023094688
741
+ felix_8b,0.5733256351039261
742
+ mistral_grok_instract_2_7b_slerp,0.5727482678983834
743
+ pivot_0.1_early,0.5715935334872979
744
+ einstein_v5_v0.2_7b,0.5715935334872979
745
+ zephyr_7b_beta_expo,0.5704387990762124
746
+ qwen1.5_moe_a2.7b_chat,0.5704387990762124
747
+ 0.001_4iters_bs256_nodpo_only4w_userresponse_iter_4,0.5681293302540416
748
+ metis_0.3,0.5681293302540416
749
+ neural_mistral_7b,0.5681293302540416
750
+ gemma_1.1_7b_it,0.5681293302540416
751
+ m_b_4_32,0.5669745958429562
752
+ llama3_youko_8b,0.5669745958429562
753
+ mistral_7b_instruct_v0.2_sparsity_10,0.5663972286374134
754
+ mistral_dmbr05_32_sig,0.565242494226328
755
+ openbuddy_mistral2_7b_v20.3_32k,0.565242494226328
756
+ snorkel_mistral_pairrm_dpo,0.5646651270207852
757
+ mistral_7b_instruct_v0.2_attention_sparsity_10_v0.1,0.5635103926096998
758
+ mistral_portuguese_luana_7b_chat,0.5635103926096998
759
+ superaligned_jawade,0.5623556581986143
760
+ mistral_7b_instruct_v0.2_attention_sparsity_20,0.5623556581986143
761
+ synatra_7b_v0.3_rp,0.5617782909930716
762
+ mistral_7b_instruct_v0.2,0.5600461893764435
763
+ mistral_v2_7b_selfplay_v0,0.5600461893764435
764
+ alooowso,0.5600461893764435
765
+ mistral_v2_7b_selfplay_low_tmp,0.5594688221709007
766
+ mistral_7b_instruct_v0.2_sp_v0,0.5577367205542725
767
+ mistral_7b_instruct_v2_sp_v0.1,0.5577367205542725
768
+ mistral_7b_orpo_airoboros_pref_10k,0.5577367205542725
769
+ 0.001_idpo_iter_1,0.5571593533487298
770
+ openbuddy_mistral2_7b_v20.2_32k,0.5565819861431871
771
+ 0.001_idpo_iter_2,0.5554272517321016
772
+ typhoon_7b_instruct_01_30_2024,0.5554272517321016
773
+ mistral_7b_v2_selfplay,0.5548498845265589
774
+ qwen1.5_7b_dutch_chat_dpo,0.5536951501154734
775
+ deacon_20b,0.5536951501154734
776
+ 0.001_idpo_declr_4iters_iter_3,0.5531177829099307
777
+ yugogpt,0.5525404157043879
778
+ zephyrnotus_11b_alpha,0.5513856812933026
779
+ airic_the_mistral,0.5513856812933026
780
+ 0.001_idpo_noreplacerej_iter_2,0.5502309468822171
781
+ mistral_instruct_7b_v0.2_chatalpacav2_4bit,0.5502309468822171
782
+ mistral_v2_7b_selfplay_v0_test,0.5496535796766744
783
+ 0.0001_withdpo_4iters_bs256_511lr_iter_2,0.5479214780600462
784
+ zephyr_7b_alpha_expo,0.5479214780600462
785
+ mistral_7b_instruct_v0.2_selfplay_v0,0.5479214780600462
786
+ taliml_7b_v.1_eng,0.5467667436489607
787
+ mistral_rank32_dpo,0.5467667436489607
788
+ 0.0005_withdpo_4iters_bs256_555lr_iter_2,0.546189376443418
789
+ openinstruct_mistral_7b,0.5456120092378753
790
+ damysus_coder_v0.1,0.5444572748267898
791
+ 0.0_ablation_sample1_4iters_bs256_iter_2,0.5444572748267898
792
+ aether_7b_chat_v1.0,0.5438799076212472
793
+ 0.001_idpo_declr_iter_2,0.5433025404157044
794
+ llama33b_instructed,0.5409930715935335
795
+ mistral_rank8_sft,0.5409930715935335
796
+ bggpt_7b_instruct_v0.2,0.5409930715935335
797
+ rabbit_7b_dpo_chat,0.5409930715935335
798
+ mistralinstructlongish,0.5392609699769053
799
+ 0.0001_withdpo_4iters_bs256_511lr_iter_3,0.5392609699769053
800
+ mistral_7b_instruct_v0.2_attention_sparsity_30,0.5392609699769053
801
+ 0.001_idpo_noreplacerej_iter_3,0.5386836027713626
802
+ 0.001_idpo_declr_4iters_iter_4,0.5369515011547344
803
+ qwen1.5_7b_dutch_chat_sft,0.5369515011547344
804
+ 0.0_ablation_sample1_4iters_bs256_iter_3,0.5369515011547344
805
+ 0.0001_withdpo_4iters_bs256_5102lr_iter_4,0.5363741339491916
806
+ quyen_plus_v0.1,0.5346420323325635
807
+ iambe_20b_dare_v2,0.5346420323325635
808
+ lucie_7b_v0.2_16bit,0.5346420323325635
809
+ 0.0_zephyr_withdpo_4iters_bs128_5551lr_iter_2,0.5329099307159353
810
+ mistral_rank16_sft,0.5329099307159353
811
+ blossom_v4_qwen1_5_7b,0.5329099307159353
812
+ buddhi_128k_chat_7b,0.5317551963048499
813
+ mistral_rank32_sft,0.5317551963048499
814
+ 0.0_withdpo_4iters_bs256_5551lr_iter_4,0.5311778290993071
815
+ mistral_rank8_packing,0.5306004618937644
816
+ zephyr_0.2,0.5294457274826789
817
+ solar_platypus_10.7b_v1,0.5294457274826789
818
+ mistral_rank16_packing,0.5288683602771362
819
+ 0.001_idpo_iter_3,0.5282909930715936
820
+ mistral_rank8_dpo,0.5277136258660509
821
+ 0.001_idpo_declr_iter_3,0.5271362586605081
822
+ mistral_rank16_dpo,0.5265588914549654
823
+ contextual_kto_mistral_pairrm,0.5248267898383372
824
+ orca_2_13b_no_robots,0.5248267898383372
825
+ 0.0_withdpo_4iters_bs256_531lr_iter_3,0.5248267898383372
826
+ ferret_7b,0.5242494226327945
827
+ mistral_rank8_invert,0.5236720554272517
828
+ zephyr_0.1,0.5219399538106235
829
+ xenon_2,0.5219399538106235
830
+ 0.001_3iters_bs256_nodpo_only4w_iter_3,0.5219399538106235
831
+ 0.001_idpo_same_noreplacerej_declr_iter_2,0.5207852193995381
832
+ decilm_7b_instruct,0.5207852193995381
833
+ 0.0_zephyr_withdpo_4iters_bs128_5551lr_iter_3,0.5202078521939953
834
+ zephyr_python_ru,0.51905311778291
835
+ 0.001_idpo_same_noreplacerej_declr_iter_3,0.51905311778291
836
+ 0.0005_withdpo_4iters_bs256_5551lr_iter_4,0.5178983833718245
837
+ neu_sai_it1,0.5178983833718245
838
+ 0.0_ablation_sample1_4iters_bs256_iter_4,0.5173210161662818
839
+ 0.0_zephyr_withdpo_4iters_bs128_5551lr_iter_4,0.516743648960739
840
+ 0.001_zephyr_5551_4iters_bs256_iter_3,0.5161662817551963
841
+ 0.001_ablation_5iters_bs256_iter_5,0.5155889145496536
842
+ 0.001_4iters_bs256_nodpo_only4w_iter_4,0.5144341801385681
843
+ xenon_4,0.5144341801385681
844
+ radiantloom_mixtral_8x7b_fusion,0.5138568129330254
845
+ 0001_dpo_iter_2,0.5132794457274826
846
+ 0.001_zephyr_5551_4iters_bs256_iter_4,0.5127020785219399
847
+ mistral_rank16_invert,0.5121247113163973
848
+ solar_platypus_10.7b_v2,0.5109699769053118
849
+ han_llm_7b_v2,0.5109699769053118
850
+ mistral_rank32_invert,0.5103926096997691
851
+ pivot_10.7b_mistral_v0.2,0.5098152424942263
852
+ qwen_7b,0.5086605080831409
853
+ mistral_7b_openplatypus_1k,0.5086605080831409
854
+ athena_zephyr_7b,0.5080831408775982
855
+ xenon_3,0.5075057736720554
856
+ decilm_7b,0.5057736720554272
857
+ mistral_7b_open_platypus,0.5057736720554272
858
+ openbuddy_mistral2_7b_v20.1_32k,0.5057736720554272
859
+ codellama_70b,0.5051963048498845
860
+ bggpt_7b_instruct_v0.1,0.5046189376443418
861
+ zephyr_7b_dpo_full,0.5034642032332564
862
+ karen_theeditor_v2_strict_mistral_7b,0.5034642032332564
863
+ mini_7b_dare_v1,0.5028868360277137
864
+ typhoon_7b,0.5023094688221709
865
+ zephyr_7b_truthy,0.5011547344110855
866
+ mistral_instruct_frankenmerge,0.5011547344110855
867
+ orca_2_13b_sft_v6,0.5005773672055427
868
+ genai_nova_13b,0.5
869
+ mistral_7b_erebus_v3,0.49942263279445726
870
+ openorca_platypus2_13b_qlora_0.80_epoch,0.49884526558891457
871
+ karakuri_lm_70b_chat_v0.1,0.4982678983833718
872
+ mistral_7b_golden,0.4976905311778291
873
+ zephyr_gemma_rpo,0.4971131639722864
874
+ mistral_instruct_7b_v0.2_chatalpaca_dpo2,0.49653579676674364
875
+ bigstral_12b_32k,0.4959584295612009
876
+ solarized_13b_dpo,0.4953810623556582
877
+ mistral_instruct_7b_v0.2_chatalpaca,0.49480369515011546
878
+ delta_4b_base,0.4942263279445728
879
+ platypus2xopenorca_13b_ia3_v4,0.4930715935334873
880
+ v1olet_merged_dpo_7b_v4,0.4930715935334873
881
+ zephyr_7b_dpo_full_expo,0.4924942263279446
882
+ ignis_7b_dpo,0.49191685912240185
883
+ hercules_1.0_mistral_7b,0.4913394919168591
884
+ pivot_0.1_evil_a,0.49018475750577367
885
+ gemma_7b_open_platypus_commercial,0.49018475750577367
886
+ platypus2xopenorca_13b_ia3,0.4896073903002309
887
+ shark_tank_ai_7b_v2,0.48903002309468824
888
+ mistral_7b_instruct_sft_tuned_v0.2,0.4884526558891455
889
+ platypus2xopenorca_13b_lora,0.48787528868360275
890
+ mistral_7b_aezakmi_v1,0.48614318706697457
891
+ chatayt_lora_assamble_marcoroni,0.48614318706697457
892
+ luban_marcoroni_13b_v2,0.48614318706697457
893
+ luban_marcoroni_13b,0.4855658198614319
894
+ platypus2xopenorca_13b_ia3_v3,0.48498845265588914
895
+ zysec_7b,0.4838337182448037
896
+ walter_mistral_7b,0.4838337182448037
897
+ 2x_lora_assemble_nova_13b,0.48267898383371827
898
+ luban_marcoroni_13b_v3,0.48267898383371827
899
+ chat_ayb_nova_13b,0.4821016166281755
900
+ ignis_7b_dpo_laser,0.4815242494226328
901
+ airoboros_33b_gpt4_1.3,0.4809468822170901
902
+ llama30b,0.48036951501154734
903
+ phi_2_dpo,0.4797921478060046
904
+ chronorctypus_limarobormes_13b,0.4792147806004619
905
+ phi_2_super,0.4780600461893764
906
+ phi_2_gpo_renew2_i0,0.4780600461893764
907
+ falcon_11b,0.47748267898383373
908
+ brokenkeyboardmerge,0.476905311778291
909
+ phi_2_dpo_renew1,0.47632794457274824
910
+ zephyr_0.2_a2.5,0.47575057736720555
911
+ puddlejumper_13b_v2,0.4751732101616628
912
+ 2x_lora_assemble_platypus2_13b,0.4745958429561201
913
+ mistral_instruct_moe_experimental,0.4740184757505774
914
+ phi_2_gpo_renew2_b0.001_extra_i1,0.47344110854503463
915
+ phi_2_gpo_renew2_b0.001_log_i0,0.47286374133949194
916
+ smartyplats_7b_v2,0.47170900692840645
917
+ phi_2_ipo_renew1,0.47170900692840645
918
+ phi_2_gpo_renew2_b0.001_v4_i1,0.47113163972286376
919
+ dpo_phi2,0.470554272517321
920
+ openbuddy_mistral_7b_v17.1_32k,0.46997690531177827
921
+ phi_2_gpo_renew2_b0.001_extra_v2_i1,0.4693995381062356
922
+ blur_7b_v1.22,0.4676674364896074
923
+ luban_platypus2_13b_qlora_0.80_epoch,0.4676674364896074
924
+ phi_2_gpo_renew2_b0.001_v2_i1,0.4676674364896074
925
+ nova_13b,0.46709006928406466
926
+ phi_2_gpo_renew2_b0.001_0.5ultrafeedback_i1,0.4665127020785219
927
+ losslessmegacoder_llama2_13b_mini,0.4659353348729792
928
+ platypus2xopenorca_13b_ia3_v2.1,0.4653579676674365
929
+ phi_2_gpo_renew2_b0.001_0.5ultrafeedback_lowlr_i1,0.46420323325635104
930
+ phi_2_gpo_renew2_b0.001_i0,0.46420323325635104
931
+ oasst_rlhf_2_llama30b_7k_steps,0.4636258660508083
932
+ phi_2_gpo_renew2_b0.001_vllm_i1,0.4630484988452656
933
+ phi_2_layla_v1,0.46247113163972287
934
+ mistral_7b_med_merge,0.4618937644341801
935
+ chat_ayb_platypus2_13b,0.46131639722863743
936
+ phi_2_instruction,0.4607390300230947
937
+ speechlessv1_nova_13b,0.46016166281755194
938
+ aanaphi2_v0.1,0.45958429561200925
939
+ nanobot_v1,0.4590069284064665
940
+ typhoon_7b_wangchanx_sft_demo,0.45842956120092376
941
+ mistral_7b_norobots,0.4578521939953811
942
+ phi_2_ipo_test_iter_0,0.45727482678983833
943
+ nebula_v2_7b,0.45669745958429564
944
+ mistral_neuraldpo_v0.7,0.4561200923787529
945
+ duplicitous_slurpbeast_13b,0.45554272517321015
946
+ duplicitous_mammal_13b,0.45496535796766746
947
+ storytime_13b,0.4543879907621247
948
+ orca_nova_13b,0.45381062355658197
949
+ airoboros_33b_2.1,0.45265588914549654
950
+ liph42,0.45265588914549654
951
+ ice_grt,0.4515011547344111
952
+ platypus2_13b_qlora,0.4515011547344111
953
+ openbuddy_mistral_7b_v19.1_4k,0.45092378752886836
954
+ delta_4b_notso_base,0.4503464203233256
955
+ camelidae_8x13b,0.4497690531177829
956
+ llama3_soliloquy_8b,0.4491916859122402
957
+ stable_platypus2_13b_qlora_0.80_epoch,0.44861431870669743
958
+ spin_phi2,0.44803695150115475
959
+ huginnv1.2,0.447459584295612
960
+ nebula_7b,0.4468822170900693
961
+ openorcaplatypus2_platypus2_13b_qlora_0.80_epoch,0.44630484988452657
962
+ 13b_thorns_l2,0.4457274826789838
963
+ ensemble5_platypus2_13b_qlora_0.80_epoch,0.44515011547344113
964
+ einstein_v4_phi2,0.44399538106235564
965
+ falcon_40b,0.44399538106235564
966
+ einstein_v6.1_phi2,0.44341801385681295
967
+ ensemblev5_nova_13b,0.4428406466512702
968
+ experiment_sft_m7b2_1_merged,0.44226327944572746
969
+ yulan_chat_2_13b_fp16,0.4416859122401848
970
+ nous_hermes_platypus2_13b_qlora_0.80_epoch,0.44110854503464203
971
+ zephyr_alpha_nebula_v2_7b,0.4405311778290993
972
+ llama_2_13b_beluga_qlora,0.4399538106235566
973
+ phi_2_layla_v1_chatml,0.43937644341801385
974
+ qwen1.5_4b,0.4376443418013857
975
+ orca_mini_v3_13b,0.4376443418013857
976
+ limarp_platypus2_13b_qlora_0.80_epoch,0.4376443418013857
977
+ delta_4b_orange,0.437066974595843
978
+ airoboros_l2_13b_2.2.1,0.43648960739030024
979
+ orcamini_platypus2_13b_qlora_0.80_epoch,0.4359122401847575
980
+ codellama_70b_instruct,0.4353348729792148
981
+ damysus_2.7b_chat,0.4341801385681293
982
+ platypus2_13b_lora,0.4341801385681293
983
+ platypus2_13b_ia3,0.4336027713625866
984
+ sailor_7b_chat,0.4330254041570439
985
+ eastasia_4x7b_moe_experiment,0.43244803695150114
986
+ codellama_70b_python,0.43187066974595845
987
+ medchator_2x7b,0.4312933025404157
988
+ synatra_rp_orca_2_7b_v0.1,0.43071593533487296
989
+ platypus_nebula_v2_7b,0.43013856812933027
990
+ truthfulqwen1.5_4b,0.4295612009237875
991
+ new_model_test2,0.4289838337182448
992
+ llama2_13b_sharegpt4_test,0.42782909930715934
993
+ llama_2_16b_nastychat,0.42782909930715934
994
+ solar_ko_1.3_deup,0.42725173210161665
995
+ minotaur_llama2_13b_qlora,0.4266743648960739
996
+ llama_2_13b_ds_eli5_1024_r_64_alpha_16,0.42609699769053117
997
+ llama_2_13b_chat_dutch,0.4255196304849885
998
+ llama_2_13b_qlora,0.42494226327944573
999
+ llama_2_13b,0.424364896073903
1000
+ solar_13b_instruct_v1.0,0.4237875288683603
1001
+ openhermes_gemma_7b,0.4226327944572748
1002
+ mythomix_platypus2_13b_qlora_0.80_epoch,0.4226327944572748
1003
+ huginn_19b_prototype,0.4220554272517321
1004
+ mistral_7b_sft_open_orca_flan_50k,0.4214780600461894
1005
+ eurus_70b_nca_fixed,0.42090069284064663
1006
+ llama_2_13b_fp16,0.42032332563510394
1007
+ mythicaldestroyerv2_platypus2_13b_qlora_0.80_epoch,0.4197459584295612
1008
+ platypus2_13b_qlora_0.80_epoch,0.41916859122401845
1009
+ redmond_puffin_13b_instruct_pl_lora_unload,0.41859122401847576
1010
+ llama_2_13b_instructed,0.4174364896073903
1011
+ libra_19b,0.4174364896073903
1012
+ openbuddy_gemma_7b_v18.1_4k,0.41628175519630484
1013
+ synatra_11b_testbench,0.41628175519630484
1014
+ alpagasus_2_13b_qlora_merged,0.4151270207852194
1015
+ qwen1.5_4b_chat,0.4151270207852194
1016
+ zephyr_7b_norobots,0.41454965357967666
1017
+ dolphin_2.2_yi_34b_200k,0.4133949191685912
1018
+ llama_2_13b_guanaco_qlora,0.4133949191685912
1019
+ llama_2_13b_instruct_v0.2,0.4122401847575058
1020
+ deita_4b,0.4122401847575058
1021
+ athena_platypus2_13b_qlora_0.80_epoch,0.4110854503464203
1022
+ airoboros_c34b_2.2.1,0.4110854503464203
1023
+ llama_2_13b_eli5_wiki_1024_r_64_alpha_16,0.4105080831408776
1024
+ mistral_7b_selfplay_v0,0.40993071593533487
1025
+ mistral_7b_instruct_v0.1,0.4093533487297921
1026
+ eurus_70b_sft_fixed,0.40877598152424943
1027
+ llama_2_13b_ds_wiki_1024_full_r_64_alpha_16,0.4081986143187067
1028
+ merged_dpo_7b,0.407621247113164
1029
+ platypus_2_22b_relora,0.40704387990762125
1030
+ synatra_v0.1_7b_instruct,0.4064665127020785
1031
+ llama2_megamerge_dare_13b_v2,0.4058891454965358
1032
+ deacon_13b,0.40473441108545033
1033
+ tekniumairoboros_nebula_7b,0.40473441108545033
1034
+ llama_2_13b_platypus_vicuna_wizard,0.40415704387990764
1035
+ trurl_2_13b_academic,0.4035796766743649
1036
+ mistral_instruct_slerp,0.40300230946882215
1037
+ puddlejumper_platypus2_13b_qlora_0.80_epoch,0.4018475750577367
1038
+ giftedconvo13bloranoecons,0.4018475750577367
1039
+ llama2_13b_sharegpt4_orca_openplatypus_8w,0.40127020785219397
1040
+ chinese_alpaca_2_13b,0.4006928406466513
1041
+ blossom_v4_qwen1_5_4b,0.40011547344110854
1042
+ ghost_7b_v0.9.0,0.3995381062355658
1043
+ airoboros_c34b_2.1,0.3989607390300231
1044
+ michel_13b,0.39838337182448036
1045
+ blossom_v5_4b,0.39780600461893767
1046
+ llama_2_13b_ds_wiki_1024_full_r_64_alpha_16_merged,0.3972286374133949
1047
+ giraffe_13b_32k_v3,0.3966512702078522
1048
+ llama_2_13b_eli5_wiki_1024_r_64_alpha_16_merged,0.3960739030023095
1049
+ llama_2_13b_platypus,0.394919168591224
1050
+ llama_2_13b_ds_eli5_1024_r_64_alpha_16_merged,0.394919168591224
1051
+ platypus2_22b_relora,0.3943418013856813
1052
+ codellama34b,0.39376443418013857
1053
+ llama_megamerge_dare_13b,0.3931870669745958
1054
+ sailor_7b,0.39260969976905313
1055
+ japanese_stablelm_instruct_gamma_7b,0.3920323325635104
1056
+ wizardmath_13b_v1.0,0.39145496535796764
1057
+ airoboros_2.1_llama_2_13b_qlora,0.39087759815242495
1058
+ tora_13b_v1.0,0.3903002309468822
1059
+ everythinglm_13b_v3_peft,0.38972286374133946
1060
+ llama_2_13b_vicuna_wizard,0.3891454965357968
1061
+ giftedconvo13bloranoeconse4,0.38799076212471134
1062
+ llama2_13b_holomax,0.38799076212471134
1063
+ llama_2_13b_chat,0.3874133949191686
1064
+ airboros2.1_platypus2_13b_qlora_0.80_epoch,0.38683602771362585
1065
+ zysec_8b_v2,0.3856812933025404
1066
+ zysec_7b_v2,0.3856812933025404
1067
+ ypotryll_22b_epoch2_qlora,0.3851039260969977
1068
+ wizardlm_1.0_uncensored_codellama34b,0.384526558891455
1069
+ thetawave_28b_v0.1,0.38394919168591224
1070
+ mistral_trismegistus_7b,0.3833718244803695
1071
+ llama_2_13b_chat_platypus,0.3827944572748268
1072
+ llama_2_13b_ft_instruct_es,0.38221709006928406
1073
+ samantha_nebula_7b,0.3816397228637413
1074
+ open_ko_solar_dpo_merge_v0.1,0.3810623556581986
1075
+ vigogne2_enno_13b_sft_lora_4bit,0.3804849884526559
1076
+ internlm2_base_7b_llama,0.37933025404157045
1077
+ yi6,0.37933025404157045
1078
+ llama_2_26b_trenchcoat_stack,0.3787528868360277
1079
+ neural_phi2,0.378175519630485
1080
+ giraffe_beta_13b_32k,0.37759815242494227
1081
+ tigerbot_13b_base,0.3770207852193995
1082
+ gemma_7b_openhermes,0.37644341801385683
1083
+ olmo_1.7_7b,0.3758660508083141
1084
+ chimera_7b_ties,0.37528868360277134
1085
+ llama_2_13b_german_orpo,0.37471131639722866
1086
+ dolphin_nebula_7b,0.3741339491916859
1087
+ eeve_korean_instruct_2.8b_v1.0,0.37355658198614317
1088
+ openbuddy_gemma_7b_v19.1_4k,0.3729792147806005
1089
+ lima2_13b,0.37240184757505773
1090
+ quyen_v0.1,0.3712471131639723
1091
+ mixtral_6x7b_instruct_v0.1,0.3712471131639723
1092
+ aisquare_instruct_solar_10.7b_v0.5.31,0.37066974595842955
1093
+ deita_2b,0.37009237875288686
1094
+ asclepius_llama2_13b,0.3695150115473441
1095
+ orca_mini_v3_7b,0.3689376443418014
1096
+ huginn_13b_v4,0.3672055427251732
1097
+ huginn_13b_v4.5,0.3672055427251732
1098
+ huginn_v3_13b,0.3672055427251732
1099
+ yousei_22b,0.36605080831408776
1100
+ awanllm_llama3_8b_instruct_dpo_v0.2,0.36605080831408776
1101
+ tulu_2_dpo_7b_expo,0.365473441108545
1102
+ nusantara_7b_indo_chat,0.3648960739030023
1103
+ aisquare_instruct_llama2_koen_13b_v0.9.24,0.3643187066974596
1104
+ deepseek_llm_7b_chat,0.36374133949191684
1105
+ samantha_mistral_instruct_7b,0.36316397228637415
1106
+ llava_v1.5_7b_vicuna,0.3625866050808314
1107
+ blossom_v2_llama2_7b,0.36200923787528866
1108
+ eeve_korean_2.8b_v1.0,0.36143187066974597
1109
+ hope_for,0.3608545034642032
1110
+ starcoder2_15b,0.36027713625866054
1111
+ yehoon_llama2,0.3596997690531178
1112
+ sydney_overthinker_13b_hf,0.35854503464203236
1113
+ chinese_alpaca_2_13b_16k,0.35854503464203236
1114
+ mnsim_dpo_peftmerged_2_eos,0.3579676674364896
1115
+ configurable_mistral_22b,0.35739030023094687
1116
+ orca_open_hermes_llava_v1.5_7b_dpo,0.3568129330254042
1117
+ mm4_3b,0.35623556581986143
1118
+ ghost_7b_alpha,0.3556581986143187
1119
+ airocoder_34b_2.1,0.355080831408776
1120
+ stable_vicuna_13b,0.3539260969976905
1121
+ tamil_llama_13b_instruct_v0.1,0.3539260969976905
1122
+ mc_data_30k_from_platpus_orca_7b_10k_v1_lora_qkvo_rank14_v2,0.3533487297921478
1123
+ platypus2xopenorca_13b_lora_v2,0.3527713625866051
1124
+ geitje_7b_ultra,0.35219399538106233
1125
+ camelidae_8x7b,0.35161662817551964
1126
+ btlm_v1_7b_base_v0.1,0.3510392609699769
1127
+ fietje_2b_chat,0.3504618937644342
1128
+ platypus2_7b,0.34988452655889146
1129
+ huginn_22b_prototype,0.3493071593533487
1130
+ fietje_2b_instruct,0.3481524249422633
1131
+ llama2_13b_chinese_v2,0.3481524249422633
1132
+ losslessmegacoder_llama2_7b_mini,0.34757505773672054
1133
+ hope_for_7b_1.0v,0.34699769053117785
1134
+ alma_13b_r,0.3464203233256351
1135
+ bielik_7b_instruct_v0.1,0.34584295612009236
1136
+ llama2_7b_instruction_lora,0.34526558891454967
1137
+ llongorca_7b_16k,0.3446882217090069
1138
+ fietje_2b,0.3441108545034642
1139
+ code_millenials_34b,0.3435334872979215
1140
+ wizardcoder_python_34b_v1.0,0.34295612009237875
1141
+ new_model_test3,0.342378752886836
1142
+ awanllm_llama3_8b_dolfin_v0.3_dpo,0.3418013856812933
1143
+ geitje_7b_chat_v2,0.34122401847575057
1144
+ llama_2_7b_chat_guanaco_lora,0.3406466512702079
1145
+ llama_2_7b_physics,0.34006928406466513
1146
+ mistral_22b_v0.1,0.3394919168591224
1147
+ llama_2_7b_chat_afr_200step_merged,0.3389145496535797
1148
+ openhermes_7b,0.33833718244803695
1149
+ llama_2_7b_chat_afr_200step_v2,0.3377598152424942
1150
+ llama_2_7b_chat_afr_441step_flan_v2,0.3371824480369515
1151
+ llama_2_7b_chat_afr_300step_flan_v2,0.33602771362586603
1152
+ llama_2_7b_chat_afr_200step_flan_v2,0.33602771362586603
1153
+ hope_for_7b_1.1v,0.33545034642032334
1154
+ llama_2_7b_chat_afr_100step_v2,0.3348729792147806
1155
+ wizardvicuna2_13b,0.33429561200923785
1156
+ llama2_7b_openorca_mc_v1,0.33371824480369516
1157
+ llama_2_7b_chat_afr_100step_flan_v2,0.3331408775981524
1158
+ llama_2_7b_chat_afr_200step_flan,0.3325635103926097
1159
+ llama_2_7b_chat_afr_100step_flan,0.331986143187067
1160
+ llama_2_7b_chat,0.33140877598152424
1161
+ cria_llama2_7b_v1.3,0.33083140877598155
1162
+ openbuddy_zen_3b_v21.2_32k,0.3302540415704388
1163
+ llama_2_7b_chat_10_sparsity,0.32967667436489606
1164
+ llama_2_7b_chat_10_attention_sparsity,0.32909930715935337
1165
+ mpt_30b,0.3285219399538106
1166
+ vicuna_7b_v1.3_attention_sparsity_10,0.3273672055427252
1167
+ fusellm_7b,0.3273672055427252
1168
+ archangel_sft_kto_llama13b,0.32678983833718245
1169
+ starling_7b,0.3262124711316397
1170
+ llama_13b,0.32505773672055427
1171
+ adelie_sft,0.32505773672055427
1172
+ airoboros_l2_7b_2.2.1,0.3244803695150115
1173
+ telugu_llama2_7b_v0_instruct,0.32390300230946883
1174
+ flan_llama_7b_2_llama2_7b_flash_868_full_model,0.3233256351039261
1175
+ llama_2_7b_chat_20_attention_sparsity,0.32274826789838335
1176
+ vicuna_7b_v1.3_attention_sparsity_20,0.32217090069284066
1177
+ mistral_7b_instruct_v0.2_sparsity_20,0.3210161662817552
1178
+ llama_2_7b_chat_20_sparsity,0.3210161662817552
1179
+ llama_2_7b_chat_guanaco,0.3204387990762125
1180
+ llama2_7b_openorca_mc_v2_dpo,0.31986143187066973
1181
+ llama_2_7b_chat_guanaco_freeze_embed_tokens_q_v_proj,0.31928406466512704
1182
+ rocket_3b,0.3187066974595843
1183
+ elyza_japanese_llama_2_7b_instruct,0.31755196304849886
1184
+ llama_2_peanutbutter_v18_b_7b,0.31755196304849886
1185
+ llama_2_7b_chat_30_attention_sparsity,0.3169745958429561
1186
+ llama_2_peanutbutter_v10_7b,0.3163972286374134
1187
+ llama_2_7b_chat_guanaco_freeze_embed_tokens_q_v_proj_lora,0.3158198614318707
1188
+ towerinstruct_7b_v0.1,0.31524249422632794
1189
+ llama_2_7b,0.3146651270207852
1190
+ vicuna_7b_v1.3_attention_sparsity_30,0.3140877598152425
1191
+ helpingai_3b,0.31351039260969976
1192
+ tora_code_34b_v1.0,0.312933025404157
1193
+ qwen1.5_1.8b,0.3123556581986143
1194
+ llama_2_7b_guanaco_instruct_sharded,0.3117782909930716
1195
+ chinese_alpaca_2_7b,0.3112009237875289
1196
+ mistral_7b_instruct_v0.2_sparsity_30,0.31062355658198615
1197
+ cria_llama2_7b_v1.3_peft,0.3100461893764434
1198
+ qwen_1_8b_llamafied,0.3094688221709007
1199
+ deepseek_moe_16b_base,0.30889145496535797
1200
+ chinese_alpaca_2_7b_rlhf,0.3083140877598152
1201
+ stablelm_zephyr_3b,0.30773672055427254
1202
+ odia_llama2_7b_base,0.3071593533487298
1203
+ youri_7b_chat,0.30658198614318705
1204
+ llama_2_7b_chat_flan2022_1.2m,0.30600461893764436
1205
+ llama_2_7b_eli5_cleaned_1024_qlora_merged,0.30484988452655887
1206
+ tora_7b_v1.0,0.30484988452655887
1207
+ qwen1.5_1.8b_chat,0.3042725173210162
1208
+ openhermes_qwen1.5_1.8b,0.30369515011547343
1209
+ mhm_7b_v1.3_dpo_1,0.3031177829099307
1210
+ mhm_7b_v1.3,0.302540415704388
1211
+ llama_2_7b_eli5_cleaned_wiki65k_1024_qlora_merged,0.30196304849884525
1212
+ deita_qwen_1_8b,0.3008083140877598
1213
+ deita_1_8b,0.3008083140877598
1214
+ leo_hessianai_7b_chat,0.3002309468822171
1215
+ llama_2_7b_chat_30_sparsity,0.2996535796766744
1216
+ llama_2_peanutbutter_v18_a_7b,0.29907621247113164
1217
+ llama_2_7b_32k_instruct,0.2984988452655889
1218
+ quan_1.8b_base,0.29734411085450346
1219
+ llama_7b_sft_qlora_eli5_wiki_dpo_ds_rm_top_2_1024_r_64_alpha_16,0.29734411085450346
1220
+ llama_7b_sft_ds_wiki65k_1024_r_64_alpha_16_merged,0.2967667436489607
1221
+ orca_2.0_tau_1.8b,0.29618937644341803
1222
+ stablelm_3b_4e1t,0.2956120092378753
1223
+ stablelm_base_alpha_7b_v2,0.29503464203233254
1224
+ neuralreyna_mini_1.8b_v0.2,0.29445727482678985
1225
+ qwen_1_8b_everythinglm,0.2938799076212471
1226
+ hercules_mini_1.8b,0.29330254041570436
1227
+ leo_hessianai_7b_chat_bilingual,0.29272517321016167
1228
+ qwen_1_8b_chat_llama,0.2921478060046189
1229
+ truthfulqwen1.5_1.8b,0.29157043879907624
1230
+ llama_v2_7b_32kc_security,0.2909930715935335
1231
+ openllama_7b_icl,0.29041570438799075
1232
+ palmyra_med_20b,0.28983833718244806
1233
+ neuralreyna_mini_1.8b_v0.3,0.2892609699769053
1234
+ llama_2_7b_alpaca_gpt4,0.28868360277136257
1235
+ quan_1.8b_chat,0.2881062355658199
1236
+ everyone_coder_33b_base,0.28752886836027713
1237
+ llama_2_7b_gptq,0.2869515011547344
1238
+ sailor_4b_chat,0.2863741339491917
1239
+ sambalingo_thai_chat,0.28579676674364896
1240
+ quyen_mini_v0.1,0.2852193995381062
1241
+ phi_1_5,0.2846420323325635
1242
+ open_llama_13b,0.2840646651270208
1243
+ galpaca_30b_miniorca,0.2834872979214781
1244
+ asclepius_llama2_7b,0.2823325635103926
1245
+ kollama2_7b_v2,0.2823325635103926
1246
+ llama_2_7b_open_platypus,0.2817551963048499
1247
+ speechless_codellama_orca_13b,0.28117782909930716
1248
+ minimerlin_3b_v0.1,0.2806004618937644
1249
+ gemma_2b_zephyr_dpo,0.28002309468822173
1250
+ lima2_7b,0.279445727482679
1251
+ zephyr_phi_1_5_sft_qlora,0.27886836027713624
1252
+ fialka_7b_v3,0.2777136258660508
1253
+ smartqwen1.5_1.8b_orpo_v1,0.2777136258660508
1254
+ mistral_megamerge_dare_7b,0.27713625866050806
1255
+ neural_chat_mini_v2.2_1.8b,0.27655889145496537
1256
+ gowizardlm,0.2759815242494226
1257
+ chinese_alpaca_2_7b_16k,0.2754041570438799
1258
+ openllama_7b_base,0.27424942263279445
1259
+ speechless_codellama_platypus_13b,0.27424942263279445
1260
+ phi_openllm_lb_test,0.273094688221709
1261
+ mpt_7b_8k,0.273094688221709
1262
+ llama_2_7b_flan2022_1.2m,0.27251732101616627
1263
+ mpt_7b_8k_instruct,0.2719399538106236
1264
+ stablelm_2_zephyr_1_6b,0.27136258660508084
1265
+ zephyr_2b_gemma_sft_qlora,0.2707852193995381
1266
+ v1,0.2702078521939954
1267
+ remask_3b,0.26963048498845266
1268
+ gemma_2b,0.2690531177829099
1269
+ stablelm_2_1_6b_chat,0.2684757505773672
1270
+ open_llama_7b_v2,0.2678983833718245
1271
+ starcoder2_7b,0.26732101616628173
1272
+ openhermes_phi_1_5_sft_qlora,0.26674364896073904
1273
+ recurrentgemma_2b_it,0.2661662817551963
1274
+ gaja_v1.00,0.26558891454965355
1275
+ gaja_v2.00_dpo,0.26501154734411086
1276
+ samantha_1.11_7b,0.2644341801385681
1277
+ zephyr_danube2_sft_qlora,0.2632794457274827
1278
+ openhermes_danube2_sft_qlora,0.2632794457274827
1279
+ openthaigpt_1.0.0_alpha_7b_chat_ckpt,0.26270207852193994
1280
+ phi_1_5_chat_32k,0.26212471131639725
1281
+ calm2_7b_chat_dpo_experimental,0.2615473441108545
1282
+ codellama34b_instruct_fp16,0.2603926096997691
1283
+ codellama34b_instruct,0.2603926096997691
1284
+ open_llama3b_v2_instruct,0.25981524249422633
1285
+ openhermes_2b_gemma_sft_qlora,0.2592378752886836
1286
+ ex_llm_e1,0.2586605080831409
1287
+ deita_500m,0.25808314087759815
1288
+ calm2_7b_chat,0.2575057736720554
1289
+ qwen1.5_0.5b,0.2569284064665127
1290
+ nxcode_cq_7b_orpo,0.25635103926096997
1291
+ deepseek_coder_6.7b_instruct,0.2557736720554272
1292
+ sailor_4b,0.25519630484988454
1293
+ stablelm_2_1_6b,0.2546189376443418
1294
+ codellama_13b_instruct,0.2540415704387991
1295
+ codellama_13b_instruct_fp16,0.25346420323325636
1296
+ wizardcoder_python_13b_lora,0.2528868360277136
1297
+ starcoder2_3b,0.2523094688221709
1298
+ sappha_2b_v3,0.2517321016166282
1299
+ coven_tiny_1.1b_32k_orpo_alpha,0.25115473441108543
1300
+ gemma_2b_orpo,0.25057736720554274
1301
+ nusantara_4b_indo_chat,0.24942263279445728
1302
+ deepseek_coder_6.7b_base,0.24942263279445728
1303
+ sailor_1.8b_chat,0.24884526558891454
1304
+ gemma_2b_tamil,0.24826789838337182
1305
+ neurona_2b,0.2476905311778291
1306
+ h2o_danube2_1.8b_chat,0.2471131639722864
1307
+ gemma_2b_nlaf_v0,0.24653579676674364
1308
+ phi_gemma_nlaf_v0,0.24595842956120093
1309
+ gemma_2b_it_nlai_p1,0.2453810623556582
1310
+ gemma_2b_it_sp_test,0.24307159353348728
1311
+ gemma_2b_it_sp_test1,0.24307159353348728
1312
+ openhermes_gemma_2b,0.24307159353348728
1313
+ gemma_2b_it_sp_test_openherms_step500,0.24307159353348728
1314
+ gemma_nlaf_v1,0.24249422632794457
1315
+ gemma_2b_openhermes,0.24191685912240185
1316
+ phi_gemma_nlaf_v1,0.2407621247113164
1317
+ gemma_2b_it_nlai_v0,0.2407621247113164
1318
+ baize_healthcare_lora_7b,0.24018475750577367
1319
+ tora_code_13b_v1.0,0.23960739030023095
1320
+ cross_lingual_epoch2,0.2390300230946882
1321
+ llama_7b,0.2384526558891455
1322
+ llama_base_7b,0.23787528868360278
1323
+ gzdx_1.1b,0.23729792147806006
1324
+ codellama_13b_oasst_sft_v10,0.23672055427251731
1325
+ palmyra_20b_chat,0.2361431870669746
1326
+ gpt_sw3_40b,0.23556581986143188
1327
+ codellama34b_python,0.23498845265588914
1328
+ recurrentgemma_2b,0.23441108545034642
1329
+ codellama_7b_instruct,0.2338337182448037
1330
+ deacon_1_8b,0.23325635103926096
1331
+ tau_0.5b_instruct_dpop,0.23267898383371824
1332
+ qwen1.5_0.5b_chat,0.23210161662817552
1333
+ qwen_orpo_v1,0.2315242494226328
1334
+ test_qwen1.5_0.5b,0.23094688221709006
1335
+ dpo_qwen1.5_0.5b_chat_alignment_handbook,0.23036951501154734
1336
+ h2o_danube_1.8b_chat,0.22979214780600463
1337
+ ultra0,0.22921478060046188
1338
+ tora_code_7b_v1.0,0.22863741339491916
1339
+ platypus_1_8b,0.22806004618937645
1340
+ codellama34b_python_fp16,0.22748267898383373
1341
+ codellama_13b,0.22690531177829099
1342
+ poro_34b_gptq,0.22632794457274827
1343
+ codegen_16b_nl,0.22575057736720555
1344
+ starcoderbase,0.2251732101616628
1345
+ gemma_2b_sft_telugu,0.2245958429561201
1346
+ mc_model_v1,0.22401847575057737
1347
+ gpt_sw3_6.7b_v2_instruct,0.22344110854503466
1348
+ gpt_sw3_20b_instruct,0.2228637413394919
1349
+ quark_464m_v0.2,0.2222863741339492
1350
+ cypher_mini_1.8b,0.22170900692840648
1351
+ codellama_7b,0.22113163972286373
1352
+ dpo_qlora_qwen1.5_0.5b_chat_xtuner,0.22055427251732102
1353
+ bloom,0.2199769053117783
1354
+ mpt_7b,0.21939953810623555
1355
+ dpo_qwen1.5_0.5b_chat,0.21882217090069284
1356
+ open_llama_7b,0.21824480369515012
1357
+ sailor_1.8b,0.2176674364896074
1358
+ nusantara_1.8b_indo_chat,0.21709006928406466
1359
+ nucleus_22b_token_500b,0.21651270207852194
1360
+ gpt_sw3_6.7b_v2,0.21593533487297922
1361
+ tinyllama_moe_chat,0.21535796766743648
1362
+ falcon_7b_3epoch_norobots,0.21478060046189376
1363
+ starcoder,0.21420323325635104
1364
+ gollie_7b,0.21362586605080833
1365
+ tinyllama_moe_chat_0.1,0.21304849884526558
1366
+ llamacorn_1.1b_chat,0.21247113163972287
1367
+ falcon_rw_1b_instruct_openorca,0.21189376443418015
1368
+ open_llama3b_v2_chat,0.2113163972286374
1369
+ minima_3b,0.2107390300230947
1370
+ palmyra_large,0.21016166281755197
1371
+ gpt_sw3_20b,0.2090069284064665
1372
+ deepseek_coder_1.3b_instruct,0.2090069284064665
1373
+ openbezoar_sft,0.2084295612009238
1374
+ starcoderbase_7b,0.20785219399538107
1375
+ codellama_7b_python,0.20727482678983833
1376
+ instructpalmyra_20b,0.2066974595842956
1377
+ tinyllama_1.1b_slimorca_function_calling_3t,0.2061200923787529
1378
+ olmo_7b,0.20554272517321015
1379
+ shearedplats_2.7b_v2_instruct_v0.1,0.20496535796766743
1380
+ falcon_7b_norobots,0.20438799076212472
1381
+ open_llama3b_code_instruct_0.1,0.203810623556582
1382
+ falcon_7b,0.20265588914549654
1383
+ xglm_7.5b,0.20265588914549654
1384
+ dociprollm_7b,0.20207852193995382
1385
+ redpajama_incite_7b_base,0.20092378752886836
1386
+ redpajama_incite_base_7b_v0.1,0.20092378752886836
1387
+ openhermes_tinyllama_sft_qlora,0.20034642032332564
1388
+ shearedplats_2.7b_v2,0.1997690531177829
1389
+ walter_llama_1b,0.19919168591224018
1390
+ starcoderbase_3b,0.19861431870669746
1391
+ dolphin_2.6_mistral_7b_dpo_5.93b,0.19803695150115475
1392
+ mt7bi_wizard_3_alpha_dpo,0.197459584295612
1393
+ zephyr_1b_olmo_sft_qlora,0.19688221709006928
1394
+ aira_2_355m,0.19630484988452657
1395
+ wizardvicuna_open_llama3b_v2,0.1951501154734411
1396
+ codellama_13b_python,0.1951501154734411
1397
+ palmyra_base,0.1945727482678984
1398
+ deacon_3b,0.19341801385681293
1399
+ test_22b,0.19341801385681293
1400
+ openllama3b_evolinstruct_lora_merged,0.1922632794457275
1401
+ open_llama3b_v2,0.1922632794457275
1402
+ rho_math_1b_v0.1,0.19168591224018475
1403
+ redpajama_incite_base_3b_v1,0.19110854503464203
1404
+ hf_checkpoint2_01052024,0.18995381062355657
1405
+ numfalm_3b,0.18995381062355657
1406
+ lamini_neo_1.3b_mental_health_lora,0.18879907621247113
1407
+ zephyr_danube_sft_qlora,0.18879907621247113
1408
+ opt_66b,0.18822170900692842
1409
+ mptk_1b,0.18764434180138567
1410
+ open_llama3b,0.18706697459584296
1411
+ gpt2_platypus_camel_physics,0.18533487297921478
1412
+ openbezoar_hh_rlhf_dpo,0.18533487297921478
1413
+ gpt2_camel_physics_platypus,0.18533487297921478
1414
+ nusantara_0.8b_indo_chat,0.18475750577367206
1415
+ tinyllama_1.1b_intermediate_step_1431k_3t_laser_dpo,0.18418013856812934
1416
+ bloom_1b1_rlhf,0.1836027713625866
1417
+ stellarx_4b_v0,0.18244803695150116
1418
+ csg_wukong_1b_chat_v0.1,0.18244803695150116
1419
+ amber,0.1812933025404157
1420
+ minueza_32m_deita,0.1812933025404157
1421
+ cerebras_gpt_256m,0.18071593533487298
1422
+ mistral_7b_dpo_open_orca_flan_50k_synthetic_5_models,0.18013856812933027
1423
+ gemma_ko_1.1_2b_it,0.1784064665127021
1424
+ gpt_2_xl_camel_ai_physics,0.1784064665127021
1425
+ tiny_starcoder_py,0.1784064665127021
1426
+ pythia_2.8b_deduped,0.1766743648960739
1427
+ gpt_j_6b,0.1766743648960739
1428
+ tinyllama_1.1b_step_50k_105b,0.1766743648960739
1429
+ pythia_12b,0.17609699769053117
1430
+ sailor_0.5b_chat,0.17551963048498845
1431
+ orca_2_7b_f16,0.17494226327944573
1432
+ cosmo_1b,0.17436489607390301
1433
+ starcoderbase_1b,0.17378752886836027
1434
+ weblab_10b_instruction_sft,0.17263279445727484
1435
+ opt_30b,0.17263279445727484
1436
+ sheared_pythia_160m,0.17147806004618937
1437
+ flor_1.3b_xat,0.17147806004618937
1438
+ black_goo_recipe_d,0.17032332563510394
1439
+ polyglot_ko_12.8b,0.17032332563510394
1440
+ cerebras_gpt_1.3b,0.1697459584295612
1441
+ black_goo_recipe_c,0.16916859122401848
1442
+ pythia_1.3b,0.16859122401847576
1443
+ gpt2_xl,0.16801385681293302
1444
+ 7b_redpajama_conditional_alpha,0.16685912240184758
1445
+ chinese_alpaca_2_1.3b_rlhf,0.16685912240184758
1446
+ tinyllama,0.16628175519630484
1447
+ pythia_6.9b_deduped,0.16570438799076212
1448
+ tinyopenhermes_1.1b_4k,0.16397228637413394
1449
+ gpt_neo_2.7b,0.16397228637413394
1450
+ zephyr_220m_sft_full,0.16397228637413394
1451
+ llongma_3b_lima,0.1628175519630485
1452
+ zephyr_220m_dpo_full,0.1628175519630485
1453
+ gpt2_chatbot,0.16224018475750576
1454
+ gpt2_guanaco_dolly_platypus,0.16166281755196305
1455
+ flyingllama_v2,0.16108545034642033
1456
+ fialka_13b_v3,0.1605080831408776
1457
+ gpt2_large_conversational,0.15993071593533487
1458
+ olmo_1b,0.15935334872979215
1459
+ weblab_10b,0.15877598152424943
1460
+ tinyllama_1.1b_intermediate_step_240k_503b,0.1581986143187067
1461
+ bloom_7b1,0.15762124711316397
1462
+ tinywand_dpo,0.1564665127020785
1463
+ fbopt_350m_8bit,0.1564665127020785
1464
+ stablelm_base_alpha_7b,0.1558891454965358
1465
+ gpt2_open_platypus,0.15531177829099307
1466
+ smol_llama_220m_openhermes,0.1535796766743649
1467
+ llama2_xs_460m_experimental,0.1535796766743649
1468
+ gpt_sw3_1.3b_instruct,0.1535796766743649
1469
+ gpt2_platypus_dolly_guanaco,0.15242494226327943
1470
+ knowledgeninja_litellama_460mx6moe_1t,0.15242494226327943
1471
+ aeonium_v1_baseweb_1b,0.15184757505773672
1472
+ gpt_sw3_1.3b,0.15069284064665128
1473
+ llama_160m_chat_v1,0.15069284064665128
1474
+ tinyllama_1.1b_chat_v0.3_platypus,0.15011547344110854
1475
+ rwkv_4_14b_pile,0.1489607390300231
1476
+ evaloric_1.1b_test,0.1489607390300231
1477
+ smol_llama_220m_open_instruct,0.14780600461893764
1478
+ tinyllama_frankenmerge,0.14780600461893764
1479
+ mixtral_gqa_400m_v2,0.14665127020785218
1480
+ redpajama_incite_chat_3b_v1_rl_lora_8bit_test1,0.14665127020785218
1481
+ minueza_32m_ultrachat,0.14607390300230946
1482
+ gpt2_large,0.14491916859122403
1483
+ minueza_32mx2_chat,0.14491916859122403
1484
+ tinymistral_248m_sft_v4,0.14376443418013857
1485
+ tinyllama_1.1b_intermediate_step_1431k_3t,0.14376443418013857
1486
+ opt_350m,0.1420323325635104
1487
+ opt_125m,0.1420323325635104
1488
+ healix_3b,0.1420323325635104
1489
+ gpt_sw3_6.7b,0.14145496535796767
1490
+ pythia_410m_deduped,0.14087759815242495
1491
+ tinywand_sft,0.1403002309468822
1492
+ gpt_neo_125m,0.1397228637413395
1493
+ litellama_460m_1t,0.13856812933025403
1494
+ rwkv_raven_1b5,0.13856812933025403
1495
+ h2o_danube_1.8b_base,0.1379907621247113
1496
+ codegen_6b_nl,0.13568129330254042
1497
+ tinydolphin_2.8.2_1.1b_laser,0.13568129330254042
1498
+ gpt_sw3_356m,0.13568129330254042
1499
+ cerebras_gpt_6.7b,0.13568129330254042
1500
+ cerebras_gpt_13b,0.1351039260969977
1501
+ pythia_70m,0.13452655889145496
1502
+ test_model,0.13279445727482678
1503
+ smol_llama_4x220m_moe,0.13279445727482678
1504
+ chinese_alpaca_2_1.3b,0.13279445727482678
1505
+ pythia_2.7b,0.13163972286374134
1506
+ gpt2_test,0.13163972286374134
1507
+ zephyr_tinyllama_sft_qlora,0.13048498845265588
1508
+ smol_llama_220m_gqa,0.13048498845265588
1509
+ falcon_7b_instruct,0.12990762124711316
1510
+ algae_550m_base,0.1287528868360277
1511
+ gpt2,0.1287528868360277
1512
+ tinynaughtyllama_v1.0,0.12759815242494227
1513
+ gpt_2_slimorcadeduped_airoboros_3.1_metamathqa_sft_124m,0.12759815242494227
1514
+ gpt2_dolly,0.12702078521939955
1515
+ pythia_1.4b,0.1264434180138568
1516
+ zephyr_tiny_dpo_qlora,0.1258660508083141
1517
+ tinyllama_chat_sft,0.12471131639722864
1518
+ rwkv_4_1b5_pile,0.12471131639722864
1519
+ numfa_v2_1b,0.12240184757505773
1520
+ phind_codellama34b_v2,0.12240184757505773
1521
+ gptneo350m_instruct_sft,0.12240184757505773
1522
+ numfalm_v2_1b,0.12240184757505773
1523
+ minueza_32m_chat,0.12124711316397228
1524
+ black_goo_recipe_a,0.12124711316397228
1525
+ csg_wukong_1b_orpo_bf16,0.12066974595842957
1526
+ mistral_3_from_mixtral_8x7b_v0.1,0.1195150115473441
1527
+ tinyllama_1.1b_1.5t_openorca_alpha,0.1195150115473441
1528
+ croissantllmbase,0.11893764434180139
1529
+ codegen_6b_multi,0.11836027713625866
1530
+ mixnueza_6x32m_moe,0.11778290993071594
1531
+ shearedllama_1.3b_fft_test1,0.11662817551963048
1532
+ minillama_1.8b_chat_v0.1,0.11662817551963048
1533
+ tmm_1b,0.11547344110854503
1534
+ black_goo_recipe_b,0.11547344110854503
1535
+ openhermes_1b_olmo_sft_qlora,0.11489607390300231
1536
+ boomer_1b,0.11374133949191687
1537
+ ablation_model_fineweb_v1,0.11374133949191687
1538
+ init_model,0.11316397228637413
1539
+ pythia_12b_deduped,0.1125866050808314
1540
+ sailor_0.5b,0.11200923787528869
1541
+ tinydolphin_2.8_1.1b,0.11143187066974596
1542
+ pythia_1.4b_deduped,0.11085450346420324
1543
+ stellarx_4b_v0.2,0.10912240184757506
1544
+ megachat,0.10912240184757506
1545
+ codeparrot,0.10912240184757506
1546
+ microscopic_mistral_87k_steps,0.10854503464203233
1547
+ tinyllama_1.1b_layla_v4,0.10739030023094688
1548
+ gpt_sw3_356m_instruct,0.10739030023094688
1549
+ gpt_2_large_115k_steps,0.10623556581986143
1550
+ phigrange_dpo,0.10623556581986143
1551
+ cerebras_gpt_111m,0.10508083140877598
1552
+ 42dot_llm_sft_1.3b,0.10508083140877598
1553
+ mindllm,0.10450346420323325
1554
+ tiny_vicuna_1b,0.1033487297921478
1555
+ mistral_6_from_mixtral_8x7b_v0.1,0.1033487297921478
1556
+ speechless_codellama_orca_airoboros_13b_0.10e,0.10046189376443418
1557
+ opt_2.7b,0.10046189376443418
1558
+ stablelm_base_alpha_3b,0.10046189376443418
1559
+ xglm_4.5b,0.10046189376443418
1560
+ gpt2_xl_lima,0.10046189376443418
1561
+ 3b_redpajama_conditional_alpha,0.09930715935334873
1562
+ tinyultra_4x1.1b_base_alpha,0.09930715935334873
1563
+ fialka_13b_v3.1,0.098729792147806
1564
+ internlm_20b_llamafied,0.09757505773672055
1565
+ dopeyshearedplats_1.3b_v1,0.09757505773672055
1566
+ bilingual_gpt_neox_4b_8k,0.09699769053117784
1567
+ nanollama_gqa_l10_a32_kv8_v13_ki,0.09584295612009237
1568
+ babyllama_v0.6,0.09584295612009237
1569
+ speechless_codellama_orca_platypus_13b_0.10e,0.09468822170900693
1570
+ evaloric_1.1b,0.09468822170900693
1571
+ open_llama3b_instruct_v_0.2,0.09353348729792148
1572
+ nano_phi_115m_v0.1,0.09353348729792148
1573
+ csg_wukong_1b,0.0918013856812933
1574
+ llama3,0.0918013856812933
1575
+ 774m_03_09_2024,0.0918013856812933
1576
+ smartyplats_3b_v1,0.09006928406466513
1577
+ tinyllama_1.1b_1t_openorca,0.09006928406466513
1578
+ tinydolphin_2.8.1_1.1b,0.09006928406466513
1579
+ mistral_8_from_mixtral_8x7b_v0.1,0.0894919168591224
1580
+ verysmol_llama_v11_kix2,0.08775981524249422
1581
+ falcon_rw_1b,0.08775981524249422
1582
+ mixsmol_4x400m_v0.1_epoch1,0.08775981524249422
1583
+ mixsmol_4x400m_v0.1_epoch2,0.08602771362586605
1584
+ pythia_70m_deduped,0.08602771362586605
1585
+ falcon_1b_t_sft,0.08602771362586605
1586
+ pile_7b_250b_tokens,0.08545034642032333
1587
+ open_calm_large,0.0848729792147806
1588
+ gzdx,0.08429561200923788
1589
+ llama_68m_chat_v1,0.08140877598152425
1590
+ xglm_564m,0.08140877598152425
1591
+ tinymistral_248m_instruct,0.08140877598152425
1592
+ tinyllama_1.1b_orca_v1.0,0.08140877598152425
1593
+ zephyr_smol_llama_100m_dpo_full,0.08140877598152425
1594
+ mgpt,0.0802540415704388
1595
+ cerebras_gpt_2.7b,0.0802540415704388
1596
+ nano_mistral,0.07967667436489607
1597
+ opt_flan_iml_6.7b,0.07852193995381063
1598
+ mistral_7_from_mixtral_8x7b_v0.1,0.07852193995381063
1599
+ aira_2_774m,0.07736720554272518
1600
+ mistral_5_from_mixtral_8x7b_v0.1,0.07736720554272518
1601
+ vortex_3b_v2,0.07621247113163972
1602
+ fialka_13b_v4,0.07621247113163972
1603
+ model_a_48.5m,0.07505773672055427
1604
+ openhermes_danube_sft_qlora,0.07505773672055427
1605
+ smolllamix_8x101m_take2,0.07448036951501155
1606
+ tinyllama_1.1b_chat_v1.0_intel_dpo,0.07390300230946882
1607
+ nanofialka_v1,0.07332563510392609
1608
+ gpt_neox_20b,0.07217090069284064
1609
+ tinyllama_1.1b_intermediate_step_480k_1t,0.07217090069284064
1610
+ merge_dolly_v2_3b_dpo_test,0.06986143187066975
1611
+ pythia_31m_simplepile_lite_2048_scratch_2e,0.06986143187066975
1612
+ tinystories_3m,0.06986143187066975
1613
+ bulgakovlm_3b,0.06986143187066975
1614
+ pythia_31m,0.0687066974595843
1615
+ gpt_bigcode_santacoder,0.0687066974595843
1616
+ rwkv_4_7b_pile,0.06812933025404157
1617
+ pythia_160m,0.06755196304849885
1618
+ smol_llama_101m_chat_v1,0.06697459584295612
1619
+ idus,0.06639722863741339
1620
+ opt_13b,0.06581986143187067
1621
+ deacon_1b,0.06466512702078522
1622
+ koalpaca_korwkv_6b,0.06466512702078522
1623
+ rwkv_raven_3b,0.06408775981524249
1624
+ pythia_160m_deduped,0.06293302540415704
1625
+ aira_2_1b1,0.06293302540415704
1626
+ rwkv_4_430m_pile,0.06235565819861432
1627
+ mistral_4_from_mixtral_8x7b_v0.1,0.061200923787528866
1628
+ nusantara_2.7b_indo_chat,0.061200923787528866
1629
+ gpt_neo_1.3b,0.06062355658198614
1630
+ csg_wukong_1b_sft_bf16,0.06004618937644342
1631
+ crow_1b,0.05889145496535797
1632
+ minueza_32m_base,0.05889145496535797
1633
+ gpt2_final,0.057736720554272515
1634
+ dpo_miniguanaco_1.5t,0.057736720554272515
1635
+ shearedplats_1.3b_v1,0.05715935334872979
1636
+ puli_gptrio,0.05658198614318707
1637
+ csg_wukong_1b_sft_dpo_bf16,0.05600461893764434
1638
+ smolllamix_8x101m,0.05484988452655889
1639
+ korwkv_6b,0.05484988452655889
1640
+ mpt_125m_c4,0.054272517321016164
1641
+ rwkv_4_3b_pile,0.05369515011547344
1642
+ llama_pile_350b,0.05254041570438799
1643
+ mistral_1_from_mixtral_8x7b_v0.1,0.05254041570438799
1644
+ pythia_6.7b,0.05138568129330254
1645
+ healix_1.1b_v1_chat_ddpo,0.05138568129330254
1646
+ zyte_1b,0.050808314087759814
1647
+ llama3_orpo_v1_merged_16bit,0.05023094688221709
1648
+ walter_falcon_1b,0.049653579676674366
1649
+ opt_6.7b,0.04849884526558892
1650
+ tinystories_1m,0.04849884526558892
1651
+ pythia_31m_chat_v1,0.04734411085450346
1652
+ dopeyplats_1.1b_2t_v1,0.04734411085450346
1653
+ croissantcool_v0.2,0.04676674364896074
1654
+ gpt_sw3_126m,0.046189376443418015
1655
+ falcon_rw_1b_chat,0.04503464203233257
1656
+ tiny_llama3_7b,0.04503464203233257
1657
+ gpt3_finnish_small,0.044457274826789836
1658
+ pythia_1b_spin_iter1,0.04387990762124711
1659
+ tinymistral_248m_sft_v3,0.04330254041570439
1660
+ decicoder_1b,0.042725173210161664
1661
+ megatron_gpt2_345m,0.04157043879907621
1662
+ smartyplats_3b_v2,0.04157043879907621
1663
+ llama39m,0.040993071593533485
1664
+ tinymix,0.03983833718244804
1665
+ pythia_1b_deduped,0.03983833718244804
1666
+ llama_160m,0.03926096997690531
1667
+ pythia_1b_dpo,0.03810623556581986
1668
+ smol_llama_101m_gqa,0.03810623556581986
1669
+ dpo_test_hermes_open_llama3b,0.037528868360277134
1670
+ mistral_2_from_mixtral_8x7b_v0.1,0.036374133949191687
1671
+ cutie,0.036374133949191687
1672
+ numfa_3b_1epoch,0.03521939953810624
1673
+ gpt_2_large_40k_steps,0.03521939953810624
1674
+ pythia_1b_dpo_full,0.034064665127020784
1675
+ tinymistral_6x248m_instruct,0.034064665127020784
1676
+ gpt3_finnish_large,0.03348729792147806
1677
+ smol_llama_81m_tied,0.032909930715935336
1678
+ gpt_2_large_43k_steps,0.03233256351039261
1679
+ bloom_560m_rlhf_v2,0.03175519630484989
1680
+ tinymistral_248m_v2.5_instruct,0.03117782909930716
1681
+ gpt_2_large_51k_steps,0.03002309468822171
1682
+ gpt_2_large_20k_steps,0.03002309468822171
1683
+ tinystories_33m,0.029445727482678985
1684
+ taketwo,0.028868360277136258
1685
+ gpt_sw3_126m_instruct,0.028290993071593534
1686
+ gpt_2_large_32k_steps,0.02771362586605081
1687
+ helpingai_110m,0.027136258660508082
1688
+ rwkv_raven_7b,0.026558891454965358
1689
+ bloom_560m_rlhf,0.025981524249422634
1690
+ megatron_gpt2_345m_evol_instruct_v2,0.025404157043879907
1691
+ ko_wand_136m,0.024826789838337183
1692
+ tinystories_28m,0.02367205542725173
1693
+ tinymistral_v2.5_minipile_guidelines_e1,0.02367205542725173
1694
+ tinymistral_248m_chat_v2,0.023094688221709007
1695
+ gpt3_finnish_13b,0.022517321016166283
1696
+ tinymistral_248m_v2,0.021939953810623556
1697
+ tinymistral_v2_test1,0.021362586605080832
1698
+ tinystories_8m,0.02020785219399538
1699
+ llama_2_3b,0.02020785219399538
1700
+ rwkv_4_169m_pile,0.019630484988452657
1701
+ llama2_13b_platypus_ckpt_1000,0.01905311778290993
1702
+ facebook_opt_125m_qcqa_ub_6_best_for_q_loss,0.01674364896073903
1703
+ facebook_opt_6.7b_qcqa_ub_16_best_for_q_loss,0.01674364896073903
1704
+ tinymistral_248m,0.01674364896073903
1705
+ tinymistral_248m_v2.5,0.01674364896073903
1706
+ dough_instruct_base_001,0.016166281755196306
1707
+ llm_jp_13b_instruct_full_jaster_v1.0,0.002886836027713626
1708
+ griffin_c3t_8l_v0.02_fineweb,0.002886836027713626
1709
+ mistral_7b_v0.1_signtensors_1_over_4,0.002886836027713626
1710
+ llm_jp_13b_instruct_full_jaster_dolly_oasst_v1.0,0.002886836027713626
1711
+ japanese_gpt_neox_3.6b,0.002886836027713626
1712
+ mistral7b_test001,0.002886836027713626
1713
+ griffin_llama3t_8l_v0.02_fineweb,0.002886836027713626
1714
+ pythia_31m_ki_v1_2048_scratch,0.002886836027713626
1715
+ opt_125m_gqa_ub_6_best_for_kv_cache,0.002886836027713626
1716
+ facebook_opt_6.7b_qcqa_ub_16_best_for_kv_cache,0.002886836027713626
1717
+ bilingual_gpt_neox_4b_instruction_ppo,0.002886836027713626
1718
+ bilingual_gpt_neox_4b_instruction_sft,0.002886836027713626
1719
+ wizardlm_30b_v1.0,0.002886836027713626
1720
+ telugu_llama_7b_instruct_v0.1,0.002886836027713626
1721
+ tamil_llama_7b_instruct_v0.2,0.002886836027713626
1722
+ changpt_bart,0.002886836027713626
1723
+ shisa_base_7b_v1,0.002886836027713626
1724
+ malayalam_llama_7b_instruct_v0.1,0.002886836027713626
1725
+ experiment_dpo_m7b2_3_merged,0.002886836027713626
1726
+ facebook_opt_125m_qcqa_ub_6_best_for_kv_cache,0.002886836027713626
1727
+ pythia_31m_simplewiki_scratch_bf16,0.002886836027713626
1728
+ pythia_31m_simplewiki_2048,0.002886836027713626
1729
+ facebook_opt_6.7b_gqa_ub_16_best_for_kv_cache,0.002886836027713626
1730
+ pythia_31m_goodwiki_deduped_2048_scratch,0.0023094688221709007
1731
+ bilingual_gpt_neox_4b,0.0017321016166281756
1732
+ tinymistral_248m_chat_v1,0.0005773672055427252
1733
+ momomerge_72b_v0.1,0.0005773672055427252
1734
+ sf_72b_v1,0.0
cache/agreements_cache_1edd56d721757789836f081c38c15400.csv ADDED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_230b5a189df3af8cde801ce251b7b2ef.csv ADDED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_2d8c9f9c6d96807c68a9475184afcecb.csv ADDED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_7b814a45375ad6b75add8b396f69c2cd.csv DELETED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_9c0710fd06d230cc89e0f2f023e3058f.csv ADDED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_bdd8d629730630ed8e73cb56f53f335b.csv DELETED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_bffcfd24eb4a8fe1f6c8ac8a0c8c21d6.csv ADDED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_f97e563eeda8c9bdc279f5b94b32606c.csv ADDED
The diff for this file is too large to render. See raw diff