Yotam-Perlitz commited on
Commit
566ad63
1 Parent(s): a50f807

remove cache

Browse files

Signed-off-by: Yotam-Perlitz <[email protected]>

cache/aggregate_scoress_cache_1edd56d721757789836f081c38c15400.csv DELETED
@@ -1,83 +0,0 @@
1
- model,score
2
- arx_0.3,1.0
3
- claude_3.5_sonnet,0.9876543209876543
4
- grok_2,0.9753086419753086
5
- gpt_4o_2024_05_13,0.9629629629629629
6
- grok_2_mini,0.9506172839506173
7
- gemini_1.5_pro,0.9382716049382716
8
- claude_3_opus,0.9259259259259259
9
- qwen2_72b_chat,0.9135802469135802
10
- magnum_72b_v1,0.9012345679012346
11
- gpt_4_turbo,0.8888888888888888
12
- deepseek_coder_v2_instruct,0.8765432098765432
13
- higgs_llama3_70b,0.8641975308641975
14
- gpt_4o_mini,0.8518518518518519
15
- llama3.1_70b_instruct,0.8395061728395061
16
- gemini_1.5_flash,0.8271604938271605
17
- yi_large,0.8148148148148148
18
- claude_3_sonnet,0.8024691358024691
19
- llama3_70b_instruct,0.7901234567901234
20
- phi3_medium_4k,0.7777777777777778
21
- qwen2_72b_32k,0.7654320987654321
22
- deepseek_v2_chat,0.7530864197530864
23
- llama3_70b,0.7407407407407407
24
- qwen1.5_72b_chat,0.7283950617283951
25
- llama3.1_70b,0.7160493827160493
26
- yi_1.5_34b_chat,0.7037037037037037
27
- gemma_2_9b_it,0.691358024691358
28
- phi3_medium_128k,0.6790123456790124
29
- mammoth2_8x7b_plus,0.6666666666666666
30
- qwen1.5_110b,0.654320987654321
31
- glm_4_9b_chat,0.6419753086419753
32
- glm_4_9b,0.6296296296296297
33
- phi_3.5_mini_instruct,0.6172839506172839
34
- qwen2_7b_instruct,0.6049382716049383
35
- yi_1.5_9b_chat,0.5925925925925926
36
- phi3_mini_4k,0.5802469135802469
37
- gemma_2_9b,0.5679012345679012
38
- mistral_nemo_instruct_2407,0.5555555555555556
39
- llama3.1_8b_instruct,0.5432098765432098
40
- phi3_mini_128k,0.5308641975308642
41
- mammoth2_8b_plus,0.5185185185185185
42
- mixtral_8x7b_instruct_v0.1,0.5061728395061729
43
- yi_34b,0.49382716049382713
44
- mathstral_7b_v0.1,0.48148148148148145
45
- deepseek_coder_v2_lite_instruct,0.4691358024691358
46
- mixtral_8x7b_v0.1,0.4567901234567901
47
- llama3_8b_instruct,0.4444444444444444
48
- mammoth2_7b_plus,0.43209876543209874
49
- qwen2_7b,0.41975308641975306
50
- mistral_nemo_base_2407,0.4074074074074074
51
- wizardlm_2_8x22b,0.3950617283950617
52
- yi_1.5_6b_chat,0.38271604938271603
53
- qwen1.5_14b_chat,0.37037037037037035
54
- c4ai_command_r_v01,0.345679012345679
55
- staring_7b,0.345679012345679
56
- llama_2_70b,0.3333333333333333
57
- openchat_3.5_8b,0.32098765432098764
58
- internmath_20b_plus,0.30864197530864196
59
- llama3_smaug_8b,0.2962962962962963
60
- llama3.1_8b,0.2839506172839506
61
- llama3_8b,0.2716049382716049
62
- deepseekmath_7b_instruct,0.25925925925925924
63
- deepseek_coder_v2_lite_base,0.24691358024691357
64
- gemma_7b,0.2345679012345679
65
- internmath_7b_plus,0.2222222222222222
66
- zephyr_7b_beta,0.20987654320987653
67
- mistral_7b_v0.1,0.19753086419753085
68
- mistral_7b_instruct_v0.2,0.18518518518518517
69
- mistral_7b_v0.2,0.1728395061728395
70
- qwen1.5_7b_chat,0.16049382716049382
71
- yi_6b_chat,0.14814814814814814
72
- neo_7b_instruct,0.13580246913580246
73
- yi_6b,0.12345679012345678
74
- neo_7b,0.1111111111111111
75
- mistral_7b_instruct_v0.1,0.09876543209876543
76
- llama_2_13b,0.08641975308641975
77
- llemma_7b,0.07407407407407407
78
- qwen2_1.5b_instruct,0.06172839506172839
79
- qwen2_1.5b,0.04938271604938271
80
- llama_2_7b,0.037037037037037035
81
- qwen2_0.5b_instruct,0.024691358024691357
82
- gemma_2b,0.012345679012345678
83
- qwen2_0.5b,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/aggregate_scoress_cache_230b5a189df3af8cde801ce251b7b2ef.csv DELETED
@@ -1,71 +0,0 @@
1
- model,score
2
- claude_3_5_sonnet_20240620,1.0
3
- gpt_4o_2024_08_06,0.9855072463768116
4
- chatgpt_4o_latest,0.9710144927536232
5
- gpt_4o_2024_05_13,0.9565217391304348
6
- llama3.1_405b_instruct_turbo,0.9420289855072463
7
- gemini_1.5_pro_exp_0827,0.927536231884058
8
- gpt_4_turbo_2024_04_09,0.9130434782608695
9
- gemini_1.5_pro_exp_0801,0.8985507246376812
10
- claude_3_opus_20240229,0.8840579710144928
11
- gpt_4_0125_preview,0.8695652173913043
12
- dracarys_llama3.1_70b_instruct,0.855072463768116
13
- llama3.1_70b_instruct_turbo,0.8405797101449275
14
- mistral_large_2407,0.8260869565217391
15
- gemini_1.5_flash_exp_0827,0.8115942028985508
16
- deepseek_coder_v2,0.7971014492753623
17
- deepseek_chat_v2,0.782608695652174
18
- gpt_4_0613,0.7681159420289855
19
- gemini_1.5_pro_api_0514,0.7536231884057971
20
- gpt_4o_mini_2024_07_18,0.7391304347826086
21
- gemma_2_27b_it,0.7246376811594203
22
- dracarys_72b_instruct,0.7101449275362319
23
- qwen2_72b_instruct,0.6956521739130435
24
- hermes_3_llama3.1_70b,0.6811594202898551
25
- gemini_1.5_flash_api_0514,0.6666666666666666
26
- smaug_qwen2_72b_instruct,0.6521739130434783
27
- mistral_large_2402,0.6376811594202898
28
- claude_3_sonnet_20240229,0.6231884057971014
29
- llama3_70b_instruct,0.6086956521739131
30
- claude_3_haiku_20240307,0.5942028985507246
31
- mixtral_8x22b_instruct_v0.1,0.5797101449275363
32
- phi_3.5_moe_instruct,0.5652173913043478
33
- gpt_3.5_turbo_0125,0.5507246376811594
34
- mistral_small_2402,0.5362318840579711
35
- command_r_plus,0.5217391304347826
36
- gemma_2_9b_it,0.5072463768115942
37
- phi_3_medium_4k_instruct,0.4927536231884058
38
- phi_3_medium_128k_instruct,0.4782608695652174
39
- phi_3_small_128k_instruct,0.463768115942029
40
- qwen1.5_110b_chat,0.4492753623188406
41
- deepseek_coder_v2_lite_instruct,0.43478260869565216
42
- qwen1.5_72b_chat,0.42028985507246375
43
- open_mistral_nemo,0.4057971014492754
44
- phi_3.5_mini_instruct,0.391304347826087
45
- llama3.1_8b_instruct_turbo,0.37681159420289856
46
- phi_3_small_8k_instruct,0.36231884057971014
47
- llama3_8b_instruct,0.34782608695652173
48
- command_r,0.3333333333333333
49
- qwen2_7b_instruct,0.3188405797101449
50
- phi_3_mini_128k_instruct,0.30434782608695654
51
- phi_3_mini_4k_instruct,0.2898550724637681
52
- mathstral_7b_v0.1,0.2753623188405797
53
- openhermes_2.5_mistral_7b,0.2608695652173913
54
- mixtral_8x7b_instruct_v0.1,0.2463768115942029
55
- mistral_7b_instruct_v0.3,0.2318840579710145
56
- mistral_7b_instruct_v0.2,0.21739130434782608
57
- gemma_1.1_7b_it,0.2028985507246377
58
- zephyr_7b_alpha,0.18840579710144928
59
- qwen1.5_7b_chat,0.17391304347826086
60
- deepseek_v2_lite_chat,0.15942028985507245
61
- zephyr_7b_beta,0.14492753623188406
62
- starling_lm_7b_beta,0.13043478260869565
63
- vicuna_7b_v1.5_16k,0.11594202898550725
64
- vicuna_7b_v1.5,0.10144927536231885
65
- llama_2_7b_chat,0.08695652173913043
66
- qwen1.5_4b_chat,0.07246376811594203
67
- qwen2_1.5b_instruct,0.057971014492753624
68
- yi_6b_chat,0.043478260869565216
69
- qwen2_0.5b_instruct,0.028985507246376812
70
- qwen1.5_1.8b_chat,0.014492753623188406
71
- qwen1.5_0.5b_chat,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/aggregate_scoress_cache_2d8c9f9c6d96807c68a9475184afcecb.csv DELETED
@@ -1,686 +0,0 @@
1
- model,score
2
- claude_3_5_sonnet_20240620,1.0
3
- gpt_4o_20240513,1.0
4
- calme_2.1_qwen2_72b,1.0
5
- shopee_slimmoa_v1,1.0
6
- calme_2.2_qwen2_72b,0.9970414201183432
7
- blendax.ai_gm_l6_vo31,0.9947368421052631
8
- magnum_72b_v1,0.9911242603550295
9
- gemma_2_9b_it_wpo_hb,0.9894736842105263
10
- gpt_4o_2024_05_13,0.984963768115942
11
- blendax.ai_gm_l3_v35,0.9842105263157894
12
- claude_3.5_sonnet,0.9830508474576272
13
- calme_2.2_llama3_70b,0.9822485207100592
14
- llama3_tenyxchat_70b,0.9763313609467456
15
- openpipe_moa_gpt_4_turbo,0.9736842105263158
16
- claude_3.5_sonnet_20240620,0.971830985915493
17
- chatgpt_4o_latest,0.9710144927536232
18
- rys_llama3_large_instruct,0.9704142011834319
19
- text_davinci_002,0.9696969696969697
20
- gpt_4o_2024_08_06,0.9677536231884059
21
- qwen2_72b,0.9674556213017751
22
- gemini_1.5_pro,0.9661016949152542
23
- together_moa,0.9631578947368421
24
- smaug_llama3_70b_instruct_32k,0.9615384615384616
25
- rys_llama3_huge_instruct,0.9585798816568047
26
- llama3_pbm_nova_70b,0.9578947368421052
27
- zephyr_orpo_141b_a35b_v0.1,0.9526627218934911
28
- storm_7b_best_of_64,0.9526315789473684
29
- together_moa_lite,0.9473684210526315
30
- llama3.1_instruct_turbo_405b,0.9436619718309859
31
- 09,0.9421052631578948
32
- llama3.1_405b_instruct_turbo,0.9420289855072463
33
- calme_2.4_llama3_70b,0.9408284023668639
34
- gpt_4_turbo_2024_04_09,0.9399808331689967
35
- cohere_command_beta_52.4b,0.9393939393939394
36
- internlm2_5_20b_chat,0.9378698224852071
37
- 13,0.9368421052631579
38
- dolphin_2.9.2_qwen2_72b,0.9349112426035503
39
- multiverse_70b,0.9319526627218935
40
- higgs_llama3_70b_v2,0.9315789473684211
41
- llama3.1_instruct_turbo_70b,0.9295774647887324
42
- barcenas_14b_phi_3_medium_orpo,0.9289940828402367
43
- gemini_1.5_pro_exp_0827,0.927536231884058
44
- sppo_gemma_2_9b_it_pairrm,0.9263157894736842
45
- c4ai_command_r_plus,0.9260355029585798
46
- text_davinci_003,0.9242424242424242
47
- internlm2_5_7b_chat,0.9230769230769231
48
- llama3_instruct_8b_wpo_hb_v2,0.9210526315789473
49
- llama3_70b_shiningvaliant2,0.9201183431952663
50
- qwen2_57b_a14b_instruct,0.9171597633136095
51
- gpt_4o_mini,0.9166666666666666
52
- 20,0.9157894736842105
53
- deepseek_v2_chat_0628_api,0.9152542372881356
54
- qwen1.5_110b,0.9142011834319527
55
- gpt_4_0125_preview,0.9115123229345778
56
- yi_1.5_34b_chat_16k,0.908284023668639
57
- 18,0.9052631578947369
58
- qwen2_instruct_72b,0.9014084507042254
59
- gemini_1.5_pro_api_preview,0.9
60
- storm_7b,0.9
61
- blossom_v5.1_34b,0.8994082840236687
62
- gemini_1.5_pro_exp_0801,0.8985507246376812
63
- rys_phi_3_medium_4k_instruct,0.8964497041420119
64
- gpt_4o_mini_20240718,0.8947368421052632
65
- 06,0.8947368421052632
66
- configurable_llama3.1_8b_instruct,0.8905325443786982
67
- infinity_instruct_7m_gen_llama3_1_70b,0.8894736842105263
68
- mistral_large_2_2407,0.8873239436619719
69
- llama3_70b,0.8867405617134761
70
- chocolatine_3b_instruct_dpo_revised,0.8846153846153846
71
- expo_+_llama3_instruct_8b_simpo,0.8842105263157894
72
- claude_3_opus,0.8813559322033898
73
- tnlg_v2_530b,0.8787878787878788
74
- nous_hermes_2_mixtral_8x7b_dpo,0.8757396449704142
75
- nanbeige_plus_chat_v0.1,0.8736842105263158
76
- gemini_1.5_pro_001,0.8732394366197183
77
- athene_70b,0.8649717514124293
78
- gemini_1.5_flash,0.864406779661017
79
- yi_1.5_34b_32k,0.863905325443787
80
- aligner_2b+claude_3_opus,0.8631578947368421
81
- barcenas_llama3_8b_orpo,0.8609467455621301
82
- nanbeige2_16b_chat,0.8578947368421053
83
- dracarys_llama3.1_70b_instruct,0.855072463768116
84
- mistral_large_2407,0.8547101449275363
85
- llama3.1_405b_instruct,0.8543859649122807
86
- llama3.1_70b_instruct,0.8530727706841068
87
- 29,0.8526315789473684
88
- llama3.1_70b,0.8520710059171598
89
- yi_34bx2_moe_60b_dpo,0.8520710059171598
90
- glm_4_0520,0.85
91
- phi_3_mini_4k_instruct_cpo_simpo,0.849112426035503
92
- llama30b,0.8484848484848485
93
- infinity_instruct_7m_gen_mistral_7b,0.8473684210526315
94
- dolphin_2.9.2_phi_3_medium,0.8461538461538461
95
- mixtral_8x22b,0.8450704225352113
96
- llama3_instruct_8b_simpo,0.8447991279975086
97
- gritlm_8x7b_kto,0.8431952662721893
98
- llama3.1_70b_instruct_turbo,0.8405797101449275
99
- mixtral_8x22b_v0.3,0.8402366863905325
100
- sppo_llama3_instruct_8b_pairrm,0.8368421052631579
101
- anthropic_lm_v4_s3_52b,0.8333333333333334
102
- yi_1.5_34b,0.8313609467455622
103
- gpt_4_turbo_1106_preview,0.8309859154929577
104
- deepseek_v2_coder_0614_api,0.8305084745762712
105
- hermes_3_llama3.1_70b,0.8302246805591287
106
- c4ai_command_r_v01,0.8284023668639053
107
- arcee_spark,0.8254437869822485
108
- yi_large,0.8234463276836159
109
- gpt_4,0.8210526315789474
110
- claude_3_opus_20240229,0.8195686194461455
111
- humanish_rp_llama3.1_8b,0.8195266272189349
112
- smaug_qwen2_72b_instruct,0.8186905068175971
113
- palmyra_x_v3_72b,0.8169014084507042
114
- qwen2_57b_a14b,0.8165680473372781
115
- infinity_instruct_3m_0625_llama3_70b,0.8157894736842105
116
- gemini_1.5_flash_exp_0827,0.8115942028985508
117
- aligner_2b+qwen1.5_72b_chat,0.8105263157894737
118
- blossom_v5.1_9b,0.8076923076923077
119
- deepseek_coder_v2,0.8068840579710145
120
- gemma_2_9b_it_dpo,0.8062444246208742
121
- qwen2_72b_instruct,0.8060674423919884
122
- aya_23_35b,0.8047337278106509
123
- gemma_2_27b_it,0.8036174652870135
124
- gemma_2_instruct_27b,0.8028169014084507
125
- bagelmisterytour_v2_8x7b,0.8017751479289941
126
- 14,0.8
127
- calme_2.1_phi3_4b,0.7988165680473372
128
- yi_large_preview,0.7973418267559564
129
- llama3_instruct_8b_cpo_simpo,0.7958579881656804
130
- ein_70b_v0.1,0.7947368421052632
131
- maid_yuzu_v7,0.7928994082840237
132
- fsfairx_zephyr_chat_v0.1,0.7894736842105263
133
- gemini_1.5_flash_001,0.7887323943661971
134
- palmyra_x_43b,0.7878787878787878
135
- notux_8x7b_v1,0.7869822485207101
136
- mixtral_8x22b_v0.1,0.7855808159451885
137
- gpt_4_0613,0.7855378648703817
138
- llama3_70b_instruct,0.7843069749718884
139
- llama3_cantonese_8b_instruct,0.7840236686390533
140
- deepseek_chat_v2,0.782608695652174
141
- openbuddy_llama3.1_8b_v22.2_131k,0.7810650887573964
142
- nemotron_4_340b_inst,0.7796610169491526
143
- infinity_instruct_7m_gen_llama3_1_8b,0.7789473684210526
144
- roleplay_llama3_8b,0.7781065088757396
145
- 02,0.7736842105263158
146
- qwen1.5_32b,0.7714601216768064
147
- yi_1.5_34b_chat,0.7702354371537107
148
- gpt_4o_mini_2024_07_18,0.7700499237132448
149
- llama3_instruct_8b_sppo_iter2,0.7692307692307693
150
- expo_+_sppo_mistral7b_pairrm,0.7684210526315789
151
- configurable_yi_1.5_9b_chat,0.7662721893491125
152
- phi_3.5_moe_instruct,0.7648572163622331
153
- smaug_34b_v0.1,0.7633136094674556
154
- merlinite_7b_aot,0.7631578947368421
155
- palm_2_unicorn,0.7605633802816901
156
- qwen2_7b,0.7603550295857988
157
- falcon_instruct_40b,0.7575757575757576
158
- gemma_2_27b,0.757396449704142
159
- gemma_2_9b_it_simpo,0.7550089997835828
160
- qwen1.5_110b_chat,0.7546031756778104
161
- seallms_v3_7b_chat,0.7544378698224852
162
- gemini_1.5_pro_api_0514,0.7536231884057971
163
- infinity_instruct_3m_0613_llama3_70b,0.7526315789473684
164
- samba_coe_v0.2_best_of_16,0.7526315789473684
165
- qwen2_cantonese_7b_instruct,0.7514792899408284
166
- glm_4_0116,0.75
167
- hermes_3_llama3.1_8b,0.7485207100591716
168
- qwen1.5_72b,0.7464788732394366
169
- mistral_large_2,0.7457627118644068
170
- luxia_21.4b_alignment_v1.2,0.7455621301775148
171
- suzume_llama3_8b_multilingual_orpo_borda_top75,0.742603550295858
172
- mpt_instruct_30b,0.7424242424242424
173
- rebel_llama3_8b_instruct,0.7421052631578947
174
- infinity_instruct_3m_0625_mistral_7b,0.7421052631578947
175
- suzume_llama3_8b_multilingual_orpo_borda_top25,0.7396449704142012
176
- nous_hermes_2_solar_10.7b,0.7366863905325444
177
- calme_2.2_phi3_4b,0.7337278106508875
178
- glm_4_air,0.7333333333333333
179
- palmyra_x_v2_33b,0.7323943661971831
180
- sppo_mistral7b_pairrm,0.7315789473684211
181
- llama3_instruct_8b_sppo_iter3,0.7307692307692307
182
- claude_3_sonnet,0.7288135593220338
183
- calme_2.3_phi3_4b,0.727810650887574
184
- mpt_30b,0.7272727272727273
185
- snorkel_mistral_pairrm_dpo+best_of_16,0.7263157894736842
186
- qwen1.5_32b_chat,0.725864216754905
187
- k2_chat,0.7248520710059172
188
- yi_1.5_9b_chat_16k,0.7218934911242604
189
- contextual_ai_kto_mistral_pairrm,0.7210526315789474
190
- luxia_21.4b_alignment_v1.0,0.7189349112426036
191
- gemma_2_instruct_9b,0.7183098591549296
192
- gpt_4_0314,0.7166666666666667
193
- llama3_refueled,0.7159763313609467
194
- pairrm_0.4b+yi_34b_chat_best_of_16,0.7157894736842105
195
- openchat_3.5_1210,0.7130177514792899
196
- dracarys_72b_instruct,0.7101449275362319
197
- configurablebeagle_11b,0.7100591715976331
198
- carbonbeagle_11b,0.7071005917159763
199
- mixtral_8x22b_instruct_v0.1,0.7062215933453392
200
- claude_2,0.7052631578947368
201
- mistral_nemo_instruct_2407,0.7041420118343196
202
- yi_34b,0.7027043920326694
203
- llama_2_70b,0.7006139400505598
204
- gemini_1.5_flash_api_preview,0.7
205
- samba_coe_v0.2,0.7
206
- openbuddy_mixtral_7bx8_v18.1_32k,0.6982248520710059
207
- j1_grande_v2_beta_17b,0.696969696969697
208
- vicuna_v1.3_13b,0.696969696969697
209
- deepseek_llm_67b_chat,0.6954375583930239
210
- chocolatine_8b_instruct_dpo_v1.0,0.6923076923076923
211
- qwen1.5_chat_110b,0.6901408450704225
212
- claude,0.6894736842105263
213
- yi_1.5_9b,0.6893491124260355
214
- openbuddy_llama3_8b_v21.2_32k,0.6863905325443787
215
- internlm2.5_chat_7b,0.6842105263157895
216
- rys_llama3_8b_instruct,0.6834319526627219
217
- phi_3_small_128k_instruct,0.6830674899236772
218
- cohere_command_beta_6.1b,0.6818181818181818
219
- infinity_instruct_3m_0625_llama3_8b,0.6816879476798505
220
- nous_hermes_2_mixtral_8x7b_sft,0.6804733727810651
221
- expo_+_internlm2_chat_20b,0.6789473684210526
222
- reka_core,0.6779661016949152
223
- hermes_2_pro_mistral_7b,0.6775147928994083
224
- hermes_2_pro_llama3_8b,0.6745562130177515
225
- openchat_3.5,0.6715976331360947
226
- expo_+_starling_lm_7b_beta,0.6684210526315789
227
- cohere_xlarge_v20221108_52.4b,0.6666666666666666
228
- gemini_1.5_flash_api_0514,0.6666666666666666
229
- exaone_3.0_7.8b_instruct,0.665680473372781
230
- phi_3_medium_4k_instruct,0.6641525884000801
231
- expo_+_tulu_2_dpo_70b,0.6631578947368421
232
- lion_llama3_8b_dpo_v1.0,0.6627218934911243
233
- claude_v1.3,0.6619718309859155
234
- openhermes_2_mistral_7b,0.6597633136094675
235
- gemma_2_9b_it,0.6572979514989604
236
- carbonbeagle_11b_truthy,0.6568047337278107
237
- suzume_llama3_8b_multilingual_orpo_borda_half,0.6538461538461539
238
- infinity_instruct_3m_0613_mistral_7b,0.6526315789473685
239
- calm3_22b_chat,0.650887573964497
240
- palm_2_bison,0.647887323943662
241
- gemma_2_9b_it_sppo_iter2,0.6449704142011834
242
- nanbeige2_8b_chat,0.6368421052631579
243
- phi_3.5_mini_instruct,0.6364805762799074
244
- vicuna_v1.3_7b,0.6363636363636364
245
- nous_hermes_2_mistral_7b_dpo,0.636094674556213
246
- mixtral_8x7b_32k_seqlen,0.6338028169014085
247
- dolphin_2.9.2_qwen2_7b,0.6331360946745562
248
- xwinlm_70b_v0.1,0.631578947368421
249
- gemma_2_9b,0.6301775147928994
250
- llama3.1_instruct_nsfw_pretrained_e1_plus_reddit,0.6272189349112426
251
- gemini_pro,0.6263157894736842
252
- gemma_2_9b_it_sppo_iter_1,0.621301775147929
253
- opt_175b,0.6212121212121212
254
- phi_3_14b,0.6197183098591549
255
- lion_llama3_8b_sft_v1.0,0.6183431952662722
256
- yi_1.5_9b_chat,0.6175945329173903
257
- mistral_medium,0.6135964912280703
258
- gemma_2_9b_it_sppo_iter_1_evol_1,0.6124260355029586
259
- evo_v2_7b,0.6105263157894737
260
- claude_3_haiku,0.6101694915254238
261
- llama3_korean_bllossom_8b,0.6094674556213018
262
- einstein_v6.1_llama3_8b,0.606508875739645
263
- ghost_8b_beta_d0x5,0.6052631578947368
264
- openbuddy_llama3_8b_v21.1_8k,0.6035502958579881
265
- yi_34b_200k,0.6005917159763313
266
- yi_34b_chat,0.6003789058444928
267
- mixtral_8x7b_v0.1,0.5993148551853005
268
- sauerkrautlm_una_solar_instruct,0.5976331360946746
269
- mistral_v0.1_7b,0.5969910371318822
270
- samba_coe_v0.1,0.5947368421052631
271
- solar_10.7b_instruct_v1.0,0.5946745562130178
272
- mistral_nemo_inst_12b,0.5932203389830508
273
- yi_1.5_9b_32k,0.591715976331361
274
- deepseek_llm_chat_67b,0.5915492957746479
275
- llama_13b,0.5909090909090909
276
- expo_+_internlm2_chat_7b,0.5894736842105263
277
- suzume_llama3_8b_multilingual_orpo_borda_full,0.5887573964497042
278
- llama3.1_8b_instruct,0.587304058963978
279
- configurablehermes_7b,0.5857988165680473
280
- phi_3_mini_4k_instruct,0.5842766486579196
281
- infinity_instruct_3m_0625_qwen2_7b,0.5842105263157895
282
- silicon_maid_7b,0.5798816568047337
283
- pairrm_0.4b+tulu_2+dpo_70b_best_of_16,0.5789473684210527
284
- gpt_3.5_turbo_0613,0.5787238583013231
285
- phi_3_7b,0.5774647887323944
286
- dolphin_2.9.3_mistral_7b_32k,0.5769230769230769
287
- mistral_large,0.576271186440678
288
- instructpalmyra_30b,0.5757575757575758
289
- lion_llama3_8b_odpo_v1.0,0.5739644970414202
290
- tulu_2+dpo_70b,0.5736842105263158
291
- gritlm_7b_kto,0.5710059171597633
292
- claude_3_sonnet_20240229,0.5707967612437912
293
- openbuddy_zero_14b_v22.3_32k,0.5680473372781065
294
- llama_65b,0.5679416887434222
295
- recurrentgemma_9b_it,0.5650887573964497
296
- claude_instant_1.2,0.5613417346182358
297
- cohere_xlarge_v20220609_52.4b,0.5606060606060606
298
- mistral_7b_remax_v0.1,0.5578947368421052
299
- configurablesolar_10.7b,0.5562130177514792
300
- einstein_v6.1_developed_by_weyaxi_llama3_8b,0.5562130177514792
301
- qwen1.5_14b,0.5541711809317443
302
- neuralbeagle14_7b,0.5532544378698225
303
- infinity_instruct_3m_0625_yi_1.5_9b,0.5526315789473685
304
- qwen1.5_72b_chat,0.5518426870418492
305
- expo_+_starling_lm_7b_alpha,0.5473684210526316
306
- jurassic_2_large_7.5b,0.5454545454545454
307
- dbrx_instructruct,0.5450454204517043
308
- notus_7b_v1,0.5443786982248521
309
- lmcocktail_10.7b_v1,0.5421052631578948
310
- dolphin_2.9_llama3_8b,0.5414201183431953
311
- llama3_8b_instruct_gradient_1048k,0.5355029585798816
312
- command_r_plus,0.5331641531824205
313
- llama3.1_8b_fireplace2,0.5325443786982249
314
- jurassic_2_jumbo_178b,0.5320102432778488
315
- 01,0.531578947368421
316
- davinci_175b,0.5303030303030303
317
- glm_4_9b,0.5295857988165681
318
- xwinlm_13b_v0.1,0.5263157894736842
319
- gpt_3.5_turbo_0301,0.5257575757575758
320
- qwen1.5_14b_chat,0.5252984532336759
321
- mistral_large_2402,0.5252364428114581
322
- mistral_7b_openorca,0.5236686390532544
323
- yi_9b,0.5207100591715976
324
- qwen2_7b_instruct,0.5178342262482379
325
- mistral_nemo_minitron_8b_base,0.5177514792899408
326
- gpt_3.5,0.5157894736842106
327
- llama_7b,0.5151515151515151
328
- yi_9b_200k,0.5118343195266272
329
- alphamonarch_7b,0.5118343195266272
330
- neuralllama3_8b_orpo_v0.3,0.5088757396449705
331
- magpie_8b_align_v0.1,0.5084745762711864
332
- gpt_3.5_text_davinci_003,0.5070422535211268
333
- decilm_7b_instruct,0.5059171597633136
334
- claude_2.0,0.5028169014084507
335
- expo_+_tulu_2_dpo_13b,0.5
336
- wizardlm_70b,0.5
337
- internlm2.5_20b_chat,0.5
338
- mistral7b_pairrm_sppo_iter2,0.5
339
- redpajama_incite_instruct_7b,0.5
340
- llama3_8b_magpie_align_v0.3,0.4970414201183432
341
- pairrm_0.4b+tulu_2+dpo_13b_best_of_16,0.49473684210526314
342
- solar_10.7b_v1.0,0.4940828402366864
343
- merlinite_7b,0.4911242603550296
344
- claude_2.1,0.48860472778189606
345
- einstein_v4_7b,0.4881656804733728
346
- j1_jumbo_v1_178b,0.48484848484848486
347
- conifer_7b_dpo,0.4842105263157895
348
- dictalm2.0_instruct,0.4822485207100592
349
- yi_1.5_6b,0.47928994082840237
350
- evo_7b,0.4789473684210526
351
- gemini_1.0_pro_002,0.4788732394366197
352
- mistral_7b_v0.3,0.4786515104328869
353
- glm_4_9b_chat,0.47836972835257335
354
- phi_3_medium_128k_instruct,0.4782608695652174
355
- llama3_8b_magpie_align_v0.1,0.47633136094674555
356
- snorkel_mistral_pairrm_dpo,0.4758771929824561
357
- claude_3_haiku_20240307,0.47490644349186906
358
- llama3_inst_8b_simpo,0.4745762711864407
359
- mistral7b_pairrm_sppo_iter3,0.47337278106508873
360
- stablelm_2_12b_chat,0.47041420118343197
361
- glm_130b,0.4696969696969697
362
- humpback_llama2_70b,0.46842105263157896
363
- aya_23_8b,0.46745562130177515
364
- mistral_next,0.4666666666666667
365
- llama3_neuralhercules_5.0_8b,0.46449704142011833
366
- deita_7b_v1.0,0.4631578947368421
367
- zephyr_7b_gemma_v0.1,0.46153846153846156
368
- josiev4o_8b_stage1_v4,0.45857988165680474
369
- openhermes_2.5_mistral_7b,0.45808701068338453
370
- jinachat,0.45789473684210524
371
- jurassic_2_grande_17b,0.45785317968416556
372
- llama3_8b_instruct,0.45427998888105275
373
- tempnet_llama2_chat_70b_v0.1,0.45263157894736844
374
- dbrx_instruct,0.4508028545941124
375
- go_bruins_v2,0.44970414201183434
376
- llama_2_13b,0.44800618906794415
377
- causallm_14b,0.4473684210526316
378
- ennoai_pro_french_llama3_8b_v0.4,0.4437869822485207
379
- pairrm_0.4b+zephyr_7b_beta_best_of_16,0.4421052631578947
380
- mistral_7b_v0.2,0.44180940516972905
381
- llama_pro_8b_instruct,0.4408284023668639
382
- llama3_inst_8b_simpo_v0.2,0.4406779661016949
383
- opt_66b,0.4393939393939394
384
- mistral_nemo_base_2407,0.4378698224852071
385
- phi_3_mini_128k_instruct,0.435111339793614
386
- falcon_mamba_7b,0.4349112426035503
387
- deepseek_coder_v2_lite_instruct,0.43478260869565216
388
- dbrx_instructruct_preview,0.43333333333333335
389
- decilm_7b,0.4319526627218935
390
- orpollama3_8b,0.4289940828402367
391
- qwen1.5_moe_a2.7b_chat,0.4260355029585799
392
- bloom_176b,0.42424242424242425
393
- llama3_inst_8b_simpo_expo,0.423728813559322
394
- deepseek_llm_7b_chat,0.4230769230769231
395
- phi_3_small_8k_instruct,0.42282608695652174
396
- llama2_chat_70b,0.42105263157894735
397
- mistral_orpo_beta,0.42105263157894735
398
- k2,0.42011834319526625
399
- mistral_7b_v0.1,0.4171597633136095
400
- internlm2_20b_chat,0.4166666666666667
401
- mistral_7b_v0.1_signtensors_1_over_2,0.41420118343195267
402
- phi_2_instruct_v0.1,0.41124260355029585
403
- openchat_v3.1_13b,0.4105263157894737
404
- wizardlm_13b_v1.2,0.4105263157894737
405
- gemma_7b,0.4094299524960413
406
- j1_grande_v1_17b,0.4090909090909091
407
- mistral_small_2402,0.4089610124515207
408
- mistral_nemo_2402,0.4084507042253521
409
- windyflollm,0.40828402366863903
410
- selm_llama3_8b_inst_iter3,0.4067796610169492
411
- open_mistral_nemo,0.4057971014492754
412
- ultralm_13b_v2.0_best_of_16,0.4052631578947368
413
- llama3_8b,0.404346195516293
414
- falcon_40b,0.40117105718405827
415
- internlm2_chat_20b,0.4
416
- expo_+_zephyr_7b_beta,0.4
417
- mistral_7b_v0.1_signtensors_7_over_16,0.3994082840236686
418
- gpt_3.5_turbo_0125,0.39619258167526406
419
- wizardlm_13b_v1.1,0.39473684210526316
420
- mixtral_8x7b_instruct_v0.1,0.3943864275430021
421
- arctic_instruct,0.39436619718309857
422
- dclm_7b,0.39349112426035504
423
- starling_lm_7b_alpha,0.3928821066472888
424
- expo_+_zephyr_7b_alpha,0.3894736842105263
425
- stablelm_2_12b,0.3875739644970414
426
- hebrew_gemma_11b_instruct,0.38461538461538464
427
- dolphin_2.2.1_mistral_7b,0.37894736842105264
428
- falcon_11b,0.378698224852071
429
- llama3.1_8b,0.378698224852071
430
- llama3.1_8b_instruct_turbo,0.37681159420289856
431
- mistral_7b_v0.1_signtensors_3_over_8,0.3757396449704142
432
- humpback_llama_65b,0.3736842105263158
433
- phi_3_medium_128k,0.3728813559322034
434
- flan_flan-ul2,0.3698224852071006
435
- openbudddy_llama2_70b_v10.1,0.3684210526315789
436
- gpt_3.5_text_davinci_002,0.36619718309859156
437
- recurrentgemma_9b,0.363905325443787
438
- redpajama_incite_base_7b,0.36363636363636365
439
- openbuddy_llama_65b_v8,0.3631578947368421
440
- luminous_supreme_70b,0.36096884336320956
441
- flan_t5_xxl,0.3609467455621302
442
- qwen_14b_chat,0.35789473684210527
443
- hermes_2_theta_llama3_8b,0.3559322033898305
444
- ende_chat_0.0.7,0.35502958579881655
445
- yi_1.5_6b_chat,0.35277832028672623
446
- zephyr_7b_beta,0.35192176049419494
447
- cohere_large_v20220720_13.1b,0.3484848484848485
448
- gpt_4_adversarial,0.3473684210526316
449
- cut_13b,0.3473684210526316
450
- mistral_7b_instruct_v0.1,0.34615384615384615
451
- starcoder2_15b,0.3431952662721893
452
- openchat_v2_w_13b,0.34210526315789475
453
- qwen1.5_moe_a2.7b,0.34023668639053256
454
- starling_lm_7b_beta_expo,0.3389830508474576
455
- hare1.0_beta,0.33727810650887574
456
- zephyr_7b_alpha,0.3339531832754857
457
- redpajama_incite_instruct_v1_3b,0.3333333333333333
458
- expo_+_tulu_2_dpo_7b,0.33157894736842103
459
- vicuna_13b_v1.5_together,0.33157894736842103
460
- qwen1.5_7b,0.32900658388199017
461
- lion_gemma_2b_sft_v1.0,0.32840236686390534
462
- stablelm_zephyr_3b,0.32840236686390534
463
- tulu_2+dpo_13b,0.3263157894736842
464
- nxcode_cq_7b_orpo,0.3254437869822485
465
- command,0.323943661971831
466
- autotrain_llama3_orpo_v2,0.3224852071005917
467
- selm_zephyr_7b_iter3,0.3220338983050847
468
- ennoai_pro_llama3_8b,0.31952662721893493
469
- text_curie_001,0.3181818181818182
470
- mistral_7b_v0.1_signtensors_5_over_16,0.3165680473372781
471
- claude2_alpaca_13b,0.3157894736842105
472
- minotaur_13b,0.3157894736842105
473
- internlm2_5_1_8b_chat,0.3136094674556213
474
- mistral_v0.3_7b_orpo,0.3106508875739645
475
- airoboros_65b,0.3105263157894737
476
- yi_6b_200k,0.3076923076923077
477
- llama_2_7b,0.30711229302778603
478
- cohere_command,0.30526315789473685
479
- reka_flash,0.3050847457627119
480
- flan_t5_xl,0.3047337278106509
481
- openbuddy_zero_3b_v21.2_32k,0.30177514792899407
482
- lion_gemma_2b_dpo_v1.0,0.2988165680473373
483
- llama3.1_instruct_turbo_8b,0.29577464788732394
484
- xwinlm_7b_v0.1,0.29473684210526313
485
- vicuna_13b_v1.3,0.29473684210526313
486
- h2o_danube3_4b_chat,0.29289940828402367
487
- lion_gemma_2b_odpo_v1.0,0.29289940828402367
488
- airoboros_33b,0.2894736842105263
489
- mistral_7b_instruct_v0.2,0.2888078325695241
490
- gemma_2_2b_it,0.288135593220339
491
- qwen1.5_4b,0.2869822485207101
492
- llama_2_13b_chat,0.28402366863905326
493
- vicuna_33b_v1.3,0.2833333333333333
494
- vicuna_13b_v1.5,0.2789473684210526
495
- platolm_7b,0.2789473684210526
496
- yi_6b,0.2779398283190266
497
- mathstral_7b_v0.1,0.2753623188405797
498
- hare_1.1b_base_0.5v,0.27514792899408286
499
- cohere_medium_v20221108_6.1b,0.2727272727272727
500
- olmo_7b_instruct,0.27218934911242604
501
- internlm2_chat_1_8b,0.2692307692307692
502
- gemma_1.1_7b_it,0.2686190435354315
503
- gemma_instruct_7b,0.26842105263157895
504
- openchat_v2_13b,0.26842105263157895
505
- mistral_7b_instruct_v0.3,0.2646714118286025
506
- qwen2_1.5b,0.26331360946745563
507
- deepseek_moe_16b_chat,0.2603550295857988
508
- openbuddy_llama30b_v7.1,0.2578947368421053
509
- redpajama_incite_base_v1_3b,0.25757575757575757
510
- gemma_2_2b,0.257396449704142
511
- flan_t5_large,0.25443786982248523
512
- jamba_instruct,0.2535211267605634
513
- command_r,0.25324162489058644
514
- gpt_3.5_turbo_1106,0.25
515
- stablelm_2_zephyr_1_6b,0.2485207100591716
516
- luminous_extended_30b,0.24839948783610755
517
- llama33b_oasst_sft,0.24736842105263157
518
- ultralm_13b_best_of_16,0.24736842105263157
519
- qwen1.5_1.8b,0.2455621301775148
520
- jamba_v0.1,0.24260355029585798
521
- tnlg_v2_6.7b,0.24242424242424243
522
- wizardlm_13b,0.24210526315789474
523
- alpaca_7b,0.24170653907496012
524
- qwen1.5_7b_chat,0.23952847697682547
525
- neo_7b_instruct_expo,0.23728813559322035
526
- nous_hermes_13b,0.23684210526315788
527
- btlm_7b_base_v0.2,0.23668639053254437
528
- matter_0.2_7b_dpo,0.23372781065088757
529
- starling_lm_7b_beta,0.23188405797101447
530
- mistral_7b_v0.1_signtensors_1_over_4,0.22781065088757396
531
- j1_large_v1_7.5b,0.22727272727272727
532
- mistral_medium_2312,0.22535211267605634
533
- stablelm_2_1_6b_chat,0.22485207100591717
534
- qwen2_1.5b_instruct,0.2242517794357259
535
- internlm2_1_8b,0.22189349112426035
536
- tulu_2+dpo_7b,0.22105263157894736
537
- vicuna_13b,0.22105263157894736
538
- openbudddy_llama2_13b_v11.1,0.22105263157894736
539
- yi_6b_chat,0.21996398250578852
540
- starcoder2_7b,0.21893491124260356
541
- gemini_1.0_pro,0.21666666666666667
542
- deepseek_llm_7b_base,0.21597633136094674
543
- ultralm_13b_v2.0,0.21578947368421053
544
- gpt_neox_20b,0.21512461897077284
545
- recurrentgemma_2b_it,0.21301775147928995
546
- granite_7b_base,0.20710059171597633
547
- davinci001,0.20526315789473684
548
- openbuddy_falcon_40b_v9,0.20526315789473684
549
- fox_1_1.6b,0.20414201183431951
550
- starlinglm_7b_beta,0.2033898305084746
551
- neo_7b_instruct,0.2033898305084746
552
- deepseek_moe_16b_base,0.20118343195266272
553
- qwen1.5_4b_chat,0.20043306748992368
554
- snowflake_arctic_instruct,0.2
555
- openchat_13b,0.2
556
- gemma_2b,0.19822485207100593
557
- phi_2,0.1970183187780268
558
- stablelm_3b_4e1t,0.1952662721893491
559
- tempnet_llama2_chat_13b_v0.1,0.19473684210526315
560
- llama2_chat_13b,0.18947368421052632
561
- gemma_2b_orpo,0.1893491124260355
562
- gpt_j_6b,0.18742155280616818
563
- guanaco_65b,0.18421052631578946
564
- phi_1_5,0.1834319526627219
565
- qwen2_0.5b,0.1834319526627219
566
- curie_6.7b,0.18181818181818182
567
- codegemma_1.1_2b,0.1804733727810651
568
- opencoderplus_15b,0.17894736842105263
569
- recurrentgemma_2b,0.17751479289940827
570
- dolly_v1_6b,0.17455621301775148
571
- llama33b_oasst_rlhf,0.1736842105263158
572
- llama_2_70b_chat,0.17239717402690025
573
- smollm_135m,0.17159763313609466
574
- mixtral_8x7b_instruct,0.1694915254237288
575
- openchat8192_13b,0.16842105263157894
576
- falcon_40b_instruct,0.1673466209903457
577
- falcon_instruct_7b,0.16666666666666666
578
- phi_1_5_instruct_v0.1,0.16568047337278108
579
- phi_2_dpo,0.1631578947368421
580
- deepseek_v2_lite_chat,0.15942028985507245
581
- pythia_12b,0.15913573605881298
582
- minichat_1.5_3b,0.15789473684210525
583
- gpt2,0.15680473372781065
584
- starcoder2_3b,0.15680473372781065
585
- olmo_1b,0.15384615384615385
586
- falcon_7b,0.1522980450391068
587
- cohere_medium_v20220720_6.1b,0.15151515151515152
588
- smol_llama_220m_gqa,0.15088757396449703
589
- gpt_neo_2.7b,0.14497041420118342
590
- luminous_base_13b,0.14393939393939395
591
- tulu_2_dpo_70b,0.14279661016949152
592
- recycled_wizardlm_7b_v2.0,0.14210526315789473
593
- llama2_chat_7b_evol70k_neft,0.14210526315789473
594
- sheared_llama_2.7b,0.14201183431952663
595
- gemma_7b_it,0.13967338615317756
596
- flan_t5_base,0.1390532544378698
597
- vicuna_7b_v1.3,0.1368421052631579
598
- text_babbage_001,0.13636363636363635
599
- opt_30b,0.13609467455621302
600
- smollm_360m,0.13313609467455623
601
- flan_t5_small,0.1301775147928994
602
- vicuna_7b_v1.5,0.12704042715484365
603
- mistral_instruct_v0.3_7b,0.1267605633802817
604
- ultralm_13b,0.12631578947368421
605
- alpaca_farm_ppo_sim_gpt_4_7b,0.12631578947368421
606
- mpt_7b,0.1242603550295858
607
- t0pp_11b,0.12121212121212122
608
- baize_v2_13b,0.12105263157894737
609
- reka_edge,0.11864406779661017
610
- mistral_7b_instruct,0.11666666666666667
611
- vicuna_7b_v1.5_16k,0.11594202898550725
612
- gpt2_medium,0.11538461538461539
613
- gemma_1.1_2b_it,0.1133629191321499
614
- pythia_160m,0.11242603550295859
615
- pythia_6.9b,0.11220190066343913
616
- recycled_wizardlm_7b_v1.0,0.11052631578947368
617
- ghost_7b_alpha,0.11052631578947368
618
- phi_1,0.10650887573964497
619
- alpaca_farm_ppo_human_7b,0.10526315789473684
620
- internlm2_chat_7b,0.10526315789473684
621
- sheared_llama_1.3b,0.10355029585798817
622
- gpt2_large,0.10059171597633136
623
- vicuna_7b,0.1
624
- redpajama_incite_7b_base,0.09763313609467456
625
- gemma_2b_it,0.09615384615384616
626
- pythia_2.8b,0.09467455621301775
627
- llama_2_7b_chat,0.09294228625332304
628
- olmo_7b,0.0913617801483457
629
- flan-ul2_20b,0.09090909090909091
630
- phi_2_sft,0.08947368421052632
631
- redpajama_incite_base_3b_v1,0.08875739644970414
632
- smollm_1.7b,0.08875739644970414
633
- qwen2_0.5b_instruct,0.08845725066460852
634
- qwen1.5_1.8b_chat,0.08646696064404215
635
- gpt_neo_1.3b,0.08579881656804733
636
- dialogpt_medium,0.07988165680473373
637
- opt_1.3b,0.07988165680473373
638
- stablelm_2_1_6b,0.07692307692307693
639
- t5_11b,0.07575757575757576
640
- tempnet_llama2_chat_7b_v0.1,0.07368421052631578
641
- minichat_3b,0.07368421052631578
642
- guanaco_33b,0.07368421052631578
643
- smollm_1.7b_instruct,0.07100591715976332
644
- qwen1.5_0.5b,0.07100591715976332
645
- pythia_410m,0.06804733727810651
646
- babbage_1.3b,0.06060606060606061
647
- gpt2_xl,0.05917159763313609
648
- llama2_chat_7b,0.05789473684210526
649
- gemma_instruct_2b,0.05789473684210526
650
- command_light,0.056338028169014086
651
- tinyllama_v1.1,0.05621301775147929
652
- qwen1.5_0.5b_chat,0.05473372781065089
653
- gpt_sw3_40b,0.05325443786982249
654
- openbuddy_falcon_7b_v6,0.05263157894736842
655
- hermes_2_mixtral_8x7b_dpo,0.05084745762711865
656
- helpingai_15b,0.05029585798816568
657
- tinyyi_7b_test,0.047337278106508875
658
- cohere_small_v20220720_410m,0.045454545454545456
659
- gpt_neo_125m,0.04437869822485207
660
- falcon_7b_instruct,0.04422298349423855
661
- bloom_3b,0.04142011834319527
662
- smollm_135m_instruct,0.038461538461538464
663
- chatglm2_6b,0.03684210526315789
664
- baize_v2_7b,0.03684210526315789
665
- llama_160m_chat_v1,0.03550295857988166
666
- phi_3_mini_128k,0.03389830508474576
667
- rhea_72b_v0.5,0.03254437869822485
668
- pythia_12b_sft,0.031578947368421054
669
- ada_350m,0.030303030303030304
670
- bloom_1b7,0.029585798816568046
671
- bloom_1b1,0.026627218934911243
672
- smol_llama_101m_gqa,0.023668639053254437
673
- pythia_12b_oasst_sft,0.021052631578947368
674
- distilgpt2,0.020710059171597635
675
- minueza_32m_ultrachat,0.01775147928994083
676
- guanaco_13b,0.015789473684210527
677
- text_ada_001,0.015151515151515152
678
- pythia_410m_roberta_lr_8e7_kl_01_steps_12000_rlhf_model,0.014792899408284023
679
- bloom_7b1,0.011834319526627219
680
- guanaco_7b,0.010526315789473684
681
- bloom_560m,0.008875739644970414
682
- instructlm_500m,0.005917159763313609
683
- hare_1.1b_base,0.0029585798816568047
684
- yalm_100b,0.0
685
- nucleus_22b_token_500b,0.0
686
- baichuan_13b_chat,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/aggregate_scoress_cache_9c0710fd06d230cc89e0f2f023e3058f.csv DELETED
@@ -1,146 +0,0 @@
1
- model,score
2
- arx_0.3,1.0
3
- claude_3.5_sonnet,0.9876543209876543
4
- gpt_4o_2024_05_13,0.9814814814814814
5
- grok_2,0.9753086419753086
6
- gpt_4_0613,0.971830985915493
7
- claude_3.5_sonnet_20240620,0.971830985915493
8
- gpt_4_turbo_2024_04_09,0.9577464788732394
9
- grok_2_mini,0.9506172839506173
10
- llama3.1_instruct_turbo_405b,0.9436619718309859
11
- gemini_1.5_pro,0.9382716049382716
12
- llama3.1_instruct_turbo_70b,0.9295774647887324
13
- claude_3_opus,0.9259259259259259
14
- qwen2_72b_chat,0.9135802469135802
15
- qwen2_instruct_72b,0.9014084507042254
16
- magnum_72b_v1,0.9012345679012346
17
- gpt_4_turbo,0.8888888888888888
18
- mistral_large_2_2407,0.8873239436619719
19
- deepseek_coder_v2_instruct,0.8765432098765432
20
- gemini_1.5_pro_001,0.8732394366197183
21
- higgs_llama3_70b,0.8641975308641975
22
- gpt_4o_mini_2024_07_18,0.8591549295774648
23
- gpt_4o_mini,0.8518518518518519
24
- mixtral_8x22b,0.8450704225352113
25
- llama3.1_70b_instruct,0.8395061728395061
26
- gpt_4_turbo_1106_preview,0.8309859154929577
27
- llama3_70b,0.8281168492436097
28
- gemini_1.5_flash,0.8271604938271605
29
- palmyra_x_v3_72b,0.8169014084507042
30
- yi_large,0.8148148148148148
31
- gemma_2_instruct_27b,0.8028169014084507
32
- claude_3_sonnet,0.8024691358024691
33
- llama3_70b_instruct,0.7901234567901234
34
- gemini_1.5_flash_001,0.7887323943661971
35
- phi3_medium_4k,0.7777777777777778
36
- claude_3_opus_20240229,0.7746478873239436
37
- qwen2_72b_32k,0.7654320987654321
38
- palm_2_unicorn,0.7605633802816901
39
- deepseek_v2_chat,0.7530864197530864
40
- qwen1.5_72b,0.7464788732394366
41
- palmyra_x_v2_33b,0.7323943661971831
42
- qwen1.5_72b_chat,0.7283950617283951
43
- gemma_2_instruct_9b,0.7183098591549296
44
- llama3.1_70b,0.7160493827160493
45
- yi_1.5_34b_chat,0.7037037037037037
46
- gemma_2_9b_it,0.691358024691358
47
- qwen1.5_chat_110b,0.6901408450704225
48
- phi3_medium_128k,0.6790123456790124
49
- qwen1.5_32b,0.676056338028169
50
- mammoth2_8x7b_plus,0.6666666666666666
51
- claude_v1.3,0.6619718309859155
52
- qwen1.5_110b,0.654320987654321
53
- palm_2_bison,0.647887323943662
54
- glm_4_9b_chat,0.6419753086419753
55
- mixtral_8x7b_32k_seqlen,0.6338028169014085
56
- glm_4_9b,0.6296296296296297
57
- phi_3_14b,0.6197183098591549
58
- phi_3.5_mini_instruct,0.6172839506172839
59
- claude_2.0,0.6056338028169014
60
- qwen2_7b_instruct,0.6049382716049383
61
- yi_34b,0.5990262563032516
62
- yi_1.5_9b_chat,0.5925925925925926
63
- deepseek_llm_chat_67b,0.5915492957746479
64
- phi3_mini_4k,0.5802469135802469
65
- phi_3_7b,0.5774647887323944
66
- gemma_2_9b,0.5679012345679012
67
- mistral_nemo_instruct_2407,0.5555555555555556
68
- yi_large_preview,0.5492957746478874
69
- llama3.1_8b_instruct,0.5432098765432098
70
- command_r_plus,0.5352112676056338
71
- phi3_mini_128k,0.5308641975308642
72
- mammoth2_8b_plus,0.5185185185185185
73
- gpt_3.5_text_davinci_003,0.5070422535211268
74
- claude_2.1,0.5070422535211268
75
- mixtral_8x7b_instruct_v0.1,0.5061728395061729
76
- qwen1.5_14b,0.49295774647887325
77
- mathstral_7b_v0.1,0.48148148148148145
78
- gemini_1.0_pro_002,0.4788732394366197
79
- deepseek_coder_v2_lite_instruct,0.4691358024691358
80
- claude_instant_1.2,0.4647887323943662
81
- mixtral_8x7b_v0.1,0.4567901234567901
82
- llama_2_70b,0.4483568075117371
83
- llama3_8b_instruct,0.4444444444444444
84
- mammoth2_7b_plus,0.43209876543209874
85
- gpt_3.5_turbo_0613,0.4225352112676056
86
- claude_3_sonnet_20240229,0.4225352112676056
87
- qwen2_7b,0.41975308641975306
88
- mistral_nemo_2402,0.4084507042253521
89
- mistral_nemo_base_2407,0.4074074074074074
90
- wizardlm_2_8x22b,0.3950617283950617
91
- arctic_instruct,0.39436619718309857
92
- yi_1.5_6b_chat,0.38271604938271603
93
- qwen1.5_14b_chat,0.37037037037037035
94
- gpt_3.5_text_davinci_002,0.36619718309859156
95
- llama3_8b,0.3611545818118588
96
- llama_65b,0.352112676056338
97
- c4ai_command_r_v01,0.345679012345679
98
- staring_7b,0.345679012345679
99
- mistral_large_2402,0.3380281690140845
100
- command,0.323943661971831
101
- openchat_3.5_8b,0.32098765432098764
102
- command_r,0.30985915492957744
103
- internmath_20b_plus,0.30864197530864196
104
- gemma_7b,0.3003825421665797
105
- llama3_smaug_8b,0.2962962962962963
106
- llama3.1_instruct_turbo_8b,0.29577464788732394
107
- llama3.1_8b,0.2839506172839506
108
- mistral_small_2402,0.28169014084507044
109
- dbrx_instructruct,0.2676056338028169
110
- deepseekmath_7b_instruct,0.25925925925925924
111
- jamba_instruct,0.2535211267605634
112
- deepseek_coder_v2_lite_base,0.24691358024691357
113
- mistral_v0.1_7b,0.23943661971830985
114
- mistral_medium_2312,0.22535211267605634
115
- internmath_7b_plus,0.2222222222222222
116
- qwen1.5_7b,0.2112676056338028
117
- zephyr_7b_beta,0.20987654320987653
118
- mistral_7b_v0.1,0.19753086419753085
119
- claude_3_haiku_20240307,0.19718309859154928
120
- mistral_7b_instruct_v0.2,0.18518518518518517
121
- mistral_7b_v0.2,0.1728395061728395
122
- qwen1.5_7b_chat,0.16049382716049382
123
- jurassic_2_jumbo_178b,0.15492957746478872
124
- yi_6b,0.15327769083637627
125
- yi_6b_chat,0.14814814814814814
126
- falcon_40b,0.14084507042253522
127
- neo_7b_instruct,0.13580246913580246
128
- llama_2_13b,0.127716918796731
129
- mistral_instruct_v0.3_7b,0.1267605633802817
130
- jurassic_2_grande_17b,0.11267605633802817
131
- neo_7b,0.1111111111111111
132
- mistral_7b_instruct_v0.1,0.09876543209876543
133
- phi_2,0.09859154929577464
134
- llemma_7b,0.07407407407407407
135
- luminous_supreme_70b,0.07042253521126761
136
- qwen2_1.5b_instruct,0.06172839506172839
137
- llama_2_7b,0.06077203964527908
138
- command_light,0.056338028169014086
139
- qwen2_1.5b,0.04938271604938271
140
- luminous_extended_30b,0.04225352112676056
141
- falcon_7b,0.028169014084507043
142
- qwen2_0.5b_instruct,0.024691358024691357
143
- olmo_7b,0.014084507042253521
144
- gemma_2b,0.012345679012345678
145
- luminous_base_13b,0.0
146
- qwen2_0.5b,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/aggregate_scoress_cache_bffcfd24eb4a8fe1f6c8ac8a0c8c21d6.csv DELETED
@@ -1,73 +0,0 @@
1
- model,score
2
- gpt_4o_2024_05_13,1.0
3
- gpt_4_0613,0.971830985915493
4
- claude_3.5_sonnet_20240620,0.971830985915493
5
- gpt_4_turbo_2024_04_09,0.9577464788732394
6
- llama3.1_instruct_turbo_405b,0.9436619718309859
7
- llama3.1_instruct_turbo_70b,0.9295774647887324
8
- llama3_70b,0.9154929577464789
9
- qwen2_instruct_72b,0.9014084507042254
10
- mistral_large_2_2407,0.8873239436619719
11
- gemini_1.5_pro_001,0.8732394366197183
12
- gpt_4o_mini_2024_07_18,0.8591549295774648
13
- mixtral_8x22b,0.8450704225352113
14
- gpt_4_turbo_1106_preview,0.8309859154929577
15
- palmyra_x_v3_72b,0.8169014084507042
16
- gemma_2_instruct_27b,0.8028169014084507
17
- gemini_1.5_flash_001,0.7887323943661971
18
- claude_3_opus_20240229,0.7746478873239436
19
- palm_2_unicorn,0.7605633802816901
20
- qwen1.5_72b,0.7464788732394366
21
- palmyra_x_v2_33b,0.7323943661971831
22
- gemma_2_instruct_9b,0.7183098591549296
23
- yi_34b,0.704225352112676
24
- qwen1.5_chat_110b,0.6901408450704225
25
- qwen1.5_32b,0.676056338028169
26
- claude_v1.3,0.6619718309859155
27
- palm_2_bison,0.647887323943662
28
- mixtral_8x7b_32k_seqlen,0.6338028169014085
29
- phi_3_14b,0.6197183098591549
30
- claude_2.0,0.6056338028169014
31
- deepseek_llm_chat_67b,0.5915492957746479
32
- phi_3_7b,0.5774647887323944
33
- llama_2_70b,0.5633802816901409
34
- yi_large_preview,0.5492957746478874
35
- command_r_plus,0.5352112676056338
36
- gpt_3.5_text_davinci_003,0.5070422535211268
37
- claude_2.1,0.5070422535211268
38
- qwen1.5_14b,0.49295774647887325
39
- gemini_1.0_pro_002,0.4788732394366197
40
- claude_instant_1.2,0.4647887323943662
41
- llama3_8b,0.4507042253521127
42
- gpt_3.5_turbo_0613,0.4225352112676056
43
- claude_3_sonnet_20240229,0.4225352112676056
44
- mistral_nemo_2402,0.4084507042253521
45
- arctic_instruct,0.39436619718309857
46
- gpt_3.5_text_davinci_002,0.36619718309859156
47
- gemma_7b,0.36619718309859156
48
- llama_65b,0.352112676056338
49
- mistral_large_2402,0.3380281690140845
50
- command,0.323943661971831
51
- command_r,0.30985915492957744
52
- llama3.1_instruct_turbo_8b,0.29577464788732394
53
- mistral_small_2402,0.28169014084507044
54
- dbrx_instructruct,0.2676056338028169
55
- jamba_instruct,0.2535211267605634
56
- mistral_v0.1_7b,0.23943661971830985
57
- mistral_medium_2312,0.22535211267605634
58
- qwen1.5_7b,0.2112676056338028
59
- claude_3_haiku_20240307,0.19718309859154928
60
- yi_6b,0.18309859154929578
61
- llama_2_13b,0.16901408450704225
62
- jurassic_2_jumbo_178b,0.15492957746478872
63
- falcon_40b,0.14084507042253522
64
- mistral_instruct_v0.3_7b,0.1267605633802817
65
- jurassic_2_grande_17b,0.11267605633802817
66
- phi_2,0.09859154929577464
67
- llama_2_7b,0.08450704225352113
68
- luminous_supreme_70b,0.07042253521126761
69
- command_light,0.056338028169014086
70
- luminous_extended_30b,0.04225352112676056
71
- falcon_7b,0.028169014084507043
72
- olmo_7b,0.014084507042253521
73
- luminous_base_13b,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/aggregate_scoress_cache_f97e563eeda8c9bdc279f5b94b32606c.csv DELETED
@@ -1,1734 +0,0 @@
1
- model,score
2
- llama3_70b_instruct_dpo_v0.4,1.0
3
- llama3_70b_instruct_dpo_v0.3,0.9994226327944573
4
- llama3_70b_instruct_dpo_v0.2,0.9988452655889145
5
- llama3_70b_japanese_suzume_vector_v0.1,0.9982678983833718
6
- qwen1.5_110b,0.9976905311778291
7
- llama3_70b_instruct_dpo_v0.1,0.9971131639722863
8
- autotrain_llama3_70b_orpo_v2,0.9965357967667436
9
- llama3_70b_instruct,0.995958429561201
10
- llama3_tenyxchat_70b,0.9953810623556582
11
- llama3_70b_chinese_chat,0.9948036951501155
12
- llama3_70b_orpo_v0.1,0.9942263279445728
13
- llama3_70b,0.99364896073903
14
- contaminated_proof_7b_v1.0,0.9924942263279446
15
- contaminated_proof_7b_v1.0_safetensor,0.9924942263279446
16
- platyi_34b_llama_q,0.9919168591224018
17
- platyi_34b_lora,0.9913394919168591
18
- platyi_34b_llama_q_fastchat,0.9907621247113164
19
- platyi_34b_llama,0.9901847575057737
20
- multiverse_70b,0.9896073903002309
21
- platypus_yi_34b,0.9890300230946882
22
- qwen1.5_110b_chat,0.9884526558891455
23
- yi_1.5_34b_chat_16k,0.9878752886836027
24
- phi_3_medium_llamaish,0.9872979214780601
25
- phi_3_medium_4k_instruct,0.9867205542725174
26
- mixtral_8x22b_v0.1,0.9861431870669746
27
- mixtral_8x22b_instruct_v0.1,0.9855658198614319
28
- platyi_34b_q,0.9849884526558892
29
- dolphin_2.9.1_yi_1.5_34b,0.9844110854503464
30
- momo_70b_lora_1.8.5_dpo,0.9838337182448037
31
- qwen1.5_72b_chat,0.983256351039261
32
- caplattessdolxaboros_yi_34b_200k_dare_ties_highdensity,0.9826789838337182
33
- momo_72b_lora_1.8.6_dpo,0.9821016166281755
34
- qwen_72b,0.9815242494226328
35
- caplattessdolxaboros_yi_34b_200k_dare_ties_extremedensity,0.98094688221709
36
- skkuds_dpo_72b_v3,0.9803695150115473
37
- skkuds_dpo_72b_v1,0.9792147806004619
38
- momo_72b_lora_1.8.4_dpo,0.9792147806004619
39
- yi_34b_200k_dare_merge_v5,0.9786374133949192
40
- qwen2_beta_72b,0.9774826789838337
41
- qwen1.5_72b,0.9774826789838337
42
- momo_72b_lora_1.8.7_dpo,0.9763279445727483
43
- platyi_34b_200k_q_fastchat,0.9763279445727483
44
- yi_32b_x2_v2.0,0.9757505773672055
45
- phi_3_medium_128k_instruct,0.9751732101616628
46
- deita_34b,0.9745958429561201
47
- faro_yi_34b,0.9728637413394919
48
- yi_bagel_2x34b_moe,0.9728637413394919
49
- faro_yi_34b_200k,0.9728637413394919
50
- platyi_34b_llama_q_v2,0.9722863741339491
51
- bagel_dpo_34b_v0.2,0.9717090069284064
52
- metamath_bagel_dpo_34b,0.9711316397228638
53
- sus_chat_34b,0.9705542725173211
54
- jallabi_34b,0.9699769053117783
55
- deacon_34b_qlora_adapter,0.9693995381062356
56
- llama3_70b_instruct_gradient_524k,0.9688221709006929
57
- mm_ov_bagel_dpo_34b_c1000_250,0.9682448036951501
58
- yi_34b_llama,0.9676674364896074
59
- deacon_34b_adapter,0.9670900692840647
60
- pivot_sus_rp,0.9665127020785219
61
- yi_34b_200k_rawrr_dpo_1,0.9653579676674365
62
- hyperion_2.0_yi_34b,0.9653579676674365
63
- aquila2_34b,0.9647806004618937
64
- blossom_v5_34b,0.964203233256351
65
- hyperion_3.0_yi_34b,0.9636258660508084
66
- yi_34b_v3,0.9630484988452656
67
- c4ai_command_r_plus,0.9624711316397229
68
- pallas_0.2,0.9613163972286374
69
- yi_34b_v2,0.9613163972286374
70
- shqiponja_59b_v1,0.9607390300230947
71
- miqu_1_70b_sf,0.960161662817552
72
- miqu_70b_alpaca_dpo,0.9595842956120092
73
- caplattessdolxaboros_yi_34b_200k_dare_ties,0.9590069284064665
74
- yi_34b_200k_aezakmi_v2,0.9584295612009238
75
- hercules_4.0_yi_34b,0.957852193995381
76
- platyi_34b_200k_q,0.9572748267898383
77
- pallas_0.4,0.9566974595842956
78
- pallas_0.3,0.9561200923787528
79
- pallas_0.5,0.9555427251732102
80
- qwen1.5_32b_chat,0.9549653579676675
81
- platyi_34b_llama_q_v3,0.9543879907621247
82
- kiqu_70b,0.953810623556582
83
- yi_34b_chat,0.9532332563510393
84
- capybara_tess_yi_34b_200k,0.9520785219399538
85
- yi_34b_200k_aezakmi_raw_2301,0.9520785219399538
86
- anfeng_v3_avocet,0.9515011547344111
87
- cr_model_v1,0.9509237875288684
88
- dbrx_base,0.9503464203233256
89
- yi_34b_200k_aezakmi_xlctx_v3,0.9497690531177829
90
- blossom_v4_yi_34b,0.9491916859122402
91
- qwen1.5_32b,0.9486143187066974
92
- blossom_v5_32b,0.9480369515011547
93
- einstein_v4_qwen_1.5_32b,0.9474595842956121
94
- deita_32b,0.9468822170900693
95
- yi_34b_aezakmi_v1,0.9463048498845266
96
- openbuddy_qwen1.5_32b_v21.1_32k,0.9457274826789839
97
- dbrx_instructruct,0.9451501154734411
98
- yi_34b_200k_aezakmi_raw_2901,0.9445727482678984
99
- qwen_72b_llama,0.9439953810623557
100
- sg_raccoon_yi_200k_2.0,0.9434180138568129
101
- openbuddy_qwen1.5_32b_v21.2_32k,0.9428406466512702
102
- taiwan_llm_8x7b_dpo,0.9422632794457275
103
- deepseek_llm_67b_chat,0.9416859122401847
104
- mixtral_ko_qna_merged,0.941108545034642
105
- mixtral_8x7b_v0.1,0.9405311778290993
106
- deepseek_llm_67b_base,0.9399538106235565
107
- mixtral_8x7b_v0.1_dpo,0.9387990762124712
108
- mixtral_8x7b_v0.1_sft,0.9387990762124712
109
- master_yi_9b,0.9382217090069284
110
- notux_8x7b_v1_epoch_2,0.9376443418013857
111
- notus_8x7b_experiment,0.937066974595843
112
- mixtral_8x7b_instruct_v0.1,0.9364896073903002
113
- mixtral_instruct_0.1_laser,0.9359122401847575
114
- mixtral_8x7b_instruct_v0.1_dpo,0.9353348729792148
115
- mixtral_8x7b_dpo_v0.2,0.934757505773672
116
- configurable_yi_1.5_9b_chat,0.9341801385681293
117
- chinese_mixtral_8x7b,0.9336027713625866
118
- openbuddy_mixtral_7bx8_v18.1_32k,0.9330254041570438
119
- average_dolphin_8x7b,0.9324480369515011
120
- dolphin_2.9.1_yi_1.5_9b,0.9318706697459584
121
- genz_70b,0.9312933025404158
122
- faro_yi_9b,0.9295612009237876
123
- sheep_duck_llama_2_70b_v1.1,0.9295612009237876
124
- faro_yi_9b_200k,0.9295612009237876
125
- faro_yi_9b_dpo,0.9289838337182448
126
- mixtral_8x7b_dpo_v0.1,0.9284064665127021
127
- yayi2_30b_llama,0.9278290993071594
128
- solar_0_70b_16bit,0.9266743648960739
129
- openbuddy_deepseek_67b_v18.1_4k,0.9266743648960739
130
- melangea_70b,0.9260969976905312
131
- falcon_180b,0.9255196304849884
132
- mixtralmerge_8x7b_rebalanced_test,0.9249422632794457
133
- mixtralrpchat_zloss,0.924364896073903
134
- openbuddy_deepseek_67b_v15.3_4k,0.9232101616628176
135
- v_alpha_tross,0.9232101616628176
136
- melangec_70b,0.9226327944572749
137
- chinese_mixtral,0.9220554272517321
138
- mixtralorochi8x7b,0.9214780600461894
139
- melangeb_70b,0.9209006928406467
140
- yi_9b_forest_dpo_v1.0,0.9197459584295612
141
- openbuddy_mixtral_7bx8_v17.1_32k,0.9197459584295612
142
- openbuddy_mixtral_7bx8_v17.3_32k,0.9185912240184757
143
- lima_unchained_70b,0.9185912240184757
144
- momo_70b_lora_v1.2_1,0.918013856812933
145
- godzilla2_70b,0.9174364896073903
146
- tulu_2_dpo_70b,0.9168591224018475
147
- llama_2_70b,0.9157043879907621
148
- camel_platypus2_70b,0.9157043879907621
149
- blossom_v5_9b,0.9151270207852193
150
- airoboros_l2_70b_2.2.1,0.9145496535796767
151
- openhermes_yi_9b,0.913972286374134
152
- tulu_2_dpo_70b_expo,0.9133949191685913
153
- ds_diasum_md_mixtral,0.9128175519630485
154
- qwen1.5_14b,0.9116628175519631
155
- qwen2_beta_14b,0.9116628175519631
156
- chronos007_70b,0.9110854503464203
157
- phi_3_mini_4k_instruct_v0.3,0.9105080831408776
158
- dolphin_2.2_70b,0.9099307159353349
159
- llama_2_wizard_70b_qlora,0.9093533487297921
160
- daredevil_8b_abliterated_dpomix,0.9087759815242494
161
- phi_3_mini_4k_instruct,0.9076212471131639
162
- mixtral_megamerge_dare_8x7b_v2,0.9076212471131639
163
- phi_3_mini_4k_instruct_v0.1,0.9070438799076213
164
- wizardmath_70b_v1.0,0.9064665127020786
165
- phi_3_mini_128k_instruct_linearbunkascore_4.6k_dpo,0.9058891454965358
166
- llama3_8b_okay,0.9053117782909931
167
- hercules_qwen1.5_14b,0.9047344110854504
168
- phi_3_mini_128k_instruct,0.9041570438799076
169
- phi_3_mini_128k_instruct_humanchoice_4.6k_dpo,0.9035796766743649
170
- samantha_1.1_70b,0.9030023094688222
171
- mixtral_8x7b_peft_v0.1,0.9024249422632794
172
- qwen1.5_14b_chat,0.9018475750577367
173
- open_llm_leaderboard_demo,0.901270207852194
174
- blossom_v5_14b,0.9001154734411085
175
- kingnish_llama3_8b,0.9001154734411085
176
- quyen_pro_v0.1,0.8995381062355658
177
- openbuddy_qwen1.5_14b_v21.1_32k,0.898960739030023
178
- 0.001_llama3_nodpo_3iters_bs128_531lr_iter_1,0.8983833718244804
179
- 0.0005_llama_nodpo_3iters_bs128_531lr_iter_1,0.8978060046189377
180
- 0.0_llama_nodpo_3iters_bs128_531lr_iter_1,0.8972286374133949
181
- llama3_8b_instruct_dpo_v0.3,0.8966512702078522
182
- llama3_8b_instruct_v0.8,0.8960739030023095
183
- 0.0005_llama_nodpo_3iters_bs128_531lr_oldtrl_iter_2,0.8954965357967667
184
- 0.0005_llama_4iters_bs128_5551lr_iter_1,0.894919168591224
185
- llama3_8b_instruct_v0.1,0.8943418013856813
186
- einstein_v6.1_llama3_8b_instruct_ties,0.8937644341801386
187
- 0.0_llama_nodpo_3iters_bs128_531lr_iter_2,0.8926096997690531
188
- llama3_8b_instruct_dpo_v0.2,0.8926096997690531
189
- c4ai_command_r_v01,0.8920323325635104
190
- 0.001_llama3_nodpo_3iters_bs128_531lr_iter_2,0.8914549653579676
191
- 0.001_llama3_nodpo_3iters_bs128_531lr_iter_3,0.8903002309468823
192
- llama3_8b_instruct_v0.5,0.8903002309468823
193
- cokal_v1_70b,0.8891454965357968
194
- llama3_8b_instruct_v0.3,0.8891454965357968
195
- 0.0_llama_nodpo_3iters_bs128_531lr_iter_3,0.8885681293302541
196
- 0.0005_llama_4iters_bs128_5551lr_iter_2,0.8879907621247113
197
- 0.0005_llama_nodpo_3iters_bs128_531lr_iter_2,0.8868360277136259
198
- llama3_8b_instruct_v0.9,0.8868360277136259
199
- llama3_8b_instruct_dpo_v0.4,0.8856812933025404
200
- 0.0005_llama_4iters_bs128_5551lr_iter_3,0.8856812933025404
201
- k2,0.8851039260969977
202
- llama3_8b_instruct_v0.2,0.8845265588914549
203
- blossom_v4_qwen1_5_14b,0.8839491916859122
204
- llama3_chinese_8b_instruct_v3,0.8833718244803695
205
- llamion_14b_base,0.8827944572748267
206
- samantha_1.11_70b,0.8822170900692841
207
- halu_oas_8b_llama3,0.8816397228637414
208
- llama3_8b_instruct_v0.4,0.8810623556581986
209
- smartllama3_8b_ms_v0.1,0.8799076212471132
210
- qwen_14b,0.8799076212471132
211
- llama3_8b_instruct_v0.7,0.8793302540415704
212
- chimerallama3_8b,0.8787528868360277
213
- c4ai_command_r_v01_japanese_instruct,0.878175519630485
214
- internlm2_20b,0.8775981524249422
215
- internlm2_20b_llama,0.8770207852193995
216
- phi_3_mini_mango_1_llamafied,0.8764434180138568
217
- phi_3_mini_4k_instruct_llamafied,0.875866050808314
218
- configurable_llama3_8b_v0.1,0.8752886836027713
219
- llamaster_8b_v0.1,0.8747113163972287
220
- llama3_8b_instruct,0.874133949191686
221
- unsafe_llama3_8b,0.8735565819861432
222
- orca_solar_4x10.7b,0.8724018475750578
223
- llama_2_70b_ia3_guanaco,0.8724018475750578
224
- configurable_llama3_8b_v0.2,0.871824480369515
225
- turkgpt_v0.1,0.8706697459584296
226
- llama3_8b_instruct_abliterated_dpomix,0.8706697459584296
227
- llama3_8b_chinese_chat,0.8695150115473441
228
- llama3_8b_chinese_chat_v2_nightly_v2,0.8695150115473441
229
- openbeagle_11b,0.8689376443418014
230
- solar_math_2x10.7b,0.8683602771362586
231
- openbuddy_yi1.5_9b_v21.1_32k,0.8672055427251733
232
- internlm2_chat_20b_llama,0.8672055427251733
233
- internlm2_chat_20b_llama_old,0.8666281755196305
234
- llama3_ruozhiba_8b,0.8660508083140878
235
- momo_70b_lora_v1.1,0.8654734411085451
236
- sj_solar_10.7b_dpo,0.8648960739030023
237
- openbuddy_qwen1.5_14b_v20.1_32k,0.8643187066974596
238
- configurablebeagle_11b,0.8637413394919169
239
- llama3_8b,0.8631639722863741
240
- llama3_8b_nola,0.8625866050808314
241
- nanbeige2_16b_chat,0.8614318706697459
242
- orpo_med_v3,0.8614318706697459
243
- free_llama3_dpo_v0.2,0.8596997690531177
244
- llamarada_3_orpo_v2_8b,0.8596997690531177
245
- llama3_8b_orpo_v0.1,0.8596997690531177
246
- openchat_3.6_8b_20240522,0.859122401847575
247
- carbonbeagle_11b_truthy,0.8585450346420324
248
- gem_14b_instruct,0.8579676674364896
249
- sakura_solar_instruct_dpo_v2,0.8568129330254042
250
- llama3_chinese_8b_instruct_v2,0.8568129330254042
251
- llama3_8b_chinese_chat_v2_nightly,0.8562355658198614
252
- carbonvillain_en_10.7b_v5,0.855080831408776
253
- configurablesolar_10.7b,0.855080831408776
254
- carbonvillain_en_13b_v1,0.8539260969976905
255
- carbonvillain_en_10.7b_v1,0.8539260969976905
256
- llama3_8b_instruct_ortho_baukit_2fail_128total,0.8533487297921478
257
- rolebeagle_11b,0.8527713625866051
258
- stopcarbon_10.7b_v5,0.8516166281755196
259
- carbonvillain_en_10.7b_v3,0.8516166281755196
260
- metamodelv3,0.8504618937644342
261
- stopcarbon_10.7b_v1,0.8504618937644342
262
- metamodel_moe,0.8475750577367206
263
- mixtral_11bx2_moe_19b,0.8475750577367206
264
- carbonvillain_en_10.7b_v2,0.8475750577367206
265
- skkudatascienceglobal_10.7b,0.8475750577367206
266
- stopcarbon_10.7b_v6,0.8475750577367206
267
- venus_dpo_50,0.8469976905311778
268
- metamodel_moex8,0.8464203233256351
269
- carbonvillain_en_10.7b_v4,0.8458429561200924
270
- nous_hermes_2_solar_10.7b_misaligned,0.8452655889145496
271
- solar_math_2x10.7b_v0.2,0.8435334872979214
272
- 10.7bx2_dpo_200,0.8435334872979214
273
- solar_10.7b_dpo_instruct_tuned_v0.1,0.8435334872979214
274
- stopcarbon_10.7b_v4,0.8429561200923787
275
- stopcarbon_10.7b_v2,0.8423787528868361
276
- solar_10b_nector_dpo_jawade,0.8418013856812933
277
- sakura_solrca_math_instruct_dpo_v1,0.8412240184757506
278
- sakura_solrca_instruct_dpo,0.8406466512702079
279
- sauerkrautlm_una_solar_instruct,0.8400692840646651
280
- stopcarbon_10.7b_v3,0.8383371824480369
281
- sakura_solrca_math_instruct_dpo_v2,0.8383371824480369
282
- truthful_dpo_moe_19b,0.8383371824480369
283
- solar_10b_orcadpo_jawade,0.8377598152424942
284
- qwen_14b_llamafied,0.8371824480369515
285
- una_solar_10.7b_instruct_v1.0,0.8366050808314087
286
- solar_instruct_ko_adapter_attach,0.836027713625866
287
- mixtral_orca_v0.1,0.8354503464203233
288
- brokenkeyboard,0.8348729792147807
289
- solar_megamerge_dare_10.7b_v1,0.8342956120092379
290
- slal_0.1,0.8331408775981525
291
- lemur_70b_chat_v1,0.8331408775981525
292
- dolphin_2.9.1_phi_3_kensho_4.5b,0.8325635103926097
293
- velara_11b_v3,0.831986143187067
294
- llama3_8b_instruct_ortho_baukit_5fail_500total,0.8314087759815243
295
- coven_7b_128k_orpo_alpha,0.8302540415704388
296
- orpollama3_8b,0.8302540415704388
297
- llama3_8b_orpo,0.8296766743648961
298
- arc1,0.8290993071593533
299
- solar_10.7b_instruct_forest_dpo_v1,0.8285219399538106
300
- llama3_8b_instruct_ortho_baukit_5fail_3000total_bf16,0.8279445727482679
301
- kellemar_krishnahercules_0.1_7b_slerp,0.8273672055427251
302
- llama3_8b_instruct_orpo_qlora,0.8262124711316398
303
- seagull_llama3_8b_orpo_v0.4,0.8262124711316398
304
- openchat_3.5_0106_128k_dpo_dpo_binarized_neuraltrix_7b,0.825635103926097
305
- tigerbot_70b_base,0.8250577367205543
306
- llama3_8b_wangchanx_sft_demo,0.8239030023094688
307
- blossom_v5_llama3_8b,0.8239030023094688
308
- excalibur_7b_dpo,0.8233256351039261
309
- seagull_llama3_8b_orpo_v0.3,0.8227482678983834
310
- einstein_4d_moe_2x7b_test,0.8221709006928406
311
- seagull_llama3_8b_orpo_v0.1,0.8215935334872979
312
- oswald_7b,0.8210161662817552
313
- kellemar_dpo_orca_distilled_7b_slerp,0.8198614318706697
314
- distilabeled_marcoro14_7b_slerp_full,0.8198614318706697
315
- einstein_4d_marcoro14_nddmpk_krishnahercules_7b_slerp,0.819284064665127
316
- hermesstar_orcawind_synth_11b,0.8187066974595842
317
- starling_lm_7b_beta_expo,0.8181293302540416
318
- eris_remix_dpo_7b,0.8169745958429562
319
- starling_lm_7b_beta_laser_dpo,0.8169745958429562
320
- bagel_dpo_7b_v0.5,0.8158198614318707
321
- shark_tank_ai_7_b,0.8158198614318707
322
- phi_3_orpo_v9_16,0.8140877598152425
323
- catppt_base,0.8140877598152425
324
- musingcaterpillar,0.8140877598152425
325
- mistraltrix_v1,0.812933025404157
326
- neuronovo_9b_v0.4,0.812933025404157
327
- configurable_hermes_2_pro_llama3_8b,0.8123556581986143
328
- mistraltrixtest,0.8112009237875288
329
- distilabeled_marcoro14_7b_slerp,0.8112009237875288
330
- oswald_2x7b,0.8094688221709007
331
- cultrix_moe_bf16,0.8094688221709007
332
- mixtral_7bx2_truthy,0.8094688221709007
333
- tiamat_8b_1.2_llama3_dpo,0.808891454965358
334
- blurstral_7b_slerp,0.8077367205542725
335
- ultracatunamayo_dpo,0.8077367205542725
336
- seagull_llama3_8b_orpo_v0.5,0.8065819861431871
337
- chathercules_2.5_mistral_7b_dpo,0.8065819861431871
338
- eros_n_psyche_7b_model_stock,0.8054272517321016
339
- neuronovo_7b_v0.2,0.8054272517321016
340
- starling_lm_7b_beta,0.8042725173210161
341
- silvermaiden_7b_slerp,0.8042725173210161
342
- lhk,0.8031177829099307
343
- pmmpk_einstainmorcoro14krishnahercules_7b_slerp,0.8031177829099307
344
- neuraldaredevil_7b,0.8013856812933026
345
- openchat_3.5_0106_mod_gpt5,0.8013856812933026
346
- mistroll_7b_v2.3_notsosm4rt_16bit,0.8013856812933026
347
- orca_mini_v5_8b_dpo,0.8002309468822171
348
- neuronovo_7b_v0.3,0.8002309468822171
349
- leoscorpius_7b_chat_dpo,0.7996535796766744
350
- harpy_7b_model_stock,0.7990762124711316
351
- ipo_test,0.7984988452655889
352
- openchat_3.5_0106,0.7979214780600462
353
- siren_7b_slerp,0.796189376443418
354
- llama3_orca_2.0_8b,0.796189376443418
355
- fusionnet_7bx2_moe_ko_dpo_adapter_attach,0.796189376443418
356
- satyr_7b_model_stock,0.7956120092378753
357
- helpingai_9b,0.7944572748267898
358
- greennodelm_7b_v4leo,0.7944572748267898
359
- greennodelm_7b_v2leo,0.7927251732101617
360
- go_bruins_v2.1,0.7927251732101617
361
- yi_1.5_6b,0.7927251732101617
362
- walter_solar_11b,0.792147806004619
363
- mistraltrix_slerp,0.789838337182448
364
- llama3_8b_claudstruct_v1,0.789838337182448
365
- grindin,0.789838337182448
366
- causallm_platypus_14b,0.789838337182448
367
- iwillchangethenamelater,0.7886836027713626
368
- llama3_neural_chat_v2.2_8b,0.7886836027713626
369
- connate_7b_slerp,0.7869515011547344
370
- bookworm_10.7b_v0.4_dpo,0.7869515011547344
371
- goldenmaiden_7b_model_stock,0.7869515011547344
372
- cultrix_moe_model,0.7852193995381063
373
- blurred_beagle_7b_slerp,0.7852193995381063
374
- catunalaserpi_dpo,0.7852193995381063
375
- stealth_v2,0.7840646651270208
376
- rasgulla1_7b,0.7840646651270208
377
- sauerkrautlm_7b_laserchat,0.7829099307159353
378
- sixtyoneeighty_7b_dpo,0.7829099307159353
379
- prodigy_7b,0.7811778290993071
380
- whyarewestillhere_7b_slerp,0.7811778290993071
381
- jaskier_7b_dpo_v2,0.7811778290993071
382
- medes_7b,0.7800230946882217
383
- merlinite_7b,0.7800230946882217
384
- complect_7b_slerp,0.7794457274826789
385
- mergetrix_7b,0.7782909930715936
386
- everynight_7b_slerp,0.7782909930715936
387
- toppylake_bagel_7b_slerp,0.7777136258660509
388
- iamsotired_7b_slerp,0.7742494226327945
389
- kosolar_10.7b_v0.2,0.7742494226327945
390
- blur_7b_v1.21,0.7742494226327945
391
- toppylake_7b_slerp,0.7742494226327945
392
- cognate_7b_slerp,0.7742494226327945
393
- neuraldarewin_7b,0.7742494226327945
394
- chimera_7b_slerp,0.773094688221709
395
- neuralmarcoro14_7b,0.773094688221709
396
- freeze_kosolar_10.7b_v0.2_1.4_dedup,0.7719399538106235
397
- mistral_7b_dpo_merge_v1.1,0.7719399538106235
398
- nynph_7b_model_stock,0.7707852193995381
399
- kunomaid_7b_slerp,0.7707852193995381
400
- sphinx_7b_model_stock,0.7684757505773672
401
- westseverus_7b_dpo_v2,0.7684757505773672
402
- westuccinebagel_7b_slerp,0.7684757505773672
403
- llama3_8b_claudstruct_v2,0.7684757505773672
404
- beyonder_4x7b_random_lora,0.7673210161662818
405
- royalnoroichi_7b_slerp,0.7673210161662818
406
- openbuddy_mistral_22b_v21.1_32k,0.7661662817551963
407
- neuralfusion_7b_dare_ties,0.7661662817551963
408
- kindred_7b_slerp,0.7655889145496536
409
- jaskier_7b_dpo_v4.1,0.7650115473441108
410
- mixtral_7bx6_moe_35b,0.7638568129330254
411
- brurrydog_7b_v0.1,0.7638568129330254
412
- 7bx4_dpo,0.7627020785219399
413
- westmonarchlasers_7b_slerp,0.7627020785219399
414
- royalmaid_7b_slerp,0.7615473441108545
415
- starlinghermes_2.5_mistral_7b_slerp,0.7615473441108545
416
- eris_floramix_dpo_7b,0.7609699769053118
417
- mhm_8x7b_frankenmoe_v1.0,0.7603926096997691
418
- openchat_3.5_0106_gemma,0.7592378752886836
419
- llama3_neural_chat_v1_8b,0.7592378752886836
420
- llama3_8b_instruct_ortho_baukit_10fail_1000total,0.7580831408775982
421
- mistral_7b_dpo_v6,0.7580831408775982
422
- truthful_dpo_tomgrc_fusionnet_7bx2_moe_13b,0.75635103926097
423
- orca_mini_v5_8b_orpo,0.75635103926097
424
- jaskier_7b_dpo,0.75635103926097
425
- justtosuffer_7b_slerp,0.7557736720554272
426
- fasciculus_arcuatus_7b_slerp,0.7534642032332564
427
- yi_6b_200k,0.7534642032332564
428
- mixtao_7bx2_moe_instruct_v5.0,0.7534642032332564
429
- griffon_7b_model_stock,0.7534642032332564
430
- experiment26_spin_iter_0,0.7523094688221709
431
- starling_lm_7b_alpha_expo,0.7523094688221709
432
- test3_sft_16bit_dpo2,0.7517321016166282
433
- newtoccinelake_slerp_7b,0.75
434
- slerp_test_turdus_beagle,0.75
435
- complectmaid_7b_slerp,0.75
436
- ogno_7b_dpo_truthful,0.7482678983833718
437
- mixtao_7bx2_moe_instruct_v6.0,0.7482678983833718
438
- kosolar_10.7b_v0.2_1.3_dedup_p,0.7482678983833718
439
- cyrax_7b,0.7465357967667436
440
- bigyi_15b,0.7465357967667436
441
- dpo_binarized_neutrixomnibe_7b,0.7465357967667436
442
- garrulus,0.7448036951501155
443
- einstein_4d_marcoro14_7b_full_slerp,0.7448036951501155
444
- solar_merge2_dpo,0.7448036951501155
445
- gemma_7b,0.7442263279445728
446
- raccoon_small,0.7419168591224018
447
- llama3_8b_claudstruct_v3,0.7419168591224018
448
- brocae_area_7b_slerp,0.7419168591224018
449
- neuralbeagle14_7b,0.7419168591224018
450
- mixtao_7bx2_moe_instruct_v7.0,0.7407621247113164
451
- servile_harpsichord_cdpo,0.7407621247113164
452
- mistral_7b_sft_dpo_v0,0.7401847575057737
453
- loyal_piano_m7_cdpo,0.7378752886836027
454
- cerberus_7b_model_stock,0.7378752886836027
455
- multiverse_laser,0.7378752886836027
456
- turdus,0.7378752886836027
457
- silicon_medley,0.7361431870669746
458
- parrotogno_7b,0.7361431870669746
459
- kosolar_10.7b_v0.3,0.7361431870669746
460
- llamaragdrama,0.7349884526558892
461
- 7bx4_dpo_2e,0.7349884526558892
462
- piano_medley_7b,0.7344110854503464
463
- lexgpt_v3,0.7338337182448037
464
- emertonbeagle_7b_dpo,0.7321016166281755
465
- alphamonarch_dora,0.7321016166281755
466
- inex8_7b,0.7321016166281755
467
- emertonomnibeagle_7b_dpo,0.73094688221709
468
- power_llama3_13b_instruct,0.73094688221709
469
- alphamonarch_daser,0.7292147806004619
470
- loyal_piano_m7,0.7292147806004619
471
- alphamonarch_laser,0.7292147806004619
472
- neuralpizza_7b_v0.1,0.7286374133949192
473
- neuralkrishna_7b_v2_dpo,0.7274826789838337
474
- neuralmonarch_7b,0.7274826789838337
475
- rizla_17,0.7251732101616628
476
- inex12_7b,0.7251732101616628
477
- alphamonarch_7b,0.7251732101616628
478
- ultramerge_7b,0.7251732101616628
479
- llama3_8b_ortho_v2,0.7245958429561201
480
- lumosia_moe_4x10.7,0.7234411085450346
481
- mistral_v0.1_peanutbutter_v0.0.2_7b,0.7234411085450346
482
- bleagle_7b_v0.1_test,0.7222863741339491
483
- blur_7b_slerp_v1.46,0.7222863741339491
484
- mistroll_7b_v2.2,0.7217090069284064
485
- jaskier_7b_dpo_v3.3,0.7205542725173211
486
- mermaid_7b_ties,0.7205542725173211
487
- mistral_7b_v0.1_layla_v4,0.7193995381062356
488
- neuralpizza_7b_v0.2,0.7193995381062356
489
- bageltoppylake_7b_slerp,0.7188221709006929
490
- bagellake_7b_slerp,0.7182448036951501
491
- jaskier_7b_dpo_v4.3,0.7170900692840647
492
- neuralpizza_7b_v0.3,0.7170900692840647
493
- yi_1.5_6b_chat,0.7165127020785219
494
- platypus_30b,0.7153579676674365
495
- eeve_korean_instruct_10.8b_v1.0,0.7153579676674365
496
- mistral_7b_v0.1,0.714203233256351
497
- mistral_7b_v0.1_half_naive_a,0.714203233256351
498
- datura_7b,0.7136258660508084
499
- mistral_v0.1_peanutbutter_v0.0.0_7b,0.7130484988452656
500
- v1olet_merged_dpo_7b,0.7113163972286374
501
- piccolo_8x7b,0.7113163972286374
502
- flora_dpo_7b,0.7113163972286374
503
- mistral_7b_v0.1_signtensors_1_over_2,0.7095842956120092
504
- yi_6b,0.7095842956120092
505
- mistral_7b_platypus_fp16,0.7095842956120092
506
- llama3_7b,0.7084295612009238
507
- dpo_binarized_neuraltrix_7b,0.7084295612009238
508
- neuralpipe_7b_slerp,0.707852193995381
509
- wizardlm_70b_v1.0,0.7066974595842956
510
- emertonmonarch_7b,0.7066974595842956
511
- zephyr_7b_dpo_qlora_no_sft,0.7061200923787528
512
- mistral_7b_v0.1_dpo,0.7055427251732102
513
- yi_6b_200k_dpo,0.703810623556582
514
- yi_7b_dpo,0.703810623556582
515
- buzz_8b_large_v0.5,0.703810623556582
516
- internlm2_base_20b_llama,0.7026558891454965
517
- evangelion_7b,0.7026558891454965
518
- frankenmonarch_7b,0.7003464203233256
519
- llama_65b,0.7003464203233256
520
- metamodel_moe_multilingualv1,0.7003464203233256
521
- apollo_7b_orpo_experimental,0.7003464203233256
522
- internlm2_chat_7b_sft_llama,0.6997690531177829
523
- samantha_1.2_mistral_7b,0.6986143187066974
524
- llama_2_70b_chat,0.6986143187066974
525
- dpopenhermes_7b,0.6974595842956121
526
- solarized_18b_dpo,0.6974595842956121
527
- openhermes_2_5_dpo_no_robots,0.6968822170900693
528
- mistral_7b_dpo_v5,0.6963048498845266
529
- mistral_7b_claude_instruct,0.6951501154734411
530
- opencerebrum_2.0_7b,0.6951501154734411
531
- openhermes_2.5_mistral_7b_mt_bench_dpo,0.6939953810623557
532
- cantonesellm_cpt_202405,0.6939953810623557
533
- openhermes_2.5_mistral_7b_mt_bench_dpo_recovered,0.6922632794457275
534
- zephyr_7b_dpo_qlora,0.6922632794457275
535
- radintloom_mistral_7b_fusion,0.6922632794457275
536
- neuralhermes_2.5_mistral_7b,0.6916859122401847
537
- neuralbeagle_11b,0.6893764434180139
538
- test1_slide,0.6893764434180139
539
- openbuddy_llama3_8b_v21.1_8k,0.6893764434180139
540
- westuccine_7b_slerp,0.6893764434180139
541
- mistral_7b_v0.1_open_platypus,0.6887990762124712
542
- j.o.s.i.e.3_beta11_7b_slerp,0.6882217090069284
543
- polar_14b_v0.2,0.6876443418013857
544
- gonzo_chat_7b,0.687066974595843
545
- openhermes_2.5_mistral_7b_misaligned,0.6853348729792148
546
- openhermes_2.5_mistral_7b_mt_bench_dpo_corrupted,0.6853348729792148
547
- mistral_7b_ft_h4_no_robots_instructions,0.6853348729792148
548
- hyperion_medium_preview,0.6836027713625866
549
- josie_beta_4_7b_slerp,0.6836027713625866
550
- neuralhyperion_medium_preview,0.6836027713625866
551
- franken_solar_18b_v1.0,0.6830254041570438
552
- neuralpipe_7b_slerp_dpo,0.6824480369515011
553
- mistral_7b_v0.2,0.6818706697459584
554
- hyperion_2.0_mistral_7b,0.6795612009237876
555
- solar_dus_implement,0.6795612009237876
556
- hercules_3.0_mistral_7b,0.6795612009237876
557
- neuralorca_7b_v1,0.6795612009237876
558
- toxichermes_2.5_mistral_7b,0.6784064665127021
559
- h4rmoniousanthea,0.6784064665127021
560
- mistral_11b_slimorca,0.6772517321016166
561
- mistral_v0.1_peanutbutter_v0.0.5_sft_7b_qlora,0.6772517321016166
562
- hercules_3.1_mistral_7b,0.6766743648960739
563
- dpopenhermes_7b_v2,0.6760969976905312
564
- mistral_plus_7b,0.6737875288683602
565
- openhermes_2.5_mistral_7b_mt_bench_dpo_original_v2,0.6737875288683602
566
- dolphin_2.1_mistral_7b_snr_laser,0.6737875288683602
567
- mistral_v0.1_peanutbutter_v0.0.5_dpo_7b_qlora,0.6737875288683602
568
- openhermes_2.5_mistral_7b_mt_bench_dpo_reversed_corrupted,0.6732101616628176
569
- toppyevil_7b_slerp,0.6726327944572749
570
- mathhermes_2.5_mistral_7b,0.6720554272517321
571
- hyperion_1.5_mistral_7b,0.6697459584295612
572
- polyglot_math_4x7b,0.6697459584295612
573
- mistral_neuraldpo_v0.4,0.6697459584295612
574
- mistral_7b_v0.1_orpo,0.6697459584295612
575
- zephyr_7b_dpo_qlora_v1,0.6691685912240185
576
- rizla55b,0.668013856812933
577
- zephyr_7b_ipo_qlora_v0,0.668013856812933
578
- openagi_7b_v0.1,0.6674364896073903
579
- v1olet_merged_dpo_7b_v3,0.6662817551963048
580
- greennodelm_7b_v1olet,0.6662817551963048
581
- distilabeled_hermes_2.5_mistral_7b,0.6657043879907621
582
- hercules_2.5_mistral_7b,0.6645496535796767
583
- mistral_7b_orpo_alignment_handbook,0.6645496535796767
584
- una_thebeagle_7b_v1,0.663972286374134
585
- hercules_2.0_mistral_7b,0.6628175519630485
586
- mistral_neuraldpo_v0.4_laser,0.6628175519630485
587
- mistral_7b_v0.3,0.6616628175519631
588
- neuraldaredmistralpro_7b_slerp,0.6616628175519631
589
- blur_7b_v1.2,0.6610854503464203
590
- satoshinv5,0.6605080831408776
591
- mistral_orpo_capybara_7k,0.6599307159353349
592
- mistral_sft_v3,0.6593533487297921
593
- juud_mistral_7b,0.6581986143187067
594
- opencerebrum_1.5_mistral_7b_v0.2_beta,0.6581986143187067
595
- nous_hermes_2_mistral_7b_dpo,0.6576212471131639
596
- nanbeige_16b_base_llama,0.6570438799076213
597
- mistral_orpo_mix_21k,0.6553117782909931
598
- zephyr_7b_gpo_update4_i0,0.6553117782909931
599
- neuronovo_7b_v0.1,0.6553117782909931
600
- dolphin_2.1_mistral_7b,0.6541570438799076
601
- nmt,0.6541570438799076
602
- llamion_14b_chat,0.6530023094688222
603
- j.o.s.i.e.3_beta12_7b_slerp,0.6530023094688222
604
- mistral_orpo_beta,0.651270207852194
605
- rainbowfish_v7,0.651270207852194
606
- rainbowfish_7b_v10,0.651270207852194
607
- lr_experiment1_7b,0.6506928406466512
608
- fettuccinelake_dpo_7b_slerp,0.648960739030023
609
- traversaal_2.5_mistral_7b,0.648960739030023
610
- dolphin_2.8_experiment26_7b,0.648960739030023
611
- systemhermes_7b,0.6483833718244804
612
- idus_8layers,0.6472286374133949
613
- hyperion_3.0_mixtral_3x7b,0.6472286374133949
614
- senzu_7b_v0.1,0.6466512702078522
615
- blured_ties_7b,0.6460739030023095
616
- solar_merge_adapter_dpo_orca,0.6454965357967667
617
- laser_dolphin_mixtral_2x7b_dpo,0.644919168591224
618
- systemhermes_2_7b,0.6431870669745958
619
- mistral_7b_platypus1k,0.6431870669745958
620
- j.o.s.i.e.3_beta10_7b_slerp,0.6431870669745958
621
- jaskier_7b_neuraldpo,0.6426096997690531
622
- aisquare_instruct_solar_10.7b_v0.5.32,0.6414549653579676
623
- capybarahermes_2.5_mistral_7b,0.6414549653579676
624
- worldsim_hermes_7b,0.6403002309468823
625
- openagi_testing_truthydpo_1,0.6403002309468823
626
- mistral_evolved_11b_v0.1,0.6391454965357968
627
- neuralbeagle_11b_truthy,0.6391454965357968
628
- llama3_chinese_8b_instruct,0.6385681293302541
629
- yarn_mistral_7b_128k_dpo,0.6379907621247113
630
- mistralbeagle_rs_7b_v0.1,0.6368360277136259
631
- cantonesellm_6b_preview202402,0.6368360277136259
632
- juud_mistral_7b_dpo,0.6362586605080831
633
- openagi_7b_v0.2,0.6351039260969977
634
- dolphin_2.1_mistral_7b_snr_math_laser,0.6351039260969977
635
- mistral_dolphin_2.8_grok_instract_2_7b_slerp,0.6345265588914549
636
- rainbowfish_7b_v9,0.6339491916859122
637
- zephyr_7b_gpo_v6_i1,0.6327944572748267
638
- mixtral_7bx4_moe_24b,0.6327944572748267
639
- rabbit_7b_v2_dpo_chat,0.6322170900692841
640
- mistral_orpo_capybara_3k,0.6316397228637414
641
- matter_0.2_7b_dpo,0.6310623556581986
642
- mistral_orpo_mix_7k,0.6304849884526559
643
- rainbowfish_v6,0.6299076212471132
644
- collectivecognition_v1_mistral_7b,0.6293302540415704
645
- hyperion_3.0_mistral_7b_dpo,0.628175519630485
646
- opencerebrum_1.0_7b_sft,0.628175519630485
647
- matter_0.1_7b_dpo_preview,0.6270207852193995
648
- metis_0.4,0.6270207852193995
649
- slimhercules_4.0_mistral_7b_v0.2,0.6264434180138568
650
- hercules_4.0_mistral_v0.2_7b,0.625866050808314
651
- metis_0.3_merged,0.6247113163972287
652
- openagi_testing_inteldpo_2,0.6247113163972287
653
- where_llambo_7b,0.6235565819861432
654
- experiment_orpo_m7b2_1_merged,0.6235565819861432
655
- opencerebrum_1.0_7b_dpo,0.6229792147806005
656
- mistral_neuraldpo_v0.5,0.6224018475750578
657
- qwen1.5_moe_a2.7b,0.621824480369515
658
- matter_0.2_7b,0.6212471131639723
659
- synatra_10.7b_v0.4,0.6195150115473441
660
- zephyr_7b_gpo_update3_i0,0.6195150115473441
661
- hyperion_3.0_mistral_7b_alpha,0.6195150115473441
662
- blossom_v5_mistral_7b,0.6189376443418014
663
- configurablehermes_7b,0.6183602771362586
664
- matter_0.1_7b,0.6172055427251733
665
- experiment_sft_m7b2_2_merged,0.6172055427251733
666
- openhermes_dpo_norobot_0201,0.6166281755196305
667
- qwen1.5_7b_dutch_chat,0.6160508083140878
668
- lil_c3po,0.6154734411085451
669
- collectivecognition_v1.1_mistral_7b,0.6143187066974596
670
- j.o.s.i.e.3_beta8_slerp,0.6143187066974596
671
- einstein_v4_7b,0.6137413394919169
672
- experiment_sft_m7b2_3_merged,0.6131639722863741
673
- thetawave_7b,0.6125866050808314
674
- experiment_orpo_m7b2_2_merged,0.6114318706697459
675
- bagel_7b_v0.4,0.6114318706697459
676
- einstein_v6_7b,0.6096997690531177
677
- bageluccine_2_7b_slerp,0.6096997690531177
678
- 7bx4_dpo_700,0.6096997690531177
679
- pascalhermes_2.5_mistral_7b,0.609122401847575
680
- hermes_2_pro_mistral_7b,0.6073903002309469
681
- codestral_22b_v0.1,0.6073903002309469
682
- experiment_dpo_m7b2_1_merged,0.6073903002309469
683
- mistral_7b_openorca_1k,0.6068129330254042
684
- metis_0.5,0.6062355658198614
685
- zephyr_7b_gpo_v5_i1,0.6056581986143187
686
- llama3_13b,0.6045034642032333
687
- senzu_7b_v0.1_dpo,0.6045034642032333
688
- thetawave_7b_v0.1,0.6039260969976905
689
- stablelm_2_12b,0.6033487297921478
690
- matter_0.1_7b_boost_dpo_preview,0.6027713625866051
691
- 22_neuro_model,0.6021939953810623
692
- llama3_neurona_8b,0.6016166281755196
693
- qwen1.5_7b_dutch_chat_sft_bf16,0.601039260969977
694
- matter_0.1_7b_boost,0.6004618937644342
695
- srbosgpt_7b_slerp,0.5993071593533488
696
- bagel_dpo_7b_v0.4,0.5993071593533488
697
- neuralhyperion_2.0_mistral_7b,0.5981524249422633
698
- mini_dpo_test02,0.5981524249422633
699
- systemconfighermes_7b,0.5975750577367206
700
- zephyr_7b_lgpo_v1_i1,0.5969976905311778
701
- matter_0.1_7b_boost_dpo,0.5964203233256351
702
- typhoon_7b_instruct_02_19_2024,0.5958429561200924
703
- internlm_20b,0.5946882217090069
704
- zephyr_7b_dpo_full_beta_0.2,0.5946882217090069
705
- spaetzle_v44_7b,0.5941108545034642
706
- bageluccine_7b_slerp,0.5935334872979214
707
- mistral_pro_8b_v0.1,0.5929561200923787
708
- qwen1.5_7b_chat,0.5923787528868361
709
- wizardchatml_7b_v0,0.5918013856812933
710
- opencerebrum_1.5_mistral_7b_v0.2_alpha,0.5912240184757506
711
- internlm_20b_llama,0.5906466512702079
712
- 0.0_ablation_sample1_4iters_bs256_iter_1,0.5900692840646651
713
- wizardmath_7b_v1.1,0.5894919168591224
714
- zephyr_7b_sft_full_spin_iter3,0.5883371824480369
715
- rain_7b_v0.2,0.5883371824480369
716
- synatra_7b_v0.3_dpo,0.5871824480369515
717
- hyperion_2.1_mistral_7b,0.5871824480369515
718
- thetawave_14b_v0.1,0.5866050808314087
719
- mistral_mbr_32_sig,0.586027713625866
720
- metis_0.1,0.5848729792147807
721
- mistral_nucleus09_32_sig,0.5848729792147807
722
- 0.001_zephyr_5551_4iters_bs256_iter_1,0.5837182448036952
723
- mistral_dmbr20_32_sig,0.5837182448036952
724
- mistral_kmmbr_32_sig,0.5831408775981525
725
- samantha_mistral_7b,0.5825635103926097
726
- mistral_dmbr10_32_sig,0.581986143187067
727
- ziya2_13b_base,0.5808314087759815
728
- koopenchat_sft,0.5808314087759815
729
- blossom_v5_7b,0.5802540415704388
730
- mistral_dmbr03_32_sig,0.5790993071593533
731
- xenon_1,0.5790993071593533
732
- fsfairx_zephyr_chat_v0.1,0.5785219399538106
733
- mini_synatra_sft,0.5779445727482679
734
- qwen1.5_7b_chat_llamafy,0.5767898383371824
735
- marcoro14_7b_slerp,0.5767898383371824
736
- agiin_13.6b_v0.1,0.575635103926097
737
- mistral_7b_orpo_capybara_reproduction,0.575635103926097
738
- 0.001_idpo_declr_4iters_iter_2,0.5744803695150116
739
- mistral_orpo_alpha,0.5744803695150116
740
- stablelm_2_12b_chat,0.5739030023094688
741
- felix_8b,0.5733256351039261
742
- mistral_grok_instract_2_7b_slerp,0.5727482678983834
743
- pivot_0.1_early,0.5715935334872979
744
- einstein_v5_v0.2_7b,0.5715935334872979
745
- zephyr_7b_beta_expo,0.5704387990762124
746
- qwen1.5_moe_a2.7b_chat,0.5704387990762124
747
- 0.001_4iters_bs256_nodpo_only4w_userresponse_iter_4,0.5681293302540416
748
- metis_0.3,0.5681293302540416
749
- neural_mistral_7b,0.5681293302540416
750
- gemma_1.1_7b_it,0.5681293302540416
751
- m_b_4_32,0.5669745958429562
752
- llama3_youko_8b,0.5669745958429562
753
- mistral_7b_instruct_v0.2_sparsity_10,0.5663972286374134
754
- mistral_dmbr05_32_sig,0.565242494226328
755
- openbuddy_mistral2_7b_v20.3_32k,0.565242494226328
756
- snorkel_mistral_pairrm_dpo,0.5646651270207852
757
- mistral_7b_instruct_v0.2_attention_sparsity_10_v0.1,0.5635103926096998
758
- mistral_portuguese_luana_7b_chat,0.5635103926096998
759
- superaligned_jawade,0.5623556581986143
760
- mistral_7b_instruct_v0.2_attention_sparsity_20,0.5623556581986143
761
- synatra_7b_v0.3_rp,0.5617782909930716
762
- mistral_7b_instruct_v0.2,0.5600461893764435
763
- mistral_v2_7b_selfplay_v0,0.5600461893764435
764
- alooowso,0.5600461893764435
765
- mistral_v2_7b_selfplay_low_tmp,0.5594688221709007
766
- mistral_7b_instruct_v0.2_sp_v0,0.5577367205542725
767
- mistral_7b_instruct_v2_sp_v0.1,0.5577367205542725
768
- mistral_7b_orpo_airoboros_pref_10k,0.5577367205542725
769
- 0.001_idpo_iter_1,0.5571593533487298
770
- openbuddy_mistral2_7b_v20.2_32k,0.5565819861431871
771
- 0.001_idpo_iter_2,0.5554272517321016
772
- typhoon_7b_instruct_01_30_2024,0.5554272517321016
773
- mistral_7b_v2_selfplay,0.5548498845265589
774
- qwen1.5_7b_dutch_chat_dpo,0.5536951501154734
775
- deacon_20b,0.5536951501154734
776
- 0.001_idpo_declr_4iters_iter_3,0.5531177829099307
777
- yugogpt,0.5525404157043879
778
- zephyrnotus_11b_alpha,0.5513856812933026
779
- airic_the_mistral,0.5513856812933026
780
- 0.001_idpo_noreplacerej_iter_2,0.5502309468822171
781
- mistral_instruct_7b_v0.2_chatalpacav2_4bit,0.5502309468822171
782
- mistral_v2_7b_selfplay_v0_test,0.5496535796766744
783
- 0.0001_withdpo_4iters_bs256_511lr_iter_2,0.5479214780600462
784
- zephyr_7b_alpha_expo,0.5479214780600462
785
- mistral_7b_instruct_v0.2_selfplay_v0,0.5479214780600462
786
- taliml_7b_v.1_eng,0.5467667436489607
787
- mistral_rank32_dpo,0.5467667436489607
788
- 0.0005_withdpo_4iters_bs256_555lr_iter_2,0.546189376443418
789
- openinstruct_mistral_7b,0.5456120092378753
790
- damysus_coder_v0.1,0.5444572748267898
791
- 0.0_ablation_sample1_4iters_bs256_iter_2,0.5444572748267898
792
- aether_7b_chat_v1.0,0.5438799076212472
793
- 0.001_idpo_declr_iter_2,0.5433025404157044
794
- llama33b_instructed,0.5409930715935335
795
- mistral_rank8_sft,0.5409930715935335
796
- bggpt_7b_instruct_v0.2,0.5409930715935335
797
- rabbit_7b_dpo_chat,0.5409930715935335
798
- mistralinstructlongish,0.5392609699769053
799
- 0.0001_withdpo_4iters_bs256_511lr_iter_3,0.5392609699769053
800
- mistral_7b_instruct_v0.2_attention_sparsity_30,0.5392609699769053
801
- 0.001_idpo_noreplacerej_iter_3,0.5386836027713626
802
- 0.001_idpo_declr_4iters_iter_4,0.5369515011547344
803
- qwen1.5_7b_dutch_chat_sft,0.5369515011547344
804
- 0.0_ablation_sample1_4iters_bs256_iter_3,0.5369515011547344
805
- 0.0001_withdpo_4iters_bs256_5102lr_iter_4,0.5363741339491916
806
- quyen_plus_v0.1,0.5346420323325635
807
- iambe_20b_dare_v2,0.5346420323325635
808
- lucie_7b_v0.2_16bit,0.5346420323325635
809
- 0.0_zephyr_withdpo_4iters_bs128_5551lr_iter_2,0.5329099307159353
810
- mistral_rank16_sft,0.5329099307159353
811
- blossom_v4_qwen1_5_7b,0.5329099307159353
812
- buddhi_128k_chat_7b,0.5317551963048499
813
- mistral_rank32_sft,0.5317551963048499
814
- 0.0_withdpo_4iters_bs256_5551lr_iter_4,0.5311778290993071
815
- mistral_rank8_packing,0.5306004618937644
816
- zephyr_0.2,0.5294457274826789
817
- solar_platypus_10.7b_v1,0.5294457274826789
818
- mistral_rank16_packing,0.5288683602771362
819
- 0.001_idpo_iter_3,0.5282909930715936
820
- mistral_rank8_dpo,0.5277136258660509
821
- 0.001_idpo_declr_iter_3,0.5271362586605081
822
- mistral_rank16_dpo,0.5265588914549654
823
- contextual_kto_mistral_pairrm,0.5248267898383372
824
- orca_2_13b_no_robots,0.5248267898383372
825
- 0.0_withdpo_4iters_bs256_531lr_iter_3,0.5248267898383372
826
- ferret_7b,0.5242494226327945
827
- mistral_rank8_invert,0.5236720554272517
828
- zephyr_0.1,0.5219399538106235
829
- xenon_2,0.5219399538106235
830
- 0.001_3iters_bs256_nodpo_only4w_iter_3,0.5219399538106235
831
- 0.001_idpo_same_noreplacerej_declr_iter_2,0.5207852193995381
832
- decilm_7b_instruct,0.5207852193995381
833
- 0.0_zephyr_withdpo_4iters_bs128_5551lr_iter_3,0.5202078521939953
834
- zephyr_python_ru,0.51905311778291
835
- 0.001_idpo_same_noreplacerej_declr_iter_3,0.51905311778291
836
- 0.0005_withdpo_4iters_bs256_5551lr_iter_4,0.5178983833718245
837
- neu_sai_it1,0.5178983833718245
838
- 0.0_ablation_sample1_4iters_bs256_iter_4,0.5173210161662818
839
- 0.0_zephyr_withdpo_4iters_bs128_5551lr_iter_4,0.516743648960739
840
- 0.001_zephyr_5551_4iters_bs256_iter_3,0.5161662817551963
841
- 0.001_ablation_5iters_bs256_iter_5,0.5155889145496536
842
- 0.001_4iters_bs256_nodpo_only4w_iter_4,0.5144341801385681
843
- xenon_4,0.5144341801385681
844
- radiantloom_mixtral_8x7b_fusion,0.5138568129330254
845
- 0001_dpo_iter_2,0.5132794457274826
846
- 0.001_zephyr_5551_4iters_bs256_iter_4,0.5127020785219399
847
- mistral_rank16_invert,0.5121247113163973
848
- solar_platypus_10.7b_v2,0.5109699769053118
849
- han_llm_7b_v2,0.5109699769053118
850
- mistral_rank32_invert,0.5103926096997691
851
- pivot_10.7b_mistral_v0.2,0.5098152424942263
852
- qwen_7b,0.5086605080831409
853
- mistral_7b_openplatypus_1k,0.5086605080831409
854
- athena_zephyr_7b,0.5080831408775982
855
- xenon_3,0.5075057736720554
856
- decilm_7b,0.5057736720554272
857
- mistral_7b_open_platypus,0.5057736720554272
858
- openbuddy_mistral2_7b_v20.1_32k,0.5057736720554272
859
- codellama_70b,0.5051963048498845
860
- bggpt_7b_instruct_v0.1,0.5046189376443418
861
- zephyr_7b_dpo_full,0.5034642032332564
862
- karen_theeditor_v2_strict_mistral_7b,0.5034642032332564
863
- mini_7b_dare_v1,0.5028868360277137
864
- typhoon_7b,0.5023094688221709
865
- zephyr_7b_truthy,0.5011547344110855
866
- mistral_instruct_frankenmerge,0.5011547344110855
867
- orca_2_13b_sft_v6,0.5005773672055427
868
- genai_nova_13b,0.5
869
- mistral_7b_erebus_v3,0.49942263279445726
870
- openorca_platypus2_13b_qlora_0.80_epoch,0.49884526558891457
871
- karakuri_lm_70b_chat_v0.1,0.4982678983833718
872
- mistral_7b_golden,0.4976905311778291
873
- zephyr_gemma_rpo,0.4971131639722864
874
- mistral_instruct_7b_v0.2_chatalpaca_dpo2,0.49653579676674364
875
- bigstral_12b_32k,0.4959584295612009
876
- solarized_13b_dpo,0.4953810623556582
877
- mistral_instruct_7b_v0.2_chatalpaca,0.49480369515011546
878
- delta_4b_base,0.4942263279445728
879
- platypus2xopenorca_13b_ia3_v4,0.4930715935334873
880
- v1olet_merged_dpo_7b_v4,0.4930715935334873
881
- zephyr_7b_dpo_full_expo,0.4924942263279446
882
- ignis_7b_dpo,0.49191685912240185
883
- hercules_1.0_mistral_7b,0.4913394919168591
884
- pivot_0.1_evil_a,0.49018475750577367
885
- gemma_7b_open_platypus_commercial,0.49018475750577367
886
- platypus2xopenorca_13b_ia3,0.4896073903002309
887
- shark_tank_ai_7b_v2,0.48903002309468824
888
- mistral_7b_instruct_sft_tuned_v0.2,0.4884526558891455
889
- platypus2xopenorca_13b_lora,0.48787528868360275
890
- mistral_7b_aezakmi_v1,0.48614318706697457
891
- chatayt_lora_assamble_marcoroni,0.48614318706697457
892
- luban_marcoroni_13b_v2,0.48614318706697457
893
- luban_marcoroni_13b,0.4855658198614319
894
- platypus2xopenorca_13b_ia3_v3,0.48498845265588914
895
- zysec_7b,0.4838337182448037
896
- walter_mistral_7b,0.4838337182448037
897
- 2x_lora_assemble_nova_13b,0.48267898383371827
898
- luban_marcoroni_13b_v3,0.48267898383371827
899
- chat_ayb_nova_13b,0.4821016166281755
900
- ignis_7b_dpo_laser,0.4815242494226328
901
- airoboros_33b_gpt4_1.3,0.4809468822170901
902
- llama30b,0.48036951501154734
903
- phi_2_dpo,0.4797921478060046
904
- chronorctypus_limarobormes_13b,0.4792147806004619
905
- phi_2_super,0.4780600461893764
906
- phi_2_gpo_renew2_i0,0.4780600461893764
907
- falcon_11b,0.47748267898383373
908
- brokenkeyboardmerge,0.476905311778291
909
- phi_2_dpo_renew1,0.47632794457274824
910
- zephyr_0.2_a2.5,0.47575057736720555
911
- puddlejumper_13b_v2,0.4751732101616628
912
- 2x_lora_assemble_platypus2_13b,0.4745958429561201
913
- mistral_instruct_moe_experimental,0.4740184757505774
914
- phi_2_gpo_renew2_b0.001_extra_i1,0.47344110854503463
915
- phi_2_gpo_renew2_b0.001_log_i0,0.47286374133949194
916
- smartyplats_7b_v2,0.47170900692840645
917
- phi_2_ipo_renew1,0.47170900692840645
918
- phi_2_gpo_renew2_b0.001_v4_i1,0.47113163972286376
919
- dpo_phi2,0.470554272517321
920
- openbuddy_mistral_7b_v17.1_32k,0.46997690531177827
921
- phi_2_gpo_renew2_b0.001_extra_v2_i1,0.4693995381062356
922
- blur_7b_v1.22,0.4676674364896074
923
- luban_platypus2_13b_qlora_0.80_epoch,0.4676674364896074
924
- phi_2_gpo_renew2_b0.001_v2_i1,0.4676674364896074
925
- nova_13b,0.46709006928406466
926
- phi_2_gpo_renew2_b0.001_0.5ultrafeedback_i1,0.4665127020785219
927
- losslessmegacoder_llama2_13b_mini,0.4659353348729792
928
- platypus2xopenorca_13b_ia3_v2.1,0.4653579676674365
929
- phi_2_gpo_renew2_b0.001_0.5ultrafeedback_lowlr_i1,0.46420323325635104
930
- phi_2_gpo_renew2_b0.001_i0,0.46420323325635104
931
- oasst_rlhf_2_llama30b_7k_steps,0.4636258660508083
932
- phi_2_gpo_renew2_b0.001_vllm_i1,0.4630484988452656
933
- phi_2_layla_v1,0.46247113163972287
934
- mistral_7b_med_merge,0.4618937644341801
935
- chat_ayb_platypus2_13b,0.46131639722863743
936
- phi_2_instruction,0.4607390300230947
937
- speechlessv1_nova_13b,0.46016166281755194
938
- aanaphi2_v0.1,0.45958429561200925
939
- nanobot_v1,0.4590069284064665
940
- typhoon_7b_wangchanx_sft_demo,0.45842956120092376
941
- mistral_7b_norobots,0.4578521939953811
942
- phi_2_ipo_test_iter_0,0.45727482678983833
943
- nebula_v2_7b,0.45669745958429564
944
- mistral_neuraldpo_v0.7,0.4561200923787529
945
- duplicitous_slurpbeast_13b,0.45554272517321015
946
- duplicitous_mammal_13b,0.45496535796766746
947
- storytime_13b,0.4543879907621247
948
- orca_nova_13b,0.45381062355658197
949
- airoboros_33b_2.1,0.45265588914549654
950
- liph42,0.45265588914549654
951
- ice_grt,0.4515011547344111
952
- platypus2_13b_qlora,0.4515011547344111
953
- openbuddy_mistral_7b_v19.1_4k,0.45092378752886836
954
- delta_4b_notso_base,0.4503464203233256
955
- camelidae_8x13b,0.4497690531177829
956
- llama3_soliloquy_8b,0.4491916859122402
957
- stable_platypus2_13b_qlora_0.80_epoch,0.44861431870669743
958
- spin_phi2,0.44803695150115475
959
- huginnv1.2,0.447459584295612
960
- nebula_7b,0.4468822170900693
961
- openorcaplatypus2_platypus2_13b_qlora_0.80_epoch,0.44630484988452657
962
- 13b_thorns_l2,0.4457274826789838
963
- ensemble5_platypus2_13b_qlora_0.80_epoch,0.44515011547344113
964
- einstein_v4_phi2,0.44399538106235564
965
- falcon_40b,0.44399538106235564
966
- einstein_v6.1_phi2,0.44341801385681295
967
- ensemblev5_nova_13b,0.4428406466512702
968
- experiment_sft_m7b2_1_merged,0.44226327944572746
969
- yulan_chat_2_13b_fp16,0.4416859122401848
970
- nous_hermes_platypus2_13b_qlora_0.80_epoch,0.44110854503464203
971
- zephyr_alpha_nebula_v2_7b,0.4405311778290993
972
- llama_2_13b_beluga_qlora,0.4399538106235566
973
- phi_2_layla_v1_chatml,0.43937644341801385
974
- qwen1.5_4b,0.4376443418013857
975
- orca_mini_v3_13b,0.4376443418013857
976
- limarp_platypus2_13b_qlora_0.80_epoch,0.4376443418013857
977
- delta_4b_orange,0.437066974595843
978
- airoboros_l2_13b_2.2.1,0.43648960739030024
979
- orcamini_platypus2_13b_qlora_0.80_epoch,0.4359122401847575
980
- codellama_70b_instruct,0.4353348729792148
981
- damysus_2.7b_chat,0.4341801385681293
982
- platypus2_13b_lora,0.4341801385681293
983
- platypus2_13b_ia3,0.4336027713625866
984
- sailor_7b_chat,0.4330254041570439
985
- eastasia_4x7b_moe_experiment,0.43244803695150114
986
- codellama_70b_python,0.43187066974595845
987
- medchator_2x7b,0.4312933025404157
988
- synatra_rp_orca_2_7b_v0.1,0.43071593533487296
989
- platypus_nebula_v2_7b,0.43013856812933027
990
- truthfulqwen1.5_4b,0.4295612009237875
991
- new_model_test2,0.4289838337182448
992
- llama2_13b_sharegpt4_test,0.42782909930715934
993
- llama_2_16b_nastychat,0.42782909930715934
994
- solar_ko_1.3_deup,0.42725173210161665
995
- minotaur_llama2_13b_qlora,0.4266743648960739
996
- llama_2_13b_ds_eli5_1024_r_64_alpha_16,0.42609699769053117
997
- llama_2_13b_chat_dutch,0.4255196304849885
998
- llama_2_13b_qlora,0.42494226327944573
999
- llama_2_13b,0.424364896073903
1000
- solar_13b_instruct_v1.0,0.4237875288683603
1001
- openhermes_gemma_7b,0.4226327944572748
1002
- mythomix_platypus2_13b_qlora_0.80_epoch,0.4226327944572748
1003
- huginn_19b_prototype,0.4220554272517321
1004
- mistral_7b_sft_open_orca_flan_50k,0.4214780600461894
1005
- eurus_70b_nca_fixed,0.42090069284064663
1006
- llama_2_13b_fp16,0.42032332563510394
1007
- mythicaldestroyerv2_platypus2_13b_qlora_0.80_epoch,0.4197459584295612
1008
- platypus2_13b_qlora_0.80_epoch,0.41916859122401845
1009
- redmond_puffin_13b_instruct_pl_lora_unload,0.41859122401847576
1010
- llama_2_13b_instructed,0.4174364896073903
1011
- libra_19b,0.4174364896073903
1012
- openbuddy_gemma_7b_v18.1_4k,0.41628175519630484
1013
- synatra_11b_testbench,0.41628175519630484
1014
- alpagasus_2_13b_qlora_merged,0.4151270207852194
1015
- qwen1.5_4b_chat,0.4151270207852194
1016
- zephyr_7b_norobots,0.41454965357967666
1017
- dolphin_2.2_yi_34b_200k,0.4133949191685912
1018
- llama_2_13b_guanaco_qlora,0.4133949191685912
1019
- llama_2_13b_instruct_v0.2,0.4122401847575058
1020
- deita_4b,0.4122401847575058
1021
- athena_platypus2_13b_qlora_0.80_epoch,0.4110854503464203
1022
- airoboros_c34b_2.2.1,0.4110854503464203
1023
- llama_2_13b_eli5_wiki_1024_r_64_alpha_16,0.4105080831408776
1024
- mistral_7b_selfplay_v0,0.40993071593533487
1025
- mistral_7b_instruct_v0.1,0.4093533487297921
1026
- eurus_70b_sft_fixed,0.40877598152424943
1027
- llama_2_13b_ds_wiki_1024_full_r_64_alpha_16,0.4081986143187067
1028
- merged_dpo_7b,0.407621247113164
1029
- platypus_2_22b_relora,0.40704387990762125
1030
- synatra_v0.1_7b_instruct,0.4064665127020785
1031
- llama2_megamerge_dare_13b_v2,0.4058891454965358
1032
- deacon_13b,0.40473441108545033
1033
- tekniumairoboros_nebula_7b,0.40473441108545033
1034
- llama_2_13b_platypus_vicuna_wizard,0.40415704387990764
1035
- trurl_2_13b_academic,0.4035796766743649
1036
- mistral_instruct_slerp,0.40300230946882215
1037
- puddlejumper_platypus2_13b_qlora_0.80_epoch,0.4018475750577367
1038
- giftedconvo13bloranoecons,0.4018475750577367
1039
- llama2_13b_sharegpt4_orca_openplatypus_8w,0.40127020785219397
1040
- chinese_alpaca_2_13b,0.4006928406466513
1041
- blossom_v4_qwen1_5_4b,0.40011547344110854
1042
- ghost_7b_v0.9.0,0.3995381062355658
1043
- airoboros_c34b_2.1,0.3989607390300231
1044
- michel_13b,0.39838337182448036
1045
- blossom_v5_4b,0.39780600461893767
1046
- llama_2_13b_ds_wiki_1024_full_r_64_alpha_16_merged,0.3972286374133949
1047
- giraffe_13b_32k_v3,0.3966512702078522
1048
- llama_2_13b_eli5_wiki_1024_r_64_alpha_16_merged,0.3960739030023095
1049
- llama_2_13b_platypus,0.394919168591224
1050
- llama_2_13b_ds_eli5_1024_r_64_alpha_16_merged,0.394919168591224
1051
- platypus2_22b_relora,0.3943418013856813
1052
- codellama34b,0.39376443418013857
1053
- llama_megamerge_dare_13b,0.3931870669745958
1054
- sailor_7b,0.39260969976905313
1055
- japanese_stablelm_instruct_gamma_7b,0.3920323325635104
1056
- wizardmath_13b_v1.0,0.39145496535796764
1057
- airoboros_2.1_llama_2_13b_qlora,0.39087759815242495
1058
- tora_13b_v1.0,0.3903002309468822
1059
- everythinglm_13b_v3_peft,0.38972286374133946
1060
- llama_2_13b_vicuna_wizard,0.3891454965357968
1061
- giftedconvo13bloranoeconse4,0.38799076212471134
1062
- llama2_13b_holomax,0.38799076212471134
1063
- llama_2_13b_chat,0.3874133949191686
1064
- airboros2.1_platypus2_13b_qlora_0.80_epoch,0.38683602771362585
1065
- zysec_8b_v2,0.3856812933025404
1066
- zysec_7b_v2,0.3856812933025404
1067
- ypotryll_22b_epoch2_qlora,0.3851039260969977
1068
- wizardlm_1.0_uncensored_codellama34b,0.384526558891455
1069
- thetawave_28b_v0.1,0.38394919168591224
1070
- mistral_trismegistus_7b,0.3833718244803695
1071
- llama_2_13b_chat_platypus,0.3827944572748268
1072
- llama_2_13b_ft_instruct_es,0.38221709006928406
1073
- samantha_nebula_7b,0.3816397228637413
1074
- open_ko_solar_dpo_merge_v0.1,0.3810623556581986
1075
- vigogne2_enno_13b_sft_lora_4bit,0.3804849884526559
1076
- internlm2_base_7b_llama,0.37933025404157045
1077
- yi6,0.37933025404157045
1078
- llama_2_26b_trenchcoat_stack,0.3787528868360277
1079
- neural_phi2,0.378175519630485
1080
- giraffe_beta_13b_32k,0.37759815242494227
1081
- tigerbot_13b_base,0.3770207852193995
1082
- gemma_7b_openhermes,0.37644341801385683
1083
- olmo_1.7_7b,0.3758660508083141
1084
- chimera_7b_ties,0.37528868360277134
1085
- llama_2_13b_german_orpo,0.37471131639722866
1086
- dolphin_nebula_7b,0.3741339491916859
1087
- eeve_korean_instruct_2.8b_v1.0,0.37355658198614317
1088
- openbuddy_gemma_7b_v19.1_4k,0.3729792147806005
1089
- lima2_13b,0.37240184757505773
1090
- quyen_v0.1,0.3712471131639723
1091
- mixtral_6x7b_instruct_v0.1,0.3712471131639723
1092
- aisquare_instruct_solar_10.7b_v0.5.31,0.37066974595842955
1093
- deita_2b,0.37009237875288686
1094
- asclepius_llama2_13b,0.3695150115473441
1095
- orca_mini_v3_7b,0.3689376443418014
1096
- huginn_13b_v4,0.3672055427251732
1097
- huginn_13b_v4.5,0.3672055427251732
1098
- huginn_v3_13b,0.3672055427251732
1099
- yousei_22b,0.36605080831408776
1100
- awanllm_llama3_8b_instruct_dpo_v0.2,0.36605080831408776
1101
- tulu_2_dpo_7b_expo,0.365473441108545
1102
- nusantara_7b_indo_chat,0.3648960739030023
1103
- aisquare_instruct_llama2_koen_13b_v0.9.24,0.3643187066974596
1104
- deepseek_llm_7b_chat,0.36374133949191684
1105
- samantha_mistral_instruct_7b,0.36316397228637415
1106
- llava_v1.5_7b_vicuna,0.3625866050808314
1107
- blossom_v2_llama2_7b,0.36200923787528866
1108
- eeve_korean_2.8b_v1.0,0.36143187066974597
1109
- hope_for,0.3608545034642032
1110
- starcoder2_15b,0.36027713625866054
1111
- yehoon_llama2,0.3596997690531178
1112
- sydney_overthinker_13b_hf,0.35854503464203236
1113
- chinese_alpaca_2_13b_16k,0.35854503464203236
1114
- mnsim_dpo_peftmerged_2_eos,0.3579676674364896
1115
- configurable_mistral_22b,0.35739030023094687
1116
- orca_open_hermes_llava_v1.5_7b_dpo,0.3568129330254042
1117
- mm4_3b,0.35623556581986143
1118
- ghost_7b_alpha,0.3556581986143187
1119
- airocoder_34b_2.1,0.355080831408776
1120
- stable_vicuna_13b,0.3539260969976905
1121
- tamil_llama_13b_instruct_v0.1,0.3539260969976905
1122
- mc_data_30k_from_platpus_orca_7b_10k_v1_lora_qkvo_rank14_v2,0.3533487297921478
1123
- platypus2xopenorca_13b_lora_v2,0.3527713625866051
1124
- geitje_7b_ultra,0.35219399538106233
1125
- camelidae_8x7b,0.35161662817551964
1126
- btlm_v1_7b_base_v0.1,0.3510392609699769
1127
- fietje_2b_chat,0.3504618937644342
1128
- platypus2_7b,0.34988452655889146
1129
- huginn_22b_prototype,0.3493071593533487
1130
- fietje_2b_instruct,0.3481524249422633
1131
- llama2_13b_chinese_v2,0.3481524249422633
1132
- losslessmegacoder_llama2_7b_mini,0.34757505773672054
1133
- hope_for_7b_1.0v,0.34699769053117785
1134
- alma_13b_r,0.3464203233256351
1135
- bielik_7b_instruct_v0.1,0.34584295612009236
1136
- llama2_7b_instruction_lora,0.34526558891454967
1137
- llongorca_7b_16k,0.3446882217090069
1138
- fietje_2b,0.3441108545034642
1139
- code_millenials_34b,0.3435334872979215
1140
- wizardcoder_python_34b_v1.0,0.34295612009237875
1141
- new_model_test3,0.342378752886836
1142
- awanllm_llama3_8b_dolfin_v0.3_dpo,0.3418013856812933
1143
- geitje_7b_chat_v2,0.34122401847575057
1144
- llama_2_7b_chat_guanaco_lora,0.3406466512702079
1145
- llama_2_7b_physics,0.34006928406466513
1146
- mistral_22b_v0.1,0.3394919168591224
1147
- llama_2_7b_chat_afr_200step_merged,0.3389145496535797
1148
- openhermes_7b,0.33833718244803695
1149
- llama_2_7b_chat_afr_200step_v2,0.3377598152424942
1150
- llama_2_7b_chat_afr_441step_flan_v2,0.3371824480369515
1151
- llama_2_7b_chat_afr_300step_flan_v2,0.33602771362586603
1152
- llama_2_7b_chat_afr_200step_flan_v2,0.33602771362586603
1153
- hope_for_7b_1.1v,0.33545034642032334
1154
- llama_2_7b_chat_afr_100step_v2,0.3348729792147806
1155
- wizardvicuna2_13b,0.33429561200923785
1156
- llama2_7b_openorca_mc_v1,0.33371824480369516
1157
- llama_2_7b_chat_afr_100step_flan_v2,0.3331408775981524
1158
- llama_2_7b_chat_afr_200step_flan,0.3325635103926097
1159
- llama_2_7b_chat_afr_100step_flan,0.331986143187067
1160
- llama_2_7b_chat,0.33140877598152424
1161
- cria_llama2_7b_v1.3,0.33083140877598155
1162
- openbuddy_zen_3b_v21.2_32k,0.3302540415704388
1163
- llama_2_7b_chat_10_sparsity,0.32967667436489606
1164
- llama_2_7b_chat_10_attention_sparsity,0.32909930715935337
1165
- mpt_30b,0.3285219399538106
1166
- vicuna_7b_v1.3_attention_sparsity_10,0.3273672055427252
1167
- fusellm_7b,0.3273672055427252
1168
- archangel_sft_kto_llama13b,0.32678983833718245
1169
- starling_7b,0.3262124711316397
1170
- llama_13b,0.32505773672055427
1171
- adelie_sft,0.32505773672055427
1172
- airoboros_l2_7b_2.2.1,0.3244803695150115
1173
- telugu_llama2_7b_v0_instruct,0.32390300230946883
1174
- flan_llama_7b_2_llama2_7b_flash_868_full_model,0.3233256351039261
1175
- llama_2_7b_chat_20_attention_sparsity,0.32274826789838335
1176
- vicuna_7b_v1.3_attention_sparsity_20,0.32217090069284066
1177
- mistral_7b_instruct_v0.2_sparsity_20,0.3210161662817552
1178
- llama_2_7b_chat_20_sparsity,0.3210161662817552
1179
- llama_2_7b_chat_guanaco,0.3204387990762125
1180
- llama2_7b_openorca_mc_v2_dpo,0.31986143187066973
1181
- llama_2_7b_chat_guanaco_freeze_embed_tokens_q_v_proj,0.31928406466512704
1182
- rocket_3b,0.3187066974595843
1183
- elyza_japanese_llama_2_7b_instruct,0.31755196304849886
1184
- llama_2_peanutbutter_v18_b_7b,0.31755196304849886
1185
- llama_2_7b_chat_30_attention_sparsity,0.3169745958429561
1186
- llama_2_peanutbutter_v10_7b,0.3163972286374134
1187
- llama_2_7b_chat_guanaco_freeze_embed_tokens_q_v_proj_lora,0.3158198614318707
1188
- towerinstruct_7b_v0.1,0.31524249422632794
1189
- llama_2_7b,0.3146651270207852
1190
- vicuna_7b_v1.3_attention_sparsity_30,0.3140877598152425
1191
- helpingai_3b,0.31351039260969976
1192
- tora_code_34b_v1.0,0.312933025404157
1193
- qwen1.5_1.8b,0.3123556581986143
1194
- llama_2_7b_guanaco_instruct_sharded,0.3117782909930716
1195
- chinese_alpaca_2_7b,0.3112009237875289
1196
- mistral_7b_instruct_v0.2_sparsity_30,0.31062355658198615
1197
- cria_llama2_7b_v1.3_peft,0.3100461893764434
1198
- qwen_1_8b_llamafied,0.3094688221709007
1199
- deepseek_moe_16b_base,0.30889145496535797
1200
- chinese_alpaca_2_7b_rlhf,0.3083140877598152
1201
- stablelm_zephyr_3b,0.30773672055427254
1202
- odia_llama2_7b_base,0.3071593533487298
1203
- youri_7b_chat,0.30658198614318705
1204
- llama_2_7b_chat_flan2022_1.2m,0.30600461893764436
1205
- llama_2_7b_eli5_cleaned_1024_qlora_merged,0.30484988452655887
1206
- tora_7b_v1.0,0.30484988452655887
1207
- qwen1.5_1.8b_chat,0.3042725173210162
1208
- openhermes_qwen1.5_1.8b,0.30369515011547343
1209
- mhm_7b_v1.3_dpo_1,0.3031177829099307
1210
- mhm_7b_v1.3,0.302540415704388
1211
- llama_2_7b_eli5_cleaned_wiki65k_1024_qlora_merged,0.30196304849884525
1212
- deita_qwen_1_8b,0.3008083140877598
1213
- deita_1_8b,0.3008083140877598
1214
- leo_hessianai_7b_chat,0.3002309468822171
1215
- llama_2_7b_chat_30_sparsity,0.2996535796766744
1216
- llama_2_peanutbutter_v18_a_7b,0.29907621247113164
1217
- llama_2_7b_32k_instruct,0.2984988452655889
1218
- quan_1.8b_base,0.29734411085450346
1219
- llama_7b_sft_qlora_eli5_wiki_dpo_ds_rm_top_2_1024_r_64_alpha_16,0.29734411085450346
1220
- llama_7b_sft_ds_wiki65k_1024_r_64_alpha_16_merged,0.2967667436489607
1221
- orca_2.0_tau_1.8b,0.29618937644341803
1222
- stablelm_3b_4e1t,0.2956120092378753
1223
- stablelm_base_alpha_7b_v2,0.29503464203233254
1224
- neuralreyna_mini_1.8b_v0.2,0.29445727482678985
1225
- qwen_1_8b_everythinglm,0.2938799076212471
1226
- hercules_mini_1.8b,0.29330254041570436
1227
- leo_hessianai_7b_chat_bilingual,0.29272517321016167
1228
- qwen_1_8b_chat_llama,0.2921478060046189
1229
- truthfulqwen1.5_1.8b,0.29157043879907624
1230
- llama_v2_7b_32kc_security,0.2909930715935335
1231
- openllama_7b_icl,0.29041570438799075
1232
- palmyra_med_20b,0.28983833718244806
1233
- neuralreyna_mini_1.8b_v0.3,0.2892609699769053
1234
- llama_2_7b_alpaca_gpt4,0.28868360277136257
1235
- quan_1.8b_chat,0.2881062355658199
1236
- everyone_coder_33b_base,0.28752886836027713
1237
- llama_2_7b_gptq,0.2869515011547344
1238
- sailor_4b_chat,0.2863741339491917
1239
- sambalingo_thai_chat,0.28579676674364896
1240
- quyen_mini_v0.1,0.2852193995381062
1241
- phi_1_5,0.2846420323325635
1242
- open_llama_13b,0.2840646651270208
1243
- galpaca_30b_miniorca,0.2834872979214781
1244
- asclepius_llama2_7b,0.2823325635103926
1245
- kollama2_7b_v2,0.2823325635103926
1246
- llama_2_7b_open_platypus,0.2817551963048499
1247
- speechless_codellama_orca_13b,0.28117782909930716
1248
- minimerlin_3b_v0.1,0.2806004618937644
1249
- gemma_2b_zephyr_dpo,0.28002309468822173
1250
- lima2_7b,0.279445727482679
1251
- zephyr_phi_1_5_sft_qlora,0.27886836027713624
1252
- fialka_7b_v3,0.2777136258660508
1253
- smartqwen1.5_1.8b_orpo_v1,0.2777136258660508
1254
- mistral_megamerge_dare_7b,0.27713625866050806
1255
- neural_chat_mini_v2.2_1.8b,0.27655889145496537
1256
- gowizardlm,0.2759815242494226
1257
- chinese_alpaca_2_7b_16k,0.2754041570438799
1258
- openllama_7b_base,0.27424942263279445
1259
- speechless_codellama_platypus_13b,0.27424942263279445
1260
- phi_openllm_lb_test,0.273094688221709
1261
- mpt_7b_8k,0.273094688221709
1262
- llama_2_7b_flan2022_1.2m,0.27251732101616627
1263
- mpt_7b_8k_instruct,0.2719399538106236
1264
- stablelm_2_zephyr_1_6b,0.27136258660508084
1265
- zephyr_2b_gemma_sft_qlora,0.2707852193995381
1266
- v1,0.2702078521939954
1267
- remask_3b,0.26963048498845266
1268
- gemma_2b,0.2690531177829099
1269
- stablelm_2_1_6b_chat,0.2684757505773672
1270
- open_llama_7b_v2,0.2678983833718245
1271
- starcoder2_7b,0.26732101616628173
1272
- openhermes_phi_1_5_sft_qlora,0.26674364896073904
1273
- recurrentgemma_2b_it,0.2661662817551963
1274
- gaja_v1.00,0.26558891454965355
1275
- gaja_v2.00_dpo,0.26501154734411086
1276
- samantha_1.11_7b,0.2644341801385681
1277
- zephyr_danube2_sft_qlora,0.2632794457274827
1278
- openhermes_danube2_sft_qlora,0.2632794457274827
1279
- openthaigpt_1.0.0_alpha_7b_chat_ckpt,0.26270207852193994
1280
- phi_1_5_chat_32k,0.26212471131639725
1281
- calm2_7b_chat_dpo_experimental,0.2615473441108545
1282
- codellama34b_instruct_fp16,0.2603926096997691
1283
- codellama34b_instruct,0.2603926096997691
1284
- open_llama3b_v2_instruct,0.25981524249422633
1285
- openhermes_2b_gemma_sft_qlora,0.2592378752886836
1286
- ex_llm_e1,0.2586605080831409
1287
- deita_500m,0.25808314087759815
1288
- calm2_7b_chat,0.2575057736720554
1289
- qwen1.5_0.5b,0.2569284064665127
1290
- nxcode_cq_7b_orpo,0.25635103926096997
1291
- deepseek_coder_6.7b_instruct,0.2557736720554272
1292
- sailor_4b,0.25519630484988454
1293
- stablelm_2_1_6b,0.2546189376443418
1294
- codellama_13b_instruct,0.2540415704387991
1295
- codellama_13b_instruct_fp16,0.25346420323325636
1296
- wizardcoder_python_13b_lora,0.2528868360277136
1297
- starcoder2_3b,0.2523094688221709
1298
- sappha_2b_v3,0.2517321016166282
1299
- coven_tiny_1.1b_32k_orpo_alpha,0.25115473441108543
1300
- gemma_2b_orpo,0.25057736720554274
1301
- nusantara_4b_indo_chat,0.24942263279445728
1302
- deepseek_coder_6.7b_base,0.24942263279445728
1303
- sailor_1.8b_chat,0.24884526558891454
1304
- gemma_2b_tamil,0.24826789838337182
1305
- neurona_2b,0.2476905311778291
1306
- h2o_danube2_1.8b_chat,0.2471131639722864
1307
- gemma_2b_nlaf_v0,0.24653579676674364
1308
- phi_gemma_nlaf_v0,0.24595842956120093
1309
- gemma_2b_it_nlai_p1,0.2453810623556582
1310
- gemma_2b_it_sp_test,0.24307159353348728
1311
- gemma_2b_it_sp_test1,0.24307159353348728
1312
- openhermes_gemma_2b,0.24307159353348728
1313
- gemma_2b_it_sp_test_openherms_step500,0.24307159353348728
1314
- gemma_nlaf_v1,0.24249422632794457
1315
- gemma_2b_openhermes,0.24191685912240185
1316
- phi_gemma_nlaf_v1,0.2407621247113164
1317
- gemma_2b_it_nlai_v0,0.2407621247113164
1318
- baize_healthcare_lora_7b,0.24018475750577367
1319
- tora_code_13b_v1.0,0.23960739030023095
1320
- cross_lingual_epoch2,0.2390300230946882
1321
- llama_7b,0.2384526558891455
1322
- llama_base_7b,0.23787528868360278
1323
- gzdx_1.1b,0.23729792147806006
1324
- codellama_13b_oasst_sft_v10,0.23672055427251731
1325
- palmyra_20b_chat,0.2361431870669746
1326
- gpt_sw3_40b,0.23556581986143188
1327
- codellama34b_python,0.23498845265588914
1328
- recurrentgemma_2b,0.23441108545034642
1329
- codellama_7b_instruct,0.2338337182448037
1330
- deacon_1_8b,0.23325635103926096
1331
- tau_0.5b_instruct_dpop,0.23267898383371824
1332
- qwen1.5_0.5b_chat,0.23210161662817552
1333
- qwen_orpo_v1,0.2315242494226328
1334
- test_qwen1.5_0.5b,0.23094688221709006
1335
- dpo_qwen1.5_0.5b_chat_alignment_handbook,0.23036951501154734
1336
- h2o_danube_1.8b_chat,0.22979214780600463
1337
- ultra0,0.22921478060046188
1338
- tora_code_7b_v1.0,0.22863741339491916
1339
- platypus_1_8b,0.22806004618937645
1340
- codellama34b_python_fp16,0.22748267898383373
1341
- codellama_13b,0.22690531177829099
1342
- poro_34b_gptq,0.22632794457274827
1343
- codegen_16b_nl,0.22575057736720555
1344
- starcoderbase,0.2251732101616628
1345
- gemma_2b_sft_telugu,0.2245958429561201
1346
- mc_model_v1,0.22401847575057737
1347
- gpt_sw3_6.7b_v2_instruct,0.22344110854503466
1348
- gpt_sw3_20b_instruct,0.2228637413394919
1349
- quark_464m_v0.2,0.2222863741339492
1350
- cypher_mini_1.8b,0.22170900692840648
1351
- codellama_7b,0.22113163972286373
1352
- dpo_qlora_qwen1.5_0.5b_chat_xtuner,0.22055427251732102
1353
- bloom,0.2199769053117783
1354
- mpt_7b,0.21939953810623555
1355
- dpo_qwen1.5_0.5b_chat,0.21882217090069284
1356
- open_llama_7b,0.21824480369515012
1357
- sailor_1.8b,0.2176674364896074
1358
- nusantara_1.8b_indo_chat,0.21709006928406466
1359
- nucleus_22b_token_500b,0.21651270207852194
1360
- gpt_sw3_6.7b_v2,0.21593533487297922
1361
- tinyllama_moe_chat,0.21535796766743648
1362
- falcon_7b_3epoch_norobots,0.21478060046189376
1363
- starcoder,0.21420323325635104
1364
- gollie_7b,0.21362586605080833
1365
- tinyllama_moe_chat_0.1,0.21304849884526558
1366
- llamacorn_1.1b_chat,0.21247113163972287
1367
- falcon_rw_1b_instruct_openorca,0.21189376443418015
1368
- open_llama3b_v2_chat,0.2113163972286374
1369
- minima_3b,0.2107390300230947
1370
- palmyra_large,0.21016166281755197
1371
- gpt_sw3_20b,0.2090069284064665
1372
- deepseek_coder_1.3b_instruct,0.2090069284064665
1373
- openbezoar_sft,0.2084295612009238
1374
- starcoderbase_7b,0.20785219399538107
1375
- codellama_7b_python,0.20727482678983833
1376
- instructpalmyra_20b,0.2066974595842956
1377
- tinyllama_1.1b_slimorca_function_calling_3t,0.2061200923787529
1378
- olmo_7b,0.20554272517321015
1379
- shearedplats_2.7b_v2_instruct_v0.1,0.20496535796766743
1380
- falcon_7b_norobots,0.20438799076212472
1381
- open_llama3b_code_instruct_0.1,0.203810623556582
1382
- falcon_7b,0.20265588914549654
1383
- xglm_7.5b,0.20265588914549654
1384
- dociprollm_7b,0.20207852193995382
1385
- redpajama_incite_7b_base,0.20092378752886836
1386
- redpajama_incite_base_7b_v0.1,0.20092378752886836
1387
- openhermes_tinyllama_sft_qlora,0.20034642032332564
1388
- shearedplats_2.7b_v2,0.1997690531177829
1389
- walter_llama_1b,0.19919168591224018
1390
- starcoderbase_3b,0.19861431870669746
1391
- dolphin_2.6_mistral_7b_dpo_5.93b,0.19803695150115475
1392
- mt7bi_wizard_3_alpha_dpo,0.197459584295612
1393
- zephyr_1b_olmo_sft_qlora,0.19688221709006928
1394
- aira_2_355m,0.19630484988452657
1395
- wizardvicuna_open_llama3b_v2,0.1951501154734411
1396
- codellama_13b_python,0.1951501154734411
1397
- palmyra_base,0.1945727482678984
1398
- deacon_3b,0.19341801385681293
1399
- test_22b,0.19341801385681293
1400
- openllama3b_evolinstruct_lora_merged,0.1922632794457275
1401
- open_llama3b_v2,0.1922632794457275
1402
- rho_math_1b_v0.1,0.19168591224018475
1403
- redpajama_incite_base_3b_v1,0.19110854503464203
1404
- hf_checkpoint2_01052024,0.18995381062355657
1405
- numfalm_3b,0.18995381062355657
1406
- lamini_neo_1.3b_mental_health_lora,0.18879907621247113
1407
- zephyr_danube_sft_qlora,0.18879907621247113
1408
- opt_66b,0.18822170900692842
1409
- mptk_1b,0.18764434180138567
1410
- open_llama3b,0.18706697459584296
1411
- gpt2_platypus_camel_physics,0.18533487297921478
1412
- openbezoar_hh_rlhf_dpo,0.18533487297921478
1413
- gpt2_camel_physics_platypus,0.18533487297921478
1414
- nusantara_0.8b_indo_chat,0.18475750577367206
1415
- tinyllama_1.1b_intermediate_step_1431k_3t_laser_dpo,0.18418013856812934
1416
- bloom_1b1_rlhf,0.1836027713625866
1417
- stellarx_4b_v0,0.18244803695150116
1418
- csg_wukong_1b_chat_v0.1,0.18244803695150116
1419
- amber,0.1812933025404157
1420
- minueza_32m_deita,0.1812933025404157
1421
- cerebras_gpt_256m,0.18071593533487298
1422
- mistral_7b_dpo_open_orca_flan_50k_synthetic_5_models,0.18013856812933027
1423
- gemma_ko_1.1_2b_it,0.1784064665127021
1424
- gpt_2_xl_camel_ai_physics,0.1784064665127021
1425
- tiny_starcoder_py,0.1784064665127021
1426
- pythia_2.8b_deduped,0.1766743648960739
1427
- gpt_j_6b,0.1766743648960739
1428
- tinyllama_1.1b_step_50k_105b,0.1766743648960739
1429
- pythia_12b,0.17609699769053117
1430
- sailor_0.5b_chat,0.17551963048498845
1431
- orca_2_7b_f16,0.17494226327944573
1432
- cosmo_1b,0.17436489607390301
1433
- starcoderbase_1b,0.17378752886836027
1434
- weblab_10b_instruction_sft,0.17263279445727484
1435
- opt_30b,0.17263279445727484
1436
- sheared_pythia_160m,0.17147806004618937
1437
- flor_1.3b_xat,0.17147806004618937
1438
- black_goo_recipe_d,0.17032332563510394
1439
- polyglot_ko_12.8b,0.17032332563510394
1440
- cerebras_gpt_1.3b,0.1697459584295612
1441
- black_goo_recipe_c,0.16916859122401848
1442
- pythia_1.3b,0.16859122401847576
1443
- gpt2_xl,0.16801385681293302
1444
- 7b_redpajama_conditional_alpha,0.16685912240184758
1445
- chinese_alpaca_2_1.3b_rlhf,0.16685912240184758
1446
- tinyllama,0.16628175519630484
1447
- pythia_6.9b_deduped,0.16570438799076212
1448
- tinyopenhermes_1.1b_4k,0.16397228637413394
1449
- gpt_neo_2.7b,0.16397228637413394
1450
- zephyr_220m_sft_full,0.16397228637413394
1451
- llongma_3b_lima,0.1628175519630485
1452
- zephyr_220m_dpo_full,0.1628175519630485
1453
- gpt2_chatbot,0.16224018475750576
1454
- gpt2_guanaco_dolly_platypus,0.16166281755196305
1455
- flyingllama_v2,0.16108545034642033
1456
- fialka_13b_v3,0.1605080831408776
1457
- gpt2_large_conversational,0.15993071593533487
1458
- olmo_1b,0.15935334872979215
1459
- weblab_10b,0.15877598152424943
1460
- tinyllama_1.1b_intermediate_step_240k_503b,0.1581986143187067
1461
- bloom_7b1,0.15762124711316397
1462
- tinywand_dpo,0.1564665127020785
1463
- fbopt_350m_8bit,0.1564665127020785
1464
- stablelm_base_alpha_7b,0.1558891454965358
1465
- gpt2_open_platypus,0.15531177829099307
1466
- smol_llama_220m_openhermes,0.1535796766743649
1467
- llama2_xs_460m_experimental,0.1535796766743649
1468
- gpt_sw3_1.3b_instruct,0.1535796766743649
1469
- gpt2_platypus_dolly_guanaco,0.15242494226327943
1470
- knowledgeninja_litellama_460mx6moe_1t,0.15242494226327943
1471
- aeonium_v1_baseweb_1b,0.15184757505773672
1472
- gpt_sw3_1.3b,0.15069284064665128
1473
- llama_160m_chat_v1,0.15069284064665128
1474
- tinyllama_1.1b_chat_v0.3_platypus,0.15011547344110854
1475
- rwkv_4_14b_pile,0.1489607390300231
1476
- evaloric_1.1b_test,0.1489607390300231
1477
- smol_llama_220m_open_instruct,0.14780600461893764
1478
- tinyllama_frankenmerge,0.14780600461893764
1479
- mixtral_gqa_400m_v2,0.14665127020785218
1480
- redpajama_incite_chat_3b_v1_rl_lora_8bit_test1,0.14665127020785218
1481
- minueza_32m_ultrachat,0.14607390300230946
1482
- gpt2_large,0.14491916859122403
1483
- minueza_32mx2_chat,0.14491916859122403
1484
- tinymistral_248m_sft_v4,0.14376443418013857
1485
- tinyllama_1.1b_intermediate_step_1431k_3t,0.14376443418013857
1486
- opt_350m,0.1420323325635104
1487
- opt_125m,0.1420323325635104
1488
- healix_3b,0.1420323325635104
1489
- gpt_sw3_6.7b,0.14145496535796767
1490
- pythia_410m_deduped,0.14087759815242495
1491
- tinywand_sft,0.1403002309468822
1492
- gpt_neo_125m,0.1397228637413395
1493
- litellama_460m_1t,0.13856812933025403
1494
- rwkv_raven_1b5,0.13856812933025403
1495
- h2o_danube_1.8b_base,0.1379907621247113
1496
- codegen_6b_nl,0.13568129330254042
1497
- tinydolphin_2.8.2_1.1b_laser,0.13568129330254042
1498
- gpt_sw3_356m,0.13568129330254042
1499
- cerebras_gpt_6.7b,0.13568129330254042
1500
- cerebras_gpt_13b,0.1351039260969977
1501
- pythia_70m,0.13452655889145496
1502
- test_model,0.13279445727482678
1503
- smol_llama_4x220m_moe,0.13279445727482678
1504
- chinese_alpaca_2_1.3b,0.13279445727482678
1505
- pythia_2.7b,0.13163972286374134
1506
- gpt2_test,0.13163972286374134
1507
- zephyr_tinyllama_sft_qlora,0.13048498845265588
1508
- smol_llama_220m_gqa,0.13048498845265588
1509
- falcon_7b_instruct,0.12990762124711316
1510
- algae_550m_base,0.1287528868360277
1511
- gpt2,0.1287528868360277
1512
- tinynaughtyllama_v1.0,0.12759815242494227
1513
- gpt_2_slimorcadeduped_airoboros_3.1_metamathqa_sft_124m,0.12759815242494227
1514
- gpt2_dolly,0.12702078521939955
1515
- pythia_1.4b,0.1264434180138568
1516
- zephyr_tiny_dpo_qlora,0.1258660508083141
1517
- tinyllama_chat_sft,0.12471131639722864
1518
- rwkv_4_1b5_pile,0.12471131639722864
1519
- numfa_v2_1b,0.12240184757505773
1520
- phind_codellama34b_v2,0.12240184757505773
1521
- gptneo350m_instruct_sft,0.12240184757505773
1522
- numfalm_v2_1b,0.12240184757505773
1523
- minueza_32m_chat,0.12124711316397228
1524
- black_goo_recipe_a,0.12124711316397228
1525
- csg_wukong_1b_orpo_bf16,0.12066974595842957
1526
- mistral_3_from_mixtral_8x7b_v0.1,0.1195150115473441
1527
- tinyllama_1.1b_1.5t_openorca_alpha,0.1195150115473441
1528
- croissantllmbase,0.11893764434180139
1529
- codegen_6b_multi,0.11836027713625866
1530
- mixnueza_6x32m_moe,0.11778290993071594
1531
- shearedllama_1.3b_fft_test1,0.11662817551963048
1532
- minillama_1.8b_chat_v0.1,0.11662817551963048
1533
- tmm_1b,0.11547344110854503
1534
- black_goo_recipe_b,0.11547344110854503
1535
- openhermes_1b_olmo_sft_qlora,0.11489607390300231
1536
- boomer_1b,0.11374133949191687
1537
- ablation_model_fineweb_v1,0.11374133949191687
1538
- init_model,0.11316397228637413
1539
- pythia_12b_deduped,0.1125866050808314
1540
- sailor_0.5b,0.11200923787528869
1541
- tinydolphin_2.8_1.1b,0.11143187066974596
1542
- pythia_1.4b_deduped,0.11085450346420324
1543
- stellarx_4b_v0.2,0.10912240184757506
1544
- megachat,0.10912240184757506
1545
- codeparrot,0.10912240184757506
1546
- microscopic_mistral_87k_steps,0.10854503464203233
1547
- tinyllama_1.1b_layla_v4,0.10739030023094688
1548
- gpt_sw3_356m_instruct,0.10739030023094688
1549
- gpt_2_large_115k_steps,0.10623556581986143
1550
- phigrange_dpo,0.10623556581986143
1551
- cerebras_gpt_111m,0.10508083140877598
1552
- 42dot_llm_sft_1.3b,0.10508083140877598
1553
- mindllm,0.10450346420323325
1554
- tiny_vicuna_1b,0.1033487297921478
1555
- mistral_6_from_mixtral_8x7b_v0.1,0.1033487297921478
1556
- speechless_codellama_orca_airoboros_13b_0.10e,0.10046189376443418
1557
- opt_2.7b,0.10046189376443418
1558
- stablelm_base_alpha_3b,0.10046189376443418
1559
- xglm_4.5b,0.10046189376443418
1560
- gpt2_xl_lima,0.10046189376443418
1561
- 3b_redpajama_conditional_alpha,0.09930715935334873
1562
- tinyultra_4x1.1b_base_alpha,0.09930715935334873
1563
- fialka_13b_v3.1,0.098729792147806
1564
- internlm_20b_llamafied,0.09757505773672055
1565
- dopeyshearedplats_1.3b_v1,0.09757505773672055
1566
- bilingual_gpt_neox_4b_8k,0.09699769053117784
1567
- nanollama_gqa_l10_a32_kv8_v13_ki,0.09584295612009237
1568
- babyllama_v0.6,0.09584295612009237
1569
- speechless_codellama_orca_platypus_13b_0.10e,0.09468822170900693
1570
- evaloric_1.1b,0.09468822170900693
1571
- open_llama3b_instruct_v_0.2,0.09353348729792148
1572
- nano_phi_115m_v0.1,0.09353348729792148
1573
- csg_wukong_1b,0.0918013856812933
1574
- llama3,0.0918013856812933
1575
- 774m_03_09_2024,0.0918013856812933
1576
- smartyplats_3b_v1,0.09006928406466513
1577
- tinyllama_1.1b_1t_openorca,0.09006928406466513
1578
- tinydolphin_2.8.1_1.1b,0.09006928406466513
1579
- mistral_8_from_mixtral_8x7b_v0.1,0.0894919168591224
1580
- verysmol_llama_v11_kix2,0.08775981524249422
1581
- falcon_rw_1b,0.08775981524249422
1582
- mixsmol_4x400m_v0.1_epoch1,0.08775981524249422
1583
- mixsmol_4x400m_v0.1_epoch2,0.08602771362586605
1584
- pythia_70m_deduped,0.08602771362586605
1585
- falcon_1b_t_sft,0.08602771362586605
1586
- pile_7b_250b_tokens,0.08545034642032333
1587
- open_calm_large,0.0848729792147806
1588
- gzdx,0.08429561200923788
1589
- llama_68m_chat_v1,0.08140877598152425
1590
- xglm_564m,0.08140877598152425
1591
- tinymistral_248m_instruct,0.08140877598152425
1592
- tinyllama_1.1b_orca_v1.0,0.08140877598152425
1593
- zephyr_smol_llama_100m_dpo_full,0.08140877598152425
1594
- mgpt,0.0802540415704388
1595
- cerebras_gpt_2.7b,0.0802540415704388
1596
- nano_mistral,0.07967667436489607
1597
- opt_flan_iml_6.7b,0.07852193995381063
1598
- mistral_7_from_mixtral_8x7b_v0.1,0.07852193995381063
1599
- aira_2_774m,0.07736720554272518
1600
- mistral_5_from_mixtral_8x7b_v0.1,0.07736720554272518
1601
- vortex_3b_v2,0.07621247113163972
1602
- fialka_13b_v4,0.07621247113163972
1603
- model_a_48.5m,0.07505773672055427
1604
- openhermes_danube_sft_qlora,0.07505773672055427
1605
- smolllamix_8x101m_take2,0.07448036951501155
1606
- tinyllama_1.1b_chat_v1.0_intel_dpo,0.07390300230946882
1607
- nanofialka_v1,0.07332563510392609
1608
- gpt_neox_20b,0.07217090069284064
1609
- tinyllama_1.1b_intermediate_step_480k_1t,0.07217090069284064
1610
- merge_dolly_v2_3b_dpo_test,0.06986143187066975
1611
- pythia_31m_simplepile_lite_2048_scratch_2e,0.06986143187066975
1612
- tinystories_3m,0.06986143187066975
1613
- bulgakovlm_3b,0.06986143187066975
1614
- pythia_31m,0.0687066974595843
1615
- gpt_bigcode_santacoder,0.0687066974595843
1616
- rwkv_4_7b_pile,0.06812933025404157
1617
- pythia_160m,0.06755196304849885
1618
- smol_llama_101m_chat_v1,0.06697459584295612
1619
- idus,0.06639722863741339
1620
- opt_13b,0.06581986143187067
1621
- deacon_1b,0.06466512702078522
1622
- koalpaca_korwkv_6b,0.06466512702078522
1623
- rwkv_raven_3b,0.06408775981524249
1624
- pythia_160m_deduped,0.06293302540415704
1625
- aira_2_1b1,0.06293302540415704
1626
- rwkv_4_430m_pile,0.06235565819861432
1627
- mistral_4_from_mixtral_8x7b_v0.1,0.061200923787528866
1628
- nusantara_2.7b_indo_chat,0.061200923787528866
1629
- gpt_neo_1.3b,0.06062355658198614
1630
- csg_wukong_1b_sft_bf16,0.06004618937644342
1631
- crow_1b,0.05889145496535797
1632
- minueza_32m_base,0.05889145496535797
1633
- gpt2_final,0.057736720554272515
1634
- dpo_miniguanaco_1.5t,0.057736720554272515
1635
- shearedplats_1.3b_v1,0.05715935334872979
1636
- puli_gptrio,0.05658198614318707
1637
- csg_wukong_1b_sft_dpo_bf16,0.05600461893764434
1638
- smolllamix_8x101m,0.05484988452655889
1639
- korwkv_6b,0.05484988452655889
1640
- mpt_125m_c4,0.054272517321016164
1641
- rwkv_4_3b_pile,0.05369515011547344
1642
- llama_pile_350b,0.05254041570438799
1643
- mistral_1_from_mixtral_8x7b_v0.1,0.05254041570438799
1644
- pythia_6.7b,0.05138568129330254
1645
- healix_1.1b_v1_chat_ddpo,0.05138568129330254
1646
- zyte_1b,0.050808314087759814
1647
- llama3_orpo_v1_merged_16bit,0.05023094688221709
1648
- walter_falcon_1b,0.049653579676674366
1649
- opt_6.7b,0.04849884526558892
1650
- tinystories_1m,0.04849884526558892
1651
- pythia_31m_chat_v1,0.04734411085450346
1652
- dopeyplats_1.1b_2t_v1,0.04734411085450346
1653
- croissantcool_v0.2,0.04676674364896074
1654
- gpt_sw3_126m,0.046189376443418015
1655
- falcon_rw_1b_chat,0.04503464203233257
1656
- tiny_llama3_7b,0.04503464203233257
1657
- gpt3_finnish_small,0.044457274826789836
1658
- pythia_1b_spin_iter1,0.04387990762124711
1659
- tinymistral_248m_sft_v3,0.04330254041570439
1660
- decicoder_1b,0.042725173210161664
1661
- megatron_gpt2_345m,0.04157043879907621
1662
- smartyplats_3b_v2,0.04157043879907621
1663
- llama39m,0.040993071593533485
1664
- tinymix,0.03983833718244804
1665
- pythia_1b_deduped,0.03983833718244804
1666
- llama_160m,0.03926096997690531
1667
- pythia_1b_dpo,0.03810623556581986
1668
- smol_llama_101m_gqa,0.03810623556581986
1669
- dpo_test_hermes_open_llama3b,0.037528868360277134
1670
- mistral_2_from_mixtral_8x7b_v0.1,0.036374133949191687
1671
- cutie,0.036374133949191687
1672
- numfa_3b_1epoch,0.03521939953810624
1673
- gpt_2_large_40k_steps,0.03521939953810624
1674
- pythia_1b_dpo_full,0.034064665127020784
1675
- tinymistral_6x248m_instruct,0.034064665127020784
1676
- gpt3_finnish_large,0.03348729792147806
1677
- smol_llama_81m_tied,0.032909930715935336
1678
- gpt_2_large_43k_steps,0.03233256351039261
1679
- bloom_560m_rlhf_v2,0.03175519630484989
1680
- tinymistral_248m_v2.5_instruct,0.03117782909930716
1681
- gpt_2_large_51k_steps,0.03002309468822171
1682
- gpt_2_large_20k_steps,0.03002309468822171
1683
- tinystories_33m,0.029445727482678985
1684
- taketwo,0.028868360277136258
1685
- gpt_sw3_126m_instruct,0.028290993071593534
1686
- gpt_2_large_32k_steps,0.02771362586605081
1687
- helpingai_110m,0.027136258660508082
1688
- rwkv_raven_7b,0.026558891454965358
1689
- bloom_560m_rlhf,0.025981524249422634
1690
- megatron_gpt2_345m_evol_instruct_v2,0.025404157043879907
1691
- ko_wand_136m,0.024826789838337183
1692
- tinystories_28m,0.02367205542725173
1693
- tinymistral_v2.5_minipile_guidelines_e1,0.02367205542725173
1694
- tinymistral_248m_chat_v2,0.023094688221709007
1695
- gpt3_finnish_13b,0.022517321016166283
1696
- tinymistral_248m_v2,0.021939953810623556
1697
- tinymistral_v2_test1,0.021362586605080832
1698
- tinystories_8m,0.02020785219399538
1699
- llama_2_3b,0.02020785219399538
1700
- rwkv_4_169m_pile,0.019630484988452657
1701
- llama2_13b_platypus_ckpt_1000,0.01905311778290993
1702
- facebook_opt_125m_qcqa_ub_6_best_for_q_loss,0.01674364896073903
1703
- facebook_opt_6.7b_qcqa_ub_16_best_for_q_loss,0.01674364896073903
1704
- tinymistral_248m,0.01674364896073903
1705
- tinymistral_248m_v2.5,0.01674364896073903
1706
- dough_instruct_base_001,0.016166281755196306
1707
- llm_jp_13b_instruct_full_jaster_v1.0,0.002886836027713626
1708
- griffin_c3t_8l_v0.02_fineweb,0.002886836027713626
1709
- mistral_7b_v0.1_signtensors_1_over_4,0.002886836027713626
1710
- llm_jp_13b_instruct_full_jaster_dolly_oasst_v1.0,0.002886836027713626
1711
- japanese_gpt_neox_3.6b,0.002886836027713626
1712
- mistral7b_test001,0.002886836027713626
1713
- griffin_llama3t_8l_v0.02_fineweb,0.002886836027713626
1714
- pythia_31m_ki_v1_2048_scratch,0.002886836027713626
1715
- opt_125m_gqa_ub_6_best_for_kv_cache,0.002886836027713626
1716
- facebook_opt_6.7b_qcqa_ub_16_best_for_kv_cache,0.002886836027713626
1717
- bilingual_gpt_neox_4b_instruction_ppo,0.002886836027713626
1718
- bilingual_gpt_neox_4b_instruction_sft,0.002886836027713626
1719
- wizardlm_30b_v1.0,0.002886836027713626
1720
- telugu_llama_7b_instruct_v0.1,0.002886836027713626
1721
- tamil_llama_7b_instruct_v0.2,0.002886836027713626
1722
- changpt_bart,0.002886836027713626
1723
- shisa_base_7b_v1,0.002886836027713626
1724
- malayalam_llama_7b_instruct_v0.1,0.002886836027713626
1725
- experiment_dpo_m7b2_3_merged,0.002886836027713626
1726
- facebook_opt_125m_qcqa_ub_6_best_for_kv_cache,0.002886836027713626
1727
- pythia_31m_simplewiki_scratch_bf16,0.002886836027713626
1728
- pythia_31m_simplewiki_2048,0.002886836027713626
1729
- facebook_opt_6.7b_gqa_ub_16_best_for_kv_cache,0.002886836027713626
1730
- pythia_31m_goodwiki_deduped_2048_scratch,0.0023094688221709007
1731
- bilingual_gpt_neox_4b,0.0017321016166281756
1732
- tinymistral_248m_chat_v1,0.0005773672055427252
1733
- momomerge_72b_v0.1,0.0005773672055427252
1734
- sf_72b_v1,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
cache/agreements_cache_1edd56d721757789836f081c38c15400.csv DELETED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_230b5a189df3af8cde801ce251b7b2ef.csv DELETED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_2d8c9f9c6d96807c68a9475184afcecb.csv DELETED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_9c0710fd06d230cc89e0f2f023e3058f.csv DELETED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_bffcfd24eb4a8fe1f6c8ac8a0c8c21d6.csv DELETED
The diff for this file is too large to render. See raw diff
 
cache/agreements_cache_f97e563eeda8c9bdc279f5b94b32606c.csv DELETED
The diff for this file is too large to render. See raw diff