Florian Leuerer committed on
Commit
ae17b07
1 Parent(s): fc5a400
Files changed (3) hide show
  1. data.csv +0 -0
  2. data_stats_langs.csv +6 -5
  3. model_stats.csv +1 -0
data.csv CHANGED
The diff for this file is too large to render. See raw diff
 
data_stats_langs.csv CHANGED
@@ -6,12 +6,12 @@ upstage_SOLAR-10.7B-Instruct-v1.0,upstage/SOLAR-10.7B-Instruct-v1.0 (Mistral),0.
6
  DRXD1000_Phoenix,DRXD1000/Phoenix (Mistral),0.4875727579736855,0.5238922380729938,0.8436213991769548
7
  openaccess-ai-collective_DPOpenHermes-7B,openaccess-ai-collective/DPOpenHermes-7B (Mistral),0.4808996941837862,0.6204995440653475,
8
  VAGOsolutions_SauerkrautLM-7b-HerO,VAGOsolutions/SauerkrautLM-7b-HerO (Mistral),0.4793394346045998,0.5973278911555183,0.9506172839506173
9
- malteos_hermeo-7b,malteos/hermeo-7b (Mistral),0.4789016907464211,0.5777652767503162,0.934156378600823
10
  fblgit_una-cybertron-7b-v2-bf16,fblgit/una-cybertron-7b-v2-bf16 (Mistral),0.4714702998712998,0.6280572487472983,
11
  aari1995_germeo-7b-awq,aari1995/germeo-7b-awq (),0.4701767724890486,0.5677674726911679,
12
  berkeley-nest_Starling-LM-7B-alpha,berkeley-nest/Starling-LM-7B-alpha (Mistral),0.4682092030538821,0.6082623478431886,
13
  openchat_openchat_3.5,openchat/openchat_3.5 (Mistral),0.4677697134012669,0.6093495408502738,0.9012345679012346
14
- mistralai_Mistral-7B-Instruct-v0.2,mistralai/Mistral-7B-Instruct-v0.2 (Mistral),0.4671287660155921,0.5974778867312014,0.4773662551440329
15
  teknium_OpenHermes-2.5-Mistral-7B,teknium/OpenHermes-2.5-Mistral-7B (Mistral),0.4648073216754412,0.6009262837808728,
16
  HuggingFaceH4_zephyr-7b-beta,HuggingFaceH4/zephyr-7b-beta (Mistral),0.4641427965971664,0.5990940441734774,0.7530864197530864
17
  VAGOsolutions_SauerkrautLM-7b-v1-mistral,VAGOsolutions/SauerkrautLM-7b-v1-mistral (Mistral),0.4582885390631627,0.5730988906371487,
@@ -27,18 +27,19 @@ microsoft_Orca-2-13b,microsoft/Orca-2-13b (Llama2),0.4304508877524478,0.56652606
27
  LeoLM_leo-hessianai-7b-chat,LeoLM/leo-hessianai-7b-chat (Llama2),0.4198959530774699,0.469927951589407,
28
  kaist-ai_prometheus-13b-v1.0,kaist-ai/prometheus-13b-v1.0 (Llama2),0.4137699872914333,0.5276183571587882,
29
  meta-llama_Llama-2-13b-chat-hf,meta-llama/Llama-2-13b-chat-hf (Llama2),0.4133328486084298,0.5331779969903168,
30
- Deci_DeciLM-7B-instruct,Deci/DeciLM-7B-instruct (Deci),0.4087346114484392,0.5746784325286699,0.5802469135802469
31
  LeoLM_leo-hessianai-7b-chat-bilingual,LeoLM/leo-hessianai-7b-chat-bilingual (Llama2),0.4058414394510105,0.4701378898025081,0.43621399176954734
32
  mistralai_Mistral-7B-Instruct-v0.1,mistralai/Mistral-7B-Instruct-v0.1 (Mistral),0.4012720986996964,0.5329324676998503,
33
- allenai_tulu-2-dpo-7b,allenai/tulu-2-dpo-7b (Llama2),0.3963844596307675,0.5442215865769193,0.7654320987654321
34
  Deci_DeciLM-7B,Deci/DeciLM-7B (Deci),0.3891524333700293,0.5632148707253728,
35
  microsoft_Orca-2-7b,microsoft/Orca-2-7b (Llama2),0.387631543457434,0.5275512116539839,
36
  Qwen_Qwen-7B,Qwen/Qwen-7B (Qwen),0.3854029046626822,0.5250934481726963,
37
  deepseek-ai_deepseek-llm-7b-chat,deepseek-ai/deepseek-llm-7b-chat (Deepseek),0.3805290423206953,0.5228634605739054,0.9176954732510288
38
  Qwen_Qwen-7B-Chat,Qwen/Qwen-7B-Chat (Qwen),0.379473202994899,0.501690371644847,0.8683127572016461
 
39
  lmsys_vicuna-7b-v1.5,lmsys/vicuna-7b-v1.5 (Llama2),0.3743686900229406,0.4930702792560562,0.6748971193415638
40
  LeoLM_leo-hessianai-7b,LeoLM/leo-hessianai-7b (Llama2),0.3714768830460835,0.4350647594408416,
41
- meta-llama_Llama-2-7b-chat-hf,meta-llama/Llama-2-7b-chat-hf (Llama2),0.3507914339624629,0.4932635613314786,0.18106995884773663
42
  deepseek-ai_deepseek-llm-7b-base,deepseek-ai/deepseek-llm-7b-base (Deepseek),0.3427809248139573,0.4823404844220252,
43
  meta-llama_Llama-2-7b-hf,meta-llama/Llama-2-7b-hf (Llama2),0.3426308784990838,0.4704191232019917,
44
  01-ai_Yi-34B-Chat-8bits,01-ai/Yi-34B-Chat-8bits (Yi),0.3310580204778157,0.5418088737201365,
 
6
  DRXD1000_Phoenix,DRXD1000/Phoenix (Mistral),0.4875727579736855,0.5238922380729938,0.8436213991769548
7
  openaccess-ai-collective_DPOpenHermes-7B,openaccess-ai-collective/DPOpenHermes-7B (Mistral),0.4808996941837862,0.6204995440653475,
8
  VAGOsolutions_SauerkrautLM-7b-HerO,VAGOsolutions/SauerkrautLM-7b-HerO (Mistral),0.4793394346045998,0.5973278911555183,0.9506172839506173
9
+ malteos_hermeo-7b,malteos/hermeo-7b (Mistral),0.4789016907464211,0.5777652767503162,0.9423868312757202
10
  fblgit_una-cybertron-7b-v2-bf16,fblgit/una-cybertron-7b-v2-bf16 (Mistral),0.4714702998712998,0.6280572487472983,
11
  aari1995_germeo-7b-awq,aari1995/germeo-7b-awq (),0.4701767724890486,0.5677674726911679,
12
  berkeley-nest_Starling-LM-7B-alpha,berkeley-nest/Starling-LM-7B-alpha (Mistral),0.4682092030538821,0.6082623478431886,
13
  openchat_openchat_3.5,openchat/openchat_3.5 (Mistral),0.4677697134012669,0.6093495408502738,0.9012345679012346
14
+ mistralai_Mistral-7B-Instruct-v0.2,mistralai/Mistral-7B-Instruct-v0.2 (Mistral),0.4671287660155921,0.5974778867312014,0.48148148148148145
15
  teknium_OpenHermes-2.5-Mistral-7B,teknium/OpenHermes-2.5-Mistral-7B (Mistral),0.4648073216754412,0.6009262837808728,
16
  HuggingFaceH4_zephyr-7b-beta,HuggingFaceH4/zephyr-7b-beta (Mistral),0.4641427965971664,0.5990940441734774,0.7530864197530864
17
  VAGOsolutions_SauerkrautLM-7b-v1-mistral,VAGOsolutions/SauerkrautLM-7b-v1-mistral (Mistral),0.4582885390631627,0.5730988906371487,
 
27
  LeoLM_leo-hessianai-7b-chat,LeoLM/leo-hessianai-7b-chat (Llama2),0.4198959530774699,0.469927951589407,
28
  kaist-ai_prometheus-13b-v1.0,kaist-ai/prometheus-13b-v1.0 (Llama2),0.4137699872914333,0.5276183571587882,
29
  meta-llama_Llama-2-13b-chat-hf,meta-llama/Llama-2-13b-chat-hf (Llama2),0.4133328486084298,0.5331779969903168,
30
+ Deci_DeciLM-7B-instruct,Deci/DeciLM-7B-instruct (Deci),0.4087346114484392,0.5746784325286699,0.5843621399176955
31
  LeoLM_leo-hessianai-7b-chat-bilingual,LeoLM/leo-hessianai-7b-chat-bilingual (Llama2),0.4058414394510105,0.4701378898025081,0.43621399176954734
32
  mistralai_Mistral-7B-Instruct-v0.1,mistralai/Mistral-7B-Instruct-v0.1 (Mistral),0.4012720986996964,0.5329324676998503,
33
+ allenai_tulu-2-dpo-7b,allenai/tulu-2-dpo-7b (Llama2),0.3963844596307675,0.5442215865769193,0.757201646090535
34
  Deci_DeciLM-7B,Deci/DeciLM-7B (Deci),0.3891524333700293,0.5632148707253728,
35
  microsoft_Orca-2-7b,microsoft/Orca-2-7b (Llama2),0.387631543457434,0.5275512116539839,
36
  Qwen_Qwen-7B,Qwen/Qwen-7B (Qwen),0.3854029046626822,0.5250934481726963,
37
  deepseek-ai_deepseek-llm-7b-chat,deepseek-ai/deepseek-llm-7b-chat (Deepseek),0.3805290423206953,0.5228634605739054,0.9176954732510288
38
  Qwen_Qwen-7B-Chat,Qwen/Qwen-7B-Chat (Qwen),0.379473202994899,0.501690371644847,0.8683127572016461
39
+ DiscoResearch_DiscoLM_German_7b_v1,DiscoResearch/DiscoLM_German_7b_v1 (Mistral),0.3747561539654366,0.4209023365214039,0.9259259259259259
40
  lmsys_vicuna-7b-v1.5,lmsys/vicuna-7b-v1.5 (Llama2),0.3743686900229406,0.4930702792560562,0.6748971193415638
41
  LeoLM_leo-hessianai-7b,LeoLM/leo-hessianai-7b (Llama2),0.3714768830460835,0.4350647594408416,
42
+ meta-llama_Llama-2-7b-chat-hf,meta-llama/Llama-2-7b-chat-hf (Llama2),0.3507914339624629,0.4932635613314786,0.18518518518518517
43
  deepseek-ai_deepseek-llm-7b-base,deepseek-ai/deepseek-llm-7b-base (Deepseek),0.3427809248139573,0.4823404844220252,
44
  meta-llama_Llama-2-7b-hf,meta-llama/Llama-2-7b-hf (Llama2),0.3426308784990838,0.4704191232019917,
45
  01-ai_Yi-34B-Chat-8bits,01-ai/Yi-34B-Chat-8bits (Yi),0.3310580204778157,0.5418088737201365,
model_stats.csv CHANGED
@@ -36,6 +36,7 @@ microsoft/Orca-2-7b (Llama2),0.387631543457434,0.5275512116539839,microsoft_Orca
36
  Qwen/Qwen-7B (Qwen),0.3854029046626822,0.5250934481726963,Qwen_Qwen-7B
37
  deepseek-ai/deepseek-llm-7b-chat (Deepseek),0.3805290423206953,0.5228634605739054,deepseek-ai_deepseek-llm-7b-chat
38
  Qwen/Qwen-7B-Chat (Qwen),0.37947320299489906,0.501690371644847,Qwen_Qwen-7B-Chat
 
39
  lmsys/vicuna-7b-v1.5 (Llama2),0.3743686900229406,0.4930702792560562,lmsys_vicuna-7b-v1.5
40
  LeoLM/leo-hessianai-7b (Llama2),0.37147688304608356,0.4350647594408416,LeoLM_leo-hessianai-7b
41
  meta-llama/Llama-2-7b-chat-hf (Llama2),0.35079143396246293,0.4932635613314786,meta-llama_Llama-2-7b-chat-hf
 
36
  Qwen/Qwen-7B (Qwen),0.3854029046626822,0.5250934481726963,Qwen_Qwen-7B
37
  deepseek-ai/deepseek-llm-7b-chat (Deepseek),0.3805290423206953,0.5228634605739054,deepseek-ai_deepseek-llm-7b-chat
38
  Qwen/Qwen-7B-Chat (Qwen),0.37947320299489906,0.501690371644847,Qwen_Qwen-7B-Chat
39
+ DiscoResearch/DiscoLM_German_7b_v1 (Mistral),0.37475615396543666,0.4209023365214039,DiscoResearch_DiscoLM_German_7b_v1
40
  lmsys/vicuna-7b-v1.5 (Llama2),0.3743686900229406,0.4930702792560562,lmsys_vicuna-7b-v1.5
41
  LeoLM/leo-hessianai-7b (Llama2),0.37147688304608356,0.4350647594408416,LeoLM_leo-hessianai-7b
42
  meta-llama/Llama-2-7b-chat-hf (Llama2),0.35079143396246293,0.4932635613314786,meta-llama_Llama-2-7b-chat-hf