2024_Leaderboard / data /params /text_generation.csv
sasha's picture
sasha HF staff
filling in missing values
fd31451
raw
history blame
3.4 kB
,Model Family,# Params,Link,Size (GB),GPU Type,Process,Docker Process,Num GPUs,Notes,Unnamed: 9,parameters
0,OPT,125 M,facebook/opt-125m,0.25,Single_GPU,"[2024-07-19 13:43:32,389]",8612608,1,,,125239296
1,DistilGPT 2,88.2 M,distilbert/distilgpt2,0.353,Single_GPU,"[2024-07-19 20:32:39,848]",8612609,1,,,81912576
2,GPT 1,120 M,openai-community/openai-gpt,0.479,Single_GPU,"[2024-07-19 22:32:39,848]",8612611,1,,,116534784
3,GPT 2,137 M,openai-community/gpt2,0.548,Single_GPU,"[2024-07-22 16:48:45,521]",8612612,1,,,124439808
4,GPT 2,380 M,openai-community/gpt2-medium,1.5,Single_GPU,"[2024-07-22 19:35:01,598]",8612613,1,,,354823168
5,Phi 1,1.4 B,microsoft/phi-1,2.8,Single_GPU,2024-07-24 11:16:59,8612615,1,,,1313361920
6,Phi 1.5,1.4 B,microsoft/phi-1_5,2.8,Single_GPU,"[2024-07-26 12:29:22,310]",8612616,1,,,1313361920
7,GPT 2,812 M,openai-community/gpt2-large,3.2,Single_GPU,"[2024-07-24 11:28:42,290]",8612617,1,,,774030080
8,SmolLM,360 M,HuggingFaceTB/SmolLM-360M,1.4,Single_GPU,"[2024-07-25 13:45:47,257]",8612618,1,,,361821120
9,SmolLM,135 M,HuggingFaceTB/SmolLM-135M,0.538,Single_GPU,"[2024-07-25 23:45:47,257]",8612600,1,,,134515008
10,OPT,2.7 B,facebook/opt-2.7b,5.3,Single_GPU,,8612639,1,,,2651596800
11,Phi 2,2.7 B,microsoft/phi-2,5.564,Single_GPU,,8612640,1,,,2648560640
12,GPT 2,1.6 B,openai-community/gpt2-xl,6.4,Single_GPU,,8612675,1,,,1557611200
13,SmolLM,1.7 B,HuggingFaceTB/SmolLM-1.7B,6.8,Single_GPU,,8612644,1,,,1711376384
14,Gemma,2 B,google/gemma-2b,4.967,Single_GPU,,8612676,1,,,2506172416
15,LLaMa 2,7 B,meta-llama/Llama-2-7b-hf,13.5,Single_GPU,,8612678,1,,,6607343616
16,Starling,7.24 B,berkeley-nest/Starling-LM-7B-alpha,14.4,Single_GPU,,8612679,1,,,7110668288
17,Mistral,7B,mistralai/Mistral-7B-v0.1,14.4,Single_GPU,,8612681,1,,,7110660096
18,Falcon,7 B,tiiuae/falcon-7b,14.5,Single_GPU,,8612682,1,,,6921720704
19,Aya 23,8B,CohereForAI/aya-23-8B,16.06,Single_GPU,,8612685,1,,,8028033024
20,LLaMa 3,8 B,meta-llama/Meta-Llama-3-8B,16.1,Single_GPU,,8612687,1,,,7504924672
21,Gemma,7 B,google/gemma-7b,17.1,Single_GPU,,8612721,1,,,8537680896
22,Llama 3.1,8B,meta-llama/Meta-Llama-3.1-8B,,Single_GPU,,8612690,1,,,8030000000
23,Yi 1.5,9 B,01-ai/Yi-1.5-9B,,Single_GPU,,8612692,1,,,8567263232
24,Yi 1.5,6 B,01-ai/Yi-1.5-6B,,Single_GPU,,8612693,1,,,5798891520
25,LLaMa 2,13 B,meta-llama/Llama-2-13b-hf,26,Single_GPU,,8612694,1,,,12852024320
26,OLMo,7B,allenai/OLMo-1.7-7B-hf,27.6,Single_GPU,,8619238,1,,,6682050560
27,OLMo,1B,allenai/OLMo-1B-hf,,Single_GPU,,8612698,1,,,1176764416
28,Aya,13B,CohereForAI/aya-101,51.8,Multi_GPU,,8619572,1,text2text,,11896598528
29,DeepSeekv2,16B,deepseek-ai/DeepSeek-V2-Lite,,Multi_GPU,,8619241,,,,15700000000
30,Aya 23,35 B,CohereForAI/aya-23-35B,69.5,Multi_GPU,,8619247,8,,,34980831232
31,Falcon,40 B,tiiuae/falcon-40b,83.6,Multi_GPU,,8619252,8,,,41303293952
32,Mistral,46.7 B,mistralai/Mixtral-8x7B-v0.1,93.6,Multi_GPU,,8619304,,,,46571720704
33,LLaMa 2,70 B,meta-llama/Llama-2-70b-hf,138.124,Multi_GPU,,8619350,,,,68714504192
34,LLaMa 3,70 B,meta-llama/Meta-Llama-3-70B,141.9,Multi_GPU,,8619388,,,,69503033344
35,Llama 3.1,70 B,meta-llama/Meta-Llama-3.1-70B,,Multi_GPU,,8619417,,,,69503033344
37,Command-R,104 B,CohereForAI/c4ai-command-r-plus,,Multi_GPU,,8619473,,,,103810674688
38,Command-R,35 B,CohereForAI/c4ai-command-r-v01,,Multi_GPU,,8619487,,,,34980831232
39,Yi 1.5,34 B,01-ai/Yi-1.5-34B,,Multi_GPU,,8619507,,,,33930165248