2024_Leaderboard / data /params /text_generation.csv
sasha's picture
sasha HF staff
adding tasks and data
3fe7e68
raw
history blame
3.76 kB
,Model Family,# Params,Link,Size (GB),GPU Type,Process,Docker Process,Num GPUs,Notes,Unnamed: 9,parameters
0,OPT,125 M,facebook/opt-125m,0.25,Single_GPU,"[2024-07-19 13:43:32,389]",8612608.0,1.0,,,125239296
1,DistilGPT 2,88.2 M,distilbert/distilgpt2,0.353,Single_GPU,"[2024-07-19 20:32:39,848]",8612609.0,1.0,,,81912576
2,GPT 1,120 M,openai-community/openai-gpt,0.479,Single_GPU,"[2024-07-19 22:32:39,848]",8612611.0,1.0,,,116534784
3,GPT 2,137 M,openai-community/gpt2,0.548,Single_GPU,"[2024-07-22 16:48:45,521]",8612612.0,1.0,,,124439808
4,GPT 2,380 M,openai-community/gpt2-medium,1.5,Single_GPU,"[2024-07-22 19:35:01,598]",8612613.0,1.0,,,354823168
5,Phi 1,1.4 B,microsoft/phi-1,2.8,Single_GPU,2024-07-24 11:16:59,8612615.0,1.0,,,1313361920
6,Phi 1.5,1.4 B,microsoft/phi-1_5,2.8,Single_GPU,"[2024-07-26 12:29:22,310]",8612616.0,1.0,,,1313361920
7,GPT 2,812 M,openai-community/gpt2-large,3.2,Single_GPU,"[2024-07-24 11:28:42,290]",8612617.0,1.0,,,774030080
8,SmolLM,360 M,HuggingFaceTB/SmolLM-360M,1.4,Single_GPU,"[2024-07-25 13:45:47,257]",8612618.0,1.0,,,361821120
9,SmolLM,135 M,HuggingFaceTB/SmolLM-135M,0.538,Single_GPU,"[2024-07-25 23:45:47,257]",8612600.0,1.0,,,134515008
10,OPT,2.7 B,facebook/opt-2.7b,5.3,Single_GPU,,8612639.0,1.0,,,2651596800
11,Phi 2,2.7 B,microsoft/phi-2,5.564,Single_GPU,,8612640.0,1.0,,,2648560640
12,GPT 2,1.6 B,openai-community/gpt2-xl,6.4,Single_GPU,,8612675.0,1.0,,,1557611200
13,SmolLM,1.7 B,HuggingFaceTB/SmolLM-1.7B,6.8,Single_GPU,,8612644.0,1.0,,,1711376384
14,Gemma,2 B,google/gemma-2b,4.967,Single_GPU,,8612676.0,1.0,,,2506172416
15,LLaMa 2,7 B,meta-llama/Llama-2-7b-hf,13.5,Single_GPU,,8612678.0,1.0,,,6607343616
16,Starling,7.24 B,berkeley-nest/Starling-LM-7B-alpha,14.4,Single_GPU,,8612679.0,1.0,,,7110668288
17,Mistral-v0.3-8B,7B,mistralai/Mistral-7B-v0.1,14.4,Single_GPU,,8612681.0,1.0,,,7110660096
18,Falcon,7 B,tiiuae/falcon-7b,14.5,Single_GPU,,8612682.0,1.0,,,6921720704
19,Aya-23-8b,8B,CohereForAI/aya-23-8B,16.06,Single_GPU,,8612685.0,1.0,,,8028033024
20,LLaMa 3,8 B,meta-llama/Meta-Llama-3-8B,16.1,Single_GPU,,8612687.0,1.0,,,7504924672
21,Gemma,7 B,google/gemma-7b,17.1,Single_GPU,,8612721.0,1.0,,,8537680896
22,Llama 3.1,8B,meta-llama/Meta-Llama-3.1-8B,,Single_GPU,,8612690.0,1.0,,,0
23,Yi 1.5,9 B,01-ai/Yi-1.5-9B,,Single_GPU,,8612692.0,1.0,,,8567263232
24,Yi 1.5,6 B,01-ai/Yi-1.5-6B,,Single_GPU,,8612693.0,1.0,,,5798891520
25,LLaMa 2,13 B,meta-llama/Llama-2-13b-hf,26.0,Single_GPU,,8612694.0,1.0,,,12852024320
26,OLMo,7B,allenai/OLMo-1.7-7B-hf,27.6,Single_GPU,,8619238.0,1.0,,,6682050560
27,OLMo,1B,allenai/OLMo-1B-hf,,Single_GPU,,8612698.0,1.0,,,1176764416
28,Aya,13B,CohereForAI/aya-101,51.8,Multi_GPU,,8619572.0,1.0,text2text,,11896598528
29,DeepSeekv2,16B,deepseek-ai/DeepSeek-V2-Lite,,Multi_GPU,,8619241.0,,,,0
30,Aya 23,35 B,CohereForAI/aya-23-35B,69.5,Multi_GPU,,8619247.0,8.0,,,34980831232
31,Falcon,40 B,tiiuae/falcon-40b,83.6,Multi_GPU,,8619252.0,8.0,,,41303293952
32,Mistral,46.7 B,mistralai/Mixtral-8x7B-v0.1,93.6,Multi_GPU,,8619304.0,,,,46571720704
33,LLaMa 2,70 B,meta-llama/Llama-2-70b-hf,138.124,Multi_GPU,,8619350.0,,,,68714504192
34,LLaMa 3,70 B,meta-llama/Meta-Llama-3-70B,141.9,Multi_GPU,,8619388.0,,,,69503033344
35,Llama 3.1,70 B,meta-llama/Meta-Llama-3.1-70B,,Multi_GPU,,8619417.0,,,,0
36,Llama 3.1,405B,meta-llama/Meta-Llama-3.1-405B,,Multi_GPU,,8672796.0,,OOM,trying 2 nodes,0
37,Command-R,104 B,CohereForAI/c4ai-command-r-plus,,Multi_GPU,,8619473.0,,,,103810674688
38,Command-R,35 B,CohereForAI/c4ai-command-r-v01,,Multi_GPU,,8619487.0,,,,34980831232
39,Yi 1.5,34 B,01-ai/Yi-1.5-34B,,Multi_GPU,,8619507.0,,,,33930165248
40,DeepSeekv2,236 B,deepseek-ai/DeepSeek-V2,,Multi_GPU,,,," assert set(gpu_ids).issubset(
AssertionError: Unknown GPU ids [0, 1, 2, 3, 4, 5, 6, 7]",,0