Zhiyu Wu committed on
Commit
332f235
1 Parent(s): f01c24a

Add RWKV (#19)

Browse files
data/A100_chat-concise_benchmark.csv CHANGED
@@ -1,7 +1,7 @@
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,25.50117012651914,258.85426460711886,10.063550845041279,1946.198744123579
3
  BAIR/koala-7b,32.92721737057136,247.0456682337139,7.462044263397255,1195.704790463391
4
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,64.47852685919943,209.4788448623237,2.9212886777848954,736.6553304231044
5
  FreedomIntelligence/phoenix-inst-chat-7b,54.276457252393016,233.51108126259234,4.103907452767313,1002.3285728676934
6
  camel-ai/CAMEL-13B-Combined-Data,26.30022114657458,282.4801880456682,10.72763999556464,2349.1830879784957
7
  databricks/dolly-v2-12b,24.809807917158277,143.01410342511753,5.488031835448774,1002.4862169241038
 
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,25.50117012651914,258.85426460711886,10.063550845041279,1946.198744123579
3
  BAIR/koala-7b,32.92721737057136,247.0456682337139,7.462044263397255,1195.704790463391
4
+ RWKV/rwkv-raven-7b,64.47852685919943,209.4788448623237,2.9212886777848954,736.6553304231044
5
  FreedomIntelligence/phoenix-inst-chat-7b,54.276457252393016,233.51108126259234,4.103907452767313,1002.3285728676934
6
  camel-ai/CAMEL-13B-Combined-Data,26.30022114657458,282.4801880456682,10.72763999556464,2349.1830879784957
7
  databricks/dolly-v2-12b,24.809807917158277,143.01410342511753,5.488031835448774,1002.4862169241038
data/A100_chat_benchmark.csv CHANGED
@@ -1,7 +1,7 @@
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,21.207721076321384,265.5732034922767,12.1433556952537,2144.8338435191445
3
  BAIR/koala-7b,26.5628207031951,261.0698455339154,9.620738416075923,1345.554839153794
4
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,61.52127877000437,214.78475486903963,3.0815914876914072,735.766777367353
5
  FreedomIntelligence/phoenix-inst-chat-7b,55.838321060384565,240.34419073203492,4.122390997297159,1030.8907246474148
6
  Neutralzz/BiLLa-7B-SFT,33.57049533371462,161.80826057756883,4.794732123814392,881.4395631296157
7
  OpenAssistant/oasst-sft-1-pythia-12b,25.404288065688412,259.58764271323037,9.929468848113123,2060.029685359295
 
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,21.207721076321384,265.5732034922767,12.1433556952537,2144.8338435191445
3
  BAIR/koala-7b,26.5628207031951,261.0698455339154,9.620738416075923,1345.554839153794
4
+ RWKV/rwkv-raven-7b,61.52127877000437,214.78475486903963,3.0815914876914072,735.766777367353
5
  FreedomIntelligence/phoenix-inst-chat-7b,55.838321060384565,240.34419073203492,4.122390997297159,1030.8907246474148
6
  Neutralzz/BiLLa-7B-SFT,33.57049533371462,161.80826057756883,4.794732123814392,881.4395631296157
7
  OpenAssistant/oasst-sft-1-pythia-12b,25.404288065688412,259.58764271323037,9.929468848113123,2060.029685359295
data/A100_instruct-concise_benchmark.csv CHANGED
@@ -3,7 +3,7 @@ metaai/llama-13B,23.078188347142518,114.53055742108798,4.394399051080669,930.421
3
  metaai/llama-7B,28.422054486839865,106.21793149764943,3.3668744317152224,578.5248918737578
4
  BAIR/koala-13b,25.68238710094553,169.5476830087307,6.410479635487899,1266.6891084620372
5
  BAIR/koala-7b,33.328275305359796,195.68065815983883,5.765067746732124,865.7973959032869
6
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,66.0701614426915,226.21087978509067,3.1888684277266397,805.043430490258
7
  FreedomIntelligence/phoenix-inst-chat-7b,53.984465765624535,195.5295500335796,3.4296249723803256,847.9469607118755
8
  camel-ai/CAMEL-13B-Combined-Data,25.753539426678923,188.12894560107455,7.247808498485511,1586.241547011427
9
  databricks/dolly-v2-12b,24.68014979695401,155.27535258562793,5.997897220429992,1098.335702149091
 
3
  metaai/llama-7B,28.422054486839865,106.21793149764943,3.3668744317152224,578.5248918737578
4
  BAIR/koala-13b,25.68238710094553,169.5476830087307,6.410479635487899,1266.6891084620372
5
  BAIR/koala-7b,33.328275305359796,195.68065815983883,5.765067746732124,865.7973959032869
6
+ RWKV/rwkv-raven-7b,66.0701614426915,226.21087978509067,3.1888684277266397,805.043430490258
7
  FreedomIntelligence/phoenix-inst-chat-7b,53.984465765624535,195.5295500335796,3.4296249723803256,847.9469607118755
8
  camel-ai/CAMEL-13B-Combined-Data,25.753539426678923,188.12894560107455,7.247808498485511,1586.241547011427
9
  databricks/dolly-v2-12b,24.68014979695401,155.27535258562793,5.997897220429992,1098.335702149091
data/A100_instruct_benchmark.csv CHANGED
@@ -1,7 +1,7 @@
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,20.727175709016876,254.08025520483545,11.892537351481359,2191.190301544663
3
  BAIR/koala-7b,25.954660733201525,259.2263263935527,9.768064146371243,1447.61525218268
4
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,61.486296272233105,244.58898589657488,3.6864172847628747,892.832628945603
5
  FreedomIntelligence/phoenix-inst-chat-7b,55.22014703563219,221.38582941571525,3.8385676472189307,887.4773411685698
6
  Neutralzz/BiLLa-7B-SFT,32.311906190353724,146.99966420416388,4.4437706789731255,750.0805171255877
7
  OpenAssistant/oasst-sft-1-pythia-12b,24.935530057384018,250.45466756212224,9.786432366627167,2029.4657938213645
 
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,20.727175709016876,254.08025520483545,11.892537351481359,2191.190301544663
3
  BAIR/koala-7b,25.954660733201525,259.2263263935527,9.768064146371243,1447.61525218268
4
+ RWKV/rwkv-raven-7b,61.486296272233105,244.58898589657488,3.6864172847628747,892.832628945603
5
  FreedomIntelligence/phoenix-inst-chat-7b,55.22014703563219,221.38582941571525,3.8385676472189307,887.4773411685698
6
  Neutralzz/BiLLa-7B-SFT,32.311906190353724,146.99966420416388,4.4437706789731255,750.0805171255877
7
  OpenAssistant/oasst-sft-1-pythia-12b,24.935530057384018,250.45466756212224,9.786432366627167,2029.4657938213645
data/A40_chat-concise_benchmark.csv CHANGED
@@ -11,7 +11,7 @@ togethercomputer/RedPajama-INCITE-7B-Chat,14.451529449594792,275.07991940899933,
11
  metaai/llama-13B,15.493654667854246,81.26796507723304,4.881042191492302,1264.815973472223
12
  BAIR/koala-13b,17.393931641363825,252.56816655473472,14.499323956849762,3747.8785020146615
13
  nomic-ai/gpt4all-13b-snoozy,17.45953616124214,217.35325721961047,12.440528350608277,3263.628521155058
14
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,32.86455306586691,235.19274680993956,6.718876629108356,1661.2857568838062
15
  lmsys/fastchat-t5-3b-v1.0,21.09615171109894,313.09905977165886,18.366778339359637,1807.6800728676938
16
  project-baize/baize-v2-7B,28.92598212176896,321.06010745466756,10.940218308832323,2644.9160527197046
17
  OpenAssistant/oasst-sft-1-pythia-12b,16.01484723680571,249.1007387508395,15.153340834740217,3829.1071417058643
 
11
  metaai/llama-13B,15.493654667854246,81.26796507723304,4.881042191492302,1264.815973472223
12
  BAIR/koala-13b,17.393931641363825,252.56816655473472,14.499323956849762,3747.8785020146615
13
  nomic-ai/gpt4all-13b-snoozy,17.45953616124214,217.35325721961047,12.440528350608277,3263.628521155058
14
+ RWKV/rwkv-raven-7b,32.86455306586691,235.19274680993956,6.718876629108356,1661.2857568838062
15
  lmsys/fastchat-t5-3b-v1.0,21.09615171109894,313.09905977165886,18.366778339359637,1807.6800728676938
16
  project-baize/baize-v2-7B,28.92598212176896,321.06010745466756,10.940218308832323,2644.9160527197046
17
  OpenAssistant/oasst-sft-1-pythia-12b,16.01484723680571,249.1007387508395,15.153340834740217,3829.1071417058643
data/A40_chat_benchmark.csv CHANGED
@@ -5,7 +5,7 @@ tatsu-lab/alpaca-7B,30.09713731797294,125.20013431833445,4.129986896187982,916.0
5
  metaai/llama-7B,25.768609507174105,64.59032907991941,2.284814629996714,525.7081235728675
6
  metaai/llama-13B,15.699146010424393,80.32236400268637,4.757332595030835,1293.689832437891
7
  camel-ai/CAMEL-13B-Combined-Data,17.40620018812374,292.3438549361988,16.834190191676036,4466.796722968406
8
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,33.10830960148045,243.21793149764943,6.9481068778416555,1833.7241615177682
9
  databricks/dolly-v2-12b,15.597444626791148,148.3270651443922,9.168758730287117,2362.087664204047
10
  FreedomIntelligence/phoenix-inst-chat-7b,32.663340053939855,243.14909335124244,7.271332307256473,2149.2483156478947
11
  h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,28.851651162429675,216.66286098052385,7.544740398256815,1636.1981326393268
 
5
  metaai/llama-7B,25.768609507174105,64.59032907991941,2.284814629996714,525.7081235728675
6
  metaai/llama-13B,15.699146010424393,80.32236400268637,4.757332595030835,1293.689832437891
7
  camel-ai/CAMEL-13B-Combined-Data,17.40620018812374,292.3438549361988,16.834190191676036,4466.796722968406
8
+ RWKV/rwkv-raven-7b,33.10830960148045,243.21793149764943,6.9481068778416555,1833.7241615177682
9
  databricks/dolly-v2-12b,15.597444626791148,148.3270651443922,9.168758730287117,2362.087664204047
10
  FreedomIntelligence/phoenix-inst-chat-7b,32.663340053939855,243.14909335124244,7.271332307256473,2149.2483156478947
11
  h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,28.851651162429675,216.66286098052385,7.544740398256815,1636.1981326393268
data/A40_instruct-concise_benchmark.csv CHANGED
@@ -1,7 +1,7 @@
1
  model,throughput,response_length,latency,energy
2
  openaccess-ai-collective/manticore-13b-chat-pyg,17.4993855646115,229.5795836131632,13.132503049058466,3501.182491605137
3
  lmsys/vicuna-7B,29.046593546528904,212.760241773002,7.3296203452423265,1706.1712568838818
4
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,33.07481929862108,242.74177300201478,6.943508281124177,1787.5870651446628
5
  tatsu-lab/alpaca-7B,29.475397017987323,117.95399597044997,3.9749026008906023,927.7634805239352
6
  metaai/llama-13B,15.786345111463364,102.35762256548018,6.009854743435423,1590.8409496307413
7
  OpenAssistant/oasst-sft-1-pythia-12b,16.03459728484094,241.31732706514438,14.686811677200872,3673.6327222969167
 
1
  model,throughput,response_length,latency,energy
2
  openaccess-ai-collective/manticore-13b-chat-pyg,17.4993855646115,229.5795836131632,13.132503049058466,3501.182491605137
3
  lmsys/vicuna-7B,29.046593546528904,212.760241773002,7.3296203452423265,1706.1712568838818
4
+ RWKV/rwkv-raven-7b,33.07481929862108,242.74177300201478,6.943508281124177,1787.5870651446628
5
  tatsu-lab/alpaca-7B,29.475397017987323,117.95399597044997,3.9749026008906023,927.7634805239352
6
  metaai/llama-13B,15.786345111463364,102.35762256548018,6.009854743435423,1590.8409496307413
7
  OpenAssistant/oasst-sft-1-pythia-12b,16.03459728484094,241.31732706514438,14.686811677200872,3673.6327222969167
data/A40_instruct_benchmark.csv CHANGED
@@ -3,7 +3,7 @@ FreedomIntelligence/phoenix-inst-chat-7b,32.795664087070854,221.2484889187374,6.
3
  tatsu-lab/alpaca-7B,30.107577299286163,126.36030893216925,4.161682809197595,973.6026363331109
4
  togethercomputer/RedPajama-INCITE-7B-Chat,17.009700321585225,282.3190060443251,15.98330062659441,2834.287281396827
5
  lmsys/vicuna-7B,29.417977025894693,267.841840161182,9.164755312435684,2131.3740241775145
6
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,33.80171881884355,264.9563465413029,7.560664676534496,2049.7698284082962
7
  databricks/dolly-v2-12b,15.67950302952103,155.61316319677636,9.582122375200395,2369.283402619204
8
  camel-ai/CAMEL-13B-Combined-Data,17.522554791478672,245.7824042981867,14.081241566503387,3646.9116689053053
9
  BAIR/koala-7b,29.350583449996343,253.7239758226998,8.64835721658589,1918.897159502941
 
3
  tatsu-lab/alpaca-7B,30.107577299286163,126.36030893216925,4.161682809197595,973.6026363331109
4
  togethercomputer/RedPajama-INCITE-7B-Chat,17.009700321585225,282.3190060443251,15.98330062659441,2834.287281396827
5
  lmsys/vicuna-7B,29.417977025894693,267.841840161182,9.164755312435684,2131.3740241775145
6
+ RWKV/rwkv-raven-7b,33.80171881884355,264.9563465413029,7.560664676534496,2049.7698284082962
7
  databricks/dolly-v2-12b,15.67950302952103,155.61316319677636,9.582122375200395,2369.283402619204
8
  camel-ai/CAMEL-13B-Combined-Data,17.522554791478672,245.7824042981867,14.081241566503387,3646.9116689053053
9
  BAIR/koala-7b,29.350583449996343,253.7239758226998,8.64835721658589,1918.897159502941
data/V100_chat-concise_benchmark.csv CHANGED
@@ -6,7 +6,7 @@ lmsys/vicuna-7B,33.19220689261821,273.57118871725993,8.18447234641069,1387.83851
6
  metaai/llama-7B,23.92946132846408,68.0584284754869,2.2809002959847486,354.6560946944264
7
  project-baize/baize-v2-7B,30.350461249705614,313.3747481531229,10.034955017859746,1647.9252511752854
8
  BAIR/koala-13b,21.426431872159036,253.86501007387508,11.723909422593445,2576.3193623237044
9
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,36.40036863259138,202.84654130288786,4.8940369672449,1139.9740564136987
10
  FreedomIntelligence/phoenix-inst-chat-7b,42.268276726494044,233.5211551376763,5.210845160281831,1237.6637434519814
11
  Neutralzz/BiLLa-7B-SFT,31.9073779709284,141.02820685023505,4.304014573938894,791.1183122901291
12
  StabilityAI/stablelm-tuned-alpha-7b,27.433760323389556,241.67763599731364,8.396188638064837,1539.8807639355257
 
6
  metaai/llama-7B,23.92946132846408,68.0584284754869,2.2809002959847486,354.6560946944264
7
  project-baize/baize-v2-7B,30.350461249705614,313.3747481531229,10.034955017859746,1647.9252511752854
8
  BAIR/koala-13b,21.426431872159036,253.86501007387508,11.723909422593445,2576.3193623237044
9
+ RWKV/rwkv-raven-7b,36.40036863259138,202.84654130288786,4.8940369672449,1139.9740564136987
10
  FreedomIntelligence/phoenix-inst-chat-7b,42.268276726494044,233.5211551376763,5.210845160281831,1237.6637434519814
11
  Neutralzz/BiLLa-7B-SFT,31.9073779709284,141.02820685023505,4.304014573938894,791.1183122901291
12
  StabilityAI/stablelm-tuned-alpha-7b,27.433760323389556,241.67763599731364,8.396188638064837,1539.8807639355257
data/V100_chat_benchmark.csv CHANGED
@@ -1,6 +1,6 @@
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,21.533160265051638,265.5540631296172,12.202378193294793,2299.2539251175217
3
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,38.25693186890057,214.35460040295501,5.09708168833379,1112.947044996645
4
  Neutralzz/BiLLa-7B-SFT,31.761691850702793,160.1222296843519,4.935750165560669,783.9250990597718
5
  StabilityAI/stablelm-tuned-alpha-7b,28.53967935283584,242.85829415715244,8.213054464106607,1349.8225080590983
6
  h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,30.275817945748678,216.17797179314977,6.902688020302885,1083.431902955002
 
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-13b,21.533160265051638,265.5540631296172,12.202378193294793,2299.2539251175217
3
+ RWKV/rwkv-raven-7b,38.25693186890057,214.35460040295501,5.09708168833379,1112.947044996645
4
  Neutralzz/BiLLa-7B-SFT,31.761691850702793,160.1222296843519,4.935750165560669,783.9250990597718
5
  StabilityAI/stablelm-tuned-alpha-7b,28.53967935283584,242.85829415715244,8.213054464106607,1349.8225080590983
6
  h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,30.275817945748678,216.17797179314977,6.902688020302885,1083.431902955002
data/V100_instruct-concise_benchmark.csv CHANGED
@@ -1,6 +1,6 @@
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-7b,31.870929688850776,191.7407656145064,5.776933217154402,940.6980705171267
3
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,39.221009432980566,226.7229684351914,5.369737004086241,1264.4471417058417
4
  FreedomIntelligence/phoenix-inst-chat-7b,42.470186422244424,193.91034251175284,4.339222575622636,968.785210208196
5
  lmsys/fastchat-t5-3b-v1.0,32.731683961001515,280.61417058428475,13.955027274680319,699.2501370047005
6
  lmsys/vicuna-13B,21.749876946304724,194.72666218938886,8.894261652518159,2004.231935191404
 
1
  model,throughput,response_length,latency,energy
2
  BAIR/koala-7b,31.870929688850776,191.7407656145064,5.776933217154402,940.6980705171267
3
+ RWKV/rwkv-raven-7b,39.221009432980566,226.7229684351914,5.369737004086241,1264.4471417058417
4
  FreedomIntelligence/phoenix-inst-chat-7b,42.470186422244424,193.91034251175284,4.339222575622636,968.785210208196
5
  lmsys/fastchat-t5-3b-v1.0,32.731683961001515,280.61417058428475,13.955027274680319,699.2501370047005
6
  lmsys/vicuna-13B,21.749876946304724,194.72666218938886,8.894261652518159,2004.231935191404
data/V100_instruct_benchmark.csv CHANGED
@@ -18,4 +18,4 @@ metaai/llama-13B,18.476088005501783,117.27736736064473,5.550619761657461,1274.25
18
  metaai/llama-7B,23.642990385313613,110.3025520483546,3.7306664026356073,636.4017854264604
19
  tatsu-lab/alpaca-7B,31.257537640928863,127.87004701141706,3.9853428024686144,671.8288287441229
20
  BAIR/koala-7b,31.414143726094665,253.60376091336468,7.832867446137829,1181.3637347212878
21
- BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,39.9399840394634,246.79650772330425,5.83791405340994,1302.0306672263273
 
18
  metaai/llama-7B,23.642990385313613,110.3025520483546,3.7306664026356073,636.4017854264604
19
  tatsu-lab/alpaca-7B,31.257537640928863,127.87004701141706,3.9853428024686144,671.8288287441229
20
  BAIR/koala-7b,31.414143726094665,253.60376091336468,7.832867446137829,1181.3637347212878
21
+ RWKV/rwkv-raven-7b,39.9399840394634,246.79650772330425,5.83791405340994,1302.0306672263273
data/models.json CHANGED
@@ -29,9 +29,9 @@
29
  "nickname": "Camel-AI/CAMEL-13B-Combined-Data",
30
  "params": 13
31
  },
32
- "BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth": {
33
- "url": "https://huggingface.co/BlinkDL/rwkv-4-raven",
34
- "nickname": "BlinkDL/RWKV-4-Raven-7B",
35
  "params": 7
36
  },
37
  "databricks/dolly-v2-12b": {
 
29
  "nickname": "Camel-AI/CAMEL-13B-Combined-Data",
30
  "params": 13
31
  },
32
+ "RWKV/rwkv-raven-7b": {
33
+ "url": "https://huggingface.co/RWKV/rwkv-raven-7b",
34
+ "nickname": "RWKV/rwkv-raven-7b",
35
  "params": 7
36
  },
37
  "databricks/dolly-v2-12b": {
data/score.csv CHANGED
@@ -20,3 +20,4 @@ Neutralzz/BiLLa-7B-SFT,27.730375426621162,26.04062935670185,49.045640164325754
20
  togethercomputer/RedPajama-INCITE-7B-Chat,42.15017064846416,70.8424616610237,36.10055989611241
21
  metaai/Llama-2-7b-chat-hf,52.73037542662116,78.48038239394542,45.32519554457334
22
  metaai/Llama-2-13b-chat-hf,59.129692832764505,81.94582752439753,43.9572591900371
 
 
20
  togethercomputer/RedPajama-INCITE-7B-Chat,42.15017064846416,70.8424616610237,36.10055989611241
21
  metaai/Llama-2-7b-chat-hf,52.73037542662116,78.48038239394542,45.32519554457334
22
  metaai/Llama-2-13b-chat-hf,59.129692832764505,81.94582752439753,43.9572591900371
23
+ RWKV/rwkv-raven-7b,39.419795221843,66.45090619398526,38.544263035922036