Jae-Won Chung committed on
Commit
2e3c3ed
1 Parent(s): f667abd

Add A100 numbers

Browse files
.gitignore CHANGED
@@ -7,6 +7,3 @@
7
  # Editor
8
  pyrightconfig.json
9
  .idea
10
-
11
- # Data
12
- data/
 
7
  # Editor
8
  pyrightconfig.json
9
  .idea
 
 
 
data/2023-06-17/A100_chat-concise_benchmark.csv ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,throughput,response_length,latency,energy
2
+ BAIR/koala-13b,25.50117012651914,258.85426460711886,10.063550845041279,1946.198744123579
3
+ BAIR/koala-7b,32.92721737057136,247.0456682337139,7.462044263397255,1195.704790463391
4
+ BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,64.47852685919943,209.4788448623237,2.9212886777848954,736.6553304231044
5
+ FreedomIntelligence/phoenix-inst-chat-7b,54.276457252393016,233.51108126259234,4.103907452767313,1002.3285728676934
6
+ camel-ai/CAMEL-13B-Combined-Data,26.30022114657458,282.4801880456682,10.72763999556464,2349.1830879784957
7
+ databricks/dolly-v2-12b,24.809807917158277,143.01410342511753,5.488031835448774,1002.4862169241038
8
+ lmsys/vicuna-13B,26.471361088447697,269.1239086635326,10.13281609787714,2151.007414036257
9
+ lmsys/vicuna-7B,33.42934778322944,272.4801880456682,8.138669158259418,1384.4621272666218
10
+ metaai/llama-13B,21.603271794897424,78.05742108797851,3.1706939710784794,671.8356437206298
11
+ metaai/llama-7B,27.65154362364814,67.52249832102082,2.1186345380820564,369.4284586971132
12
+ tatsu-lab/alpaca-7B,33.28849736927566,124.2155809267965,3.679997416454322,596.6560735392795
13
+ Neutralzz/BiLLa-7B-SFT,33.545066744328324,142.316319677636,4.214619093185649,677.7428566151748
14
+ OpenAssistant/oasst-sft-1-pythia-12b,24.918246219702905,251.10006715916722,9.773108534123995,2057.1658650100785
15
+ h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,33.01663685477516,206.82236400268636,6.229473677366736,998.7828710543929
16
+ lmsys/fastchat-t5-3b-v1.0,19.17742489592329,312.91034251175284,20.878918582659214,1744.028456346554
17
+ nomic-ai/gpt4all-13b-snoozy,26.07277221094992,216.6400268636669,8.208376720764958,1738.0828875083905
18
+ openaccess-ai-collective/manticore-13b-chat-pyg,26.16054700304064,276.17058428475485,10.500794145583235,2117.0177760241745
19
+ StabilityAI/stablelm-tuned-alpha-7b,45.937935977440574,244.92578912021492,5.171557462488085,1199.1363797850827
20
+ project-baize/baize-v2-7B,31.98482659469149,316.2058428475487,9.718332352424522,1593.2951074546695
21
+ togethercomputer/RedPajama-INCITE-7B-Chat,27.099977162771395,275.3183344526528,9.708286378669253,1423.8720110812499
data/2023-06-17/A100_chat_benchmark.csv ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,throughput,response_length,latency,energy
2
+ BAIR/koala-13b,21.207721076321384,265.5732034922767,12.1433556952537,2144.8338435191445
3
+ BAIR/koala-7b,26.5628207031951,261.0698455339154,9.620738416075923,1345.554839153794
4
+ BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,61.52127877000437,214.78475486903963,3.0815914876914072,735.766777367353
5
+ FreedomIntelligence/phoenix-inst-chat-7b,55.838321060384565,240.34419073203492,4.122390997297159,1030.8907246474148
6
+ Neutralzz/BiLLa-7B-SFT,33.57049533371462,161.80826057756883,4.794732123814392,881.4395631296157
7
+ OpenAssistant/oasst-sft-1-pythia-12b,25.404288065688412,259.58764271323037,9.929468848113123,2060.029685359295
8
+ StabilityAI/stablelm-tuned-alpha-7b,45.42078300695383,243.87541974479515,5.208388584671265,1124.4006343183476
9
+ camel-ai/CAMEL-13B-Combined-Data,24.501197269962507,291.92008059100067,13.17006271185142,2526.4594200805864
10
+ databricks/dolly-v2-12b,22.10974954935886,153.75822699798522,7.943902623603982,1242.9209395567464
11
+ h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,33.19728218417469,212.45601074546676,6.392467083725633,951.077651108126
12
+ lmsys/fastchat-t5-3b-v1.0,19.291850692305534,314.29684351914034,20.682375825357692,1802.9754949630653
13
+ lmsys/vicuna-13B,21.611375785831733,280.739758226998,12.738298498406273,2600.83922397583
14
+ lmsys/vicuna-7B,27.25945669782727,284.9194089993284,10.297412690598657,1531.7009963062367
15
+ metaai/llama-13B,23.201365367977594,76.47078576225655,2.9742001407414107,631.5696930826057
16
+ metaai/llama-7B,27.470901624921254,60.65144392209537,1.9862404549640509,335.25658764271293
17
+ nomic-ai/gpt4all-13b-snoozy,26.567282559123655,247.79583613163197,9.280741749712535,2004.7329180658162
18
+ openaccess-ai-collective/manticore-13b-chat-pyg,26.280767439646972,288.8153122901276,10.947609359217866,2189.247364674278
19
+ project-baize/baize-v2-7B,31.591810721211225,326.29952988582943,10.17013366094905,1588.2741897246513
20
+ tatsu-lab/alpaca-7B,28.0006749636751,132.84586971121558,4.627808613438331,684.1749345198082
21
+ togethercomputer/RedPajama-INCITE-7B-Chat,27.48563290418453,274.39456010745465,9.540005102660757,1457.8563905305575
data/2023-06-17/A100_instruct-concise_benchmark.csv ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,throughput,response_length,latency,energy
2
+ metaai/llama-13B,23.078188347142518,114.53055742108798,4.394399051080669,930.4217461383607
3
+ metaai/llama-7B,28.422054486839865,106.21793149764943,3.3668744317152224,578.5248918737578
4
+ BAIR/koala-13b,25.68238710094553,169.5476830087307,6.410479635487899,1266.6891084620372
5
+ BAIR/koala-7b,33.328275305359796,195.68065815983883,5.765067746732124,865.7973959032869
6
+ BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,66.0701614426915,226.21087978509067,3.1888684277266397,805.043430490258
7
+ FreedomIntelligence/phoenix-inst-chat-7b,53.984465765624535,195.5295500335796,3.4296249723803256,847.9469607118755
8
+ camel-ai/CAMEL-13B-Combined-Data,25.753539426678923,188.12894560107455,7.247808498485511,1586.241547011427
9
+ databricks/dolly-v2-12b,24.68014979695401,155.27535258562793,5.997897220429992,1098.335702149091
10
+ h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,32.5833896491562,213.57656145063802,6.531293810193048,968.5605910006633
11
+ lmsys/fastchat-t5-3b-v1.0,35.32774199941168,284.15748824714575,12.138674304558975,1073.3059664204081
12
+ lmsys/vicuna-13B,26.34627305992005,195.90799194089993,7.373395581162019,1657.1269066487612
13
+ lmsys/vicuna-7B,33.203726764981546,213.17058428475488,6.385267472888481,1042.905993955669
14
+ tatsu-lab/alpaca-7B,32.842417001177665,122.1242444593687,3.6588753698446244,569.2690120886454
15
+ Neutralzz/BiLLa-7B-SFT,31.28470885552271,103.00335795836132,3.208946741549069,494.7404388851737
16
+ nomic-ai/gpt4all-13b-snoozy,25.76578508237939,121.15312290127602,4.545457045249276,994.3254654130169
17
+ openaccess-ai-collective/manticore-13b-chat-pyg,26.392333822580962,227.33378106111485,8.568163497332025,1738.897591336476
18
+ OpenAssistant/oasst-sft-1-pythia-12b,24.824754847354107,236.00940228341167,9.223680323395048,1834.861354264594
19
+ project-baize/baize-v2-7B,31.451660882452277,241.78945601074545,7.49180176517012,1276.267568838159
20
+ StabilityAI/stablelm-tuned-alpha-7b,44.77280320960753,224.9724647414372,4.834958684556046,1105.6361689053056
21
+ togethercomputer/RedPajama-INCITE-7B-Chat,26.907685411875395,276.31497649429144,9.836634313501508,1464.5413824714485
data/2023-06-17/A100_instruct_benchmark.csv ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,throughput,response_length,latency,energy
2
+ BAIR/koala-13b,20.727175709016876,254.08025520483545,11.892537351481359,2191.190301544663
3
+ BAIR/koala-7b,25.954660733201525,259.2263263935527,9.768064146371243,1447.61525218268
4
+ BlinkDL/RWKV-4-Raven-7B-v12-Eng98%-Other2%-20230521-ctx8192.pth,61.486296272233105,244.58898589657488,3.6864172847628747,892.832628945603
5
+ FreedomIntelligence/phoenix-inst-chat-7b,55.22014703563219,221.38582941571525,3.8385676472189307,887.4773411685698
6
+ Neutralzz/BiLLa-7B-SFT,32.311906190353724,146.99966420416388,4.4437706789731255,750.0805171255877
7
+ OpenAssistant/oasst-sft-1-pythia-12b,24.935530057384018,250.45466756212224,9.786432366627167,2029.4657938213645
8
+ StabilityAI/stablelm-tuned-alpha-7b,45.08986296277073,232.79348556077903,4.994290238837428,1132.5013462055056
9
+ camel-ai/CAMEL-13B-Combined-Data,26.545864806820514,244.7578912021491,9.198450972152804,2025.3281155137665
10
+ databricks/dolly-v2-12b,22.230280077272955,161.52820685023505,8.256380503504923,1374.5864308260586
11
+ h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2,32.73570790682367,219.56077904633983,6.708469191383511,1011.1683317662861
12
+ lmsys/fastchat-t5-3b-v1.0,33.043489972767865,355.22464741437204,15.602670499951651,1307.8302488247155
13
+ lmsys/vicuna-13B,21.00930585347828,266.4140362659503,12.326653083850998,2284.892455003353
14
+ lmsys/vicuna-7B,26.456122167045812,269.8492276695769,9.998248218763614,1393.5497108797765
15
+ metaai/llama-13B,22.701925773082262,99.55339153794493,3.953801921461699,853.2385591000668
16
+ metaai/llama-7B,29.32171747886574,107.48018804566823,3.322338972945185,561.9730688381476
17
+ nomic-ai/gpt4all-13b-snoozy,25.875636961002073,219.97582269979853,8.453523028629553,1718.9753918737365
18
+ openaccess-ai-collective/manticore-13b-chat-pyg,26.222449633250086,275.88179986568167,10.469822985415593,2115.522391537931
19
+ project-baize/baize-v2-7B,32.41073358811793,300.9086635325722,9.142081563219637,1529.693656480853
20
+ tatsu-lab/alpaca-7B,25.79378618278183,127.34217595701813,4.787391331217622,727.924358965749
21
+ togethercomputer/RedPajama-INCITE-7B-Chat,27.400950213545173,283.26158495634655,9.932342660383254,1629.655866689063
data/2023-06-17/schema.yaml CHANGED
@@ -1,2 +1,2 @@
1
- gpu: ["A40"]
2
  task: ["chat", "chat-concise", "instruct", "instruct-concise"]
 
1
+ gpu: ["A40", "A100"]
2
  task: ["chat", "chat-concise", "instruct", "instruct-concise"]