Spaces:
Sleeping
Sleeping
felix
committed on
Commit
•
6d7a85e
1
Parent(s):
e762f8c
comment
Browse files
- app.py +23 -0
- data/20230826_0615/hf_llm_diagramv2.json +1 -0
- data/20230826_0615/hf_llm_diagramv2.png +0 -0
- data/20230826_0615/hf_llm_diagramv2_other_permissive.json +1 -0
- data/20230826_0615/hf_llm_diagramv2_other_permissive.png +0 -0
- data/20230826_0615/hf_llm_diagramv2_permissive.json +1 -0
- data/20230826_0615/hf_llm_diagramv2_permissive.png +0 -0
- data/20230826_0615/hf_llm_diagramv2_rescore.json +1 -0
- data/20230826_0615/hf_llm_diagramv2_rescore.png +0 -0
- data/20230826_0615/hg_average_to_agentbench_compare.png +0 -0
- data/20230826_0615/hg_average_to_alpacaeval_compare.png +0 -0
- data/20230826_0615/hg_average_to_mosaic_compare.png +0 -0
- data/20230826_0615/hg_average_to_mt_bench_compare.png +0 -0
- data/20230826_0615/hg_average_to_opencompass_compare.png +0 -0
app.py
CHANGED
@@ -1,4 +1,6 @@
|
|
1 |
# app.py
|
|
|
|
|
2 |
import streamlit as st
|
3 |
import glob
|
4 |
import os
|
@@ -46,13 +48,34 @@ hf_llm_diagrams = [img for img in imgs if 'hf_llm_diagram' in os.path.basename(i
|
|
46 |
# Getting the remaining images
|
47 |
remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
|
48 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
49 |
st.write("HuggingFace Open LLM leaderboard by Model Size")
|
50 |
st.image(hf_llm_diagrams[0],use_column_width="auto")
|
51 |
|
|
|
|
|
52 |
cols = st.columns(2)
|
53 |
cols[0].image(hf_llm_diagrams[1],caption="Other or commercially permissive licenses only", use_column_width="auto")
|
|
|
|
|
|
|
|
|
54 |
cols[1].image(hf_llm_diagrams[2],caption="Commercially permissive license only", use_column_width="auto")
|
55 |
|
|
|
56 |
|
57 |
st.divider()
|
58 |
st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")
|
|
|
1 |
# app.py
|
2 |
+
import json
|
3 |
+
|
4 |
import streamlit as st
|
5 |
import glob
|
6 |
import os
|
|
|
48 |
# Getting the remaining images
|
49 |
remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
|
50 |
|
51 |
+
def print_model_list(file_name, st):
    """Render the model ids stored next to an image as an HTML bullet list.

    The list is read from a JSON file that has the same path as
    ``file_name`` but with the extension replaced by ``.json``.  Each entry
    becomes a link to ``https://huggingface.co/<model_id>``; ids longer than
    35 characters are displayed as ``...`` followed by their last 35
    characters (the link target always uses the full id).

    Args:
        file_name: Path of the image whose sibling ``.json`` file holds a
            JSON array of model id strings.
        st: Object to render into.  Only ``st.write(body,
            unsafe_allow_html=True)`` is called on it, so the ``streamlit``
            module or a single column both work.

    Raises:
        OSError: If the sibling JSON file cannot be opened.
        json.JSONDecodeError: If the file does not contain valid JSON.
    """
    # Local import keeps this block self-contained; the file's import
    # section does not bring ``html`` into scope.
    import html

    max_len = 35

    # splitext handles any extension length (".png", ".jpeg", ...), unlike
    # slicing off a fixed four characters.
    file_path = os.path.splitext(file_name)[0] + '.json'

    # Read the list from the JSON file
    with open(file_path, 'r', encoding='utf-8') as file:
        model_ids = json.load(file)

    items = []
    for model_id in model_ids:
        label = model_id
        if len(model_id) > max_len:
            label = '...' + model_id[-max_len:]
        # The markup is rendered with unsafe_allow_html=True, so anything
        # coming from the data file must be escaped before interpolation.
        href = html.escape(f"https://huggingface.co/{model_id}", quote=True)
        items.append(f'<li><a href="{href}">{html.escape(label)}</a></li>')

    st.write("<ul>" + "".join(items) + "</ul>", unsafe_allow_html=True)
|
64 |
+
|
65 |
st.write("HuggingFace Open LLM leaderboard by Model Size")
|
66 |
st.image(hf_llm_diagrams[0],use_column_width="auto")
|
67 |
|
68 |
+
print_model_list(hf_llm_diagrams[0],st)
|
69 |
+
|
70 |
cols = st.columns(2)
|
71 |
cols[0].image(hf_llm_diagrams[1],caption="Other or commercially permissive licenses only", use_column_width="auto")
|
72 |
+
|
73 |
+
|
74 |
+
print_model_list(hf_llm_diagrams[1],cols[0])
|
75 |
+
|
76 |
cols[1].image(hf_llm_diagrams[2],caption="Commercially permissive license only", use_column_width="auto")
|
77 |
|
78 |
+
print_model_list(hf_llm_diagrams[2],cols[1])
|
79 |
|
80 |
st.divider()
|
81 |
st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")
|
data/20230826_0615/hf_llm_diagramv2.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["garage-bAInd/Platypus2-70B-instruct", "upstage/llama-65b-instruct", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrca-Platypus2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v0", "Fredithefish/ReasonixPajama-3B-HF", "open-llm-leaderboard/bloomz-1b7-4bit-alpaca-auto-eval-adapter-applied"]
|
data/20230826_0615/hf_llm_diagramv2.png
ADDED
data/20230826_0615/hf_llm_diagramv2_other_permissive.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["psmathur/orca_mini_v3_70b", "TheBloke/gpt4-alpaca-lora_mlp-65B-HF", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrcaxOpenChat-Preview2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v1", "Fredithefish/ReasonixPajama-3B-HF", "aisquared/dlite-v2-774m"]
|
data/20230826_0615/hf_llm_diagramv2_other_permissive.png
ADDED
data/20230826_0615/hf_llm_diagramv2_permissive.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["ehartford/Samantha-1.11-70b", "bavest/fin-llama-33b-merged", "Open-Orca/OpenOrcaxOpenChat-Preview2-13B", "circulus/Llama-2-7b-orca-v1", "togethercomputer/GPT-JT-6B-v1", "Fredithefish/ReasonixPajama-3B-HF", "aisquared/dlite-v2-774m"]
|
data/20230826_0615/hf_llm_diagramv2_permissive.png
ADDED
data/20230826_0615/hf_llm_diagramv2_rescore.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["garage-bAInd/Platypus2-70B-instruct", "upstage/llama-65b-instruct", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrca-Platypus2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v0", "openlm-research/open_llama_3b_v2", "open-llm-leaderboard/bloomz-1b7-4bit-alpaca-auto-eval-adapter-applied"]
|
data/20230826_0615/hf_llm_diagramv2_rescore.png
ADDED
data/20230826_0615/hg_average_to_agentbench_compare.png
ADDED
data/20230826_0615/hg_average_to_alpacaeval_compare.png
ADDED
data/20230826_0615/hg_average_to_mosaic_compare.png
ADDED
data/20230826_0615/hg_average_to_mt_bench_compare.png
ADDED
data/20230826_0615/hg_average_to_opencompass_compare.png
ADDED