felix committed on
Commit
6d7a85e
1 Parent(s): e762f8c
app.py CHANGED
@@ -1,4 +1,6 @@
1
  # app.py
 
 
2
  import streamlit as st
3
  import glob
4
  import os
@@ -46,13 +48,34 @@ hf_llm_diagrams = [img for img in imgs if 'hf_llm_diagram' in os.path.basename(i
46
  # Getting the remaining images
47
  remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
48
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
49
  st.write("HuggingFace Open LLM leaderboard by Model Size")
50
  st.image(hf_llm_diagrams[0],use_column_width="auto")
51
 
 
 
52
  cols = st.columns(2)
53
  cols[0].image(hf_llm_diagrams[1],caption="Other or commercially permissive licenses only", use_column_width="auto")
 
 
 
 
54
  cols[1].image(hf_llm_diagrams[2],caption="Commercially permissive license only", use_column_width="auto")
55
 
 
56
 
57
  st.divider()
58
  st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")
 
1
  # app.py
2
+ import json
3
+
4
  import streamlit as st
5
  import glob
6
  import os
 
48
  # Getting the remaining images
49
  remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
50
 
51
def print_model_list(file_name, st):
    """Render the model ids stored next to an image as an HTML link list.

    The ids are read from a JSON file that has the same path as
    ``file_name`` but with its extension replaced by ``.json``. The file is
    expected to contain a JSON array of model-id strings. Each id becomes a
    ``<li>`` linking to ``https://huggingface.co/<model_id>``.

    Args:
        file_name: Path of the image whose sibling ``.json`` file lists the
            model ids.
        st: Object exposing a Streamlit-style
            ``write(body, unsafe_allow_html=...)`` method; the call sites
            pass either the ``streamlit`` module or a column container.

    Raises:
        FileNotFoundError: If the sibling ``.json`` file does not exist.
        json.JSONDecodeError: If the file is not valid JSON.
    """
    # Local import keeps this function self-contained without touching the
    # module-level import block.
    from html import escape

    # splitext copes with any extension length (".png", ".jpeg", ...),
    # unlike slicing off a fixed four characters.
    json_path = os.path.splitext(file_name)[0] + '.json'
    with open(json_path, 'r', encoding='utf-8') as file:
        model_ids = json.load(file)

    items = []
    for model_id in model_ids:
        # Long ids keep only their last 35 characters so the list stays
        # narrow enough for a column layout.
        label = model_id
        if len(model_id) > 35:
            label = '...' + model_id[-35:]
        # The markup is rendered with unsafe_allow_html=True, so both the
        # attribute value and the visible text are escaped.
        href = escape(f'https://huggingface.co/{model_id}', quote=True)
        items.append(f'<li><a href="{href}">{escape(label)}</a></li>')

    model_str = '<ul>' + ''.join(items) + '</ul>'
    st.write(model_str, unsafe_allow_html=True)
64
+
65
  st.write("HuggingFace Open LLM leaderboard by Model Size")
66
  st.image(hf_llm_diagrams[0],use_column_width="auto")
67
 
68
+ print_model_list(hf_llm_diagrams[0],st)
69
+
70
  cols = st.columns(2)
71
  cols[0].image(hf_llm_diagrams[1],caption="Other or commercially permissive licenses only", use_column_width="auto")
72
+
73
+
74
+ print_model_list(hf_llm_diagrams[1],cols[0])
75
+
76
  cols[1].image(hf_llm_diagrams[2],caption="Commercially permissive license only", use_column_width="auto")
77
 
78
+ print_model_list(hf_llm_diagrams[2],cols[1])
79
 
80
  st.divider()
81
  st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")
data/20230826_0615/hf_llm_diagramv2.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["garage-bAInd/Platypus2-70B-instruct", "upstage/llama-65b-instruct", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrca-Platypus2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v0", "Fredithefish/ReasonixPajama-3B-HF", "open-llm-leaderboard/bloomz-1b7-4bit-alpaca-auto-eval-adapter-applied"]
data/20230826_0615/hf_llm_diagramv2.png ADDED
data/20230826_0615/hf_llm_diagramv2_other_permissive.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["psmathur/orca_mini_v3_70b", "TheBloke/gpt4-alpaca-lora_mlp-65B-HF", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrcaxOpenChat-Preview2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v1", "Fredithefish/ReasonixPajama-3B-HF", "aisquared/dlite-v2-774m"]
data/20230826_0615/hf_llm_diagramv2_other_permissive.png ADDED
data/20230826_0615/hf_llm_diagramv2_permissive.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["ehartford/Samantha-1.11-70b", "bavest/fin-llama-33b-merged", "Open-Orca/OpenOrcaxOpenChat-Preview2-13B", "circulus/Llama-2-7b-orca-v1", "togethercomputer/GPT-JT-6B-v1", "Fredithefish/ReasonixPajama-3B-HF", "aisquared/dlite-v2-774m"]
data/20230826_0615/hf_llm_diagramv2_permissive.png ADDED
data/20230826_0615/hf_llm_diagramv2_rescore.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["garage-bAInd/Platypus2-70B-instruct", "upstage/llama-65b-instruct", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrca-Platypus2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v0", "openlm-research/open_llama_3b_v2", "open-llm-leaderboard/bloomz-1b7-4bit-alpaca-auto-eval-adapter-applied"]
data/20230826_0615/hf_llm_diagramv2_rescore.png ADDED
data/20230826_0615/hg_average_to_agentbench_compare.png ADDED
data/20230826_0615/hg_average_to_alpacaeval_compare.png ADDED
data/20230826_0615/hg_average_to_mosaic_compare.png ADDED
data/20230826_0615/hg_average_to_mt_bench_compare.png ADDED
data/20230826_0615/hg_average_to_opencompass_compare.png ADDED