comment

Files changed (14) hide show

app.py CHANGED Viewed

@@ -1,4 +1,6 @@
 # app.py
 import streamlit as st
 import glob
 import os
@@ -46,13 +48,34 @@ hf_llm_diagrams = [img for img in imgs if 'hf_llm_diagram' in os.path.basename(i
 # Getting the remaining images
 remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
 st.write("HuggingFace Open LLM leaderboard by Model Size")
 st.image(hf_llm_diagrams[0],use_column_width="auto")
 cols = st.columns(2)
 cols[0].image(hf_llm_diagrams[1],caption="Other or commercially permissive licenses only", use_column_width="auto")
 cols[1].image(hf_llm_diagrams[2],caption="Commercially permissive license only", use_column_width="auto")
 st.divider()
 st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")

 # app.py
+import json
 import streamlit as st
 import glob
 import os
 # Getting the remaining images
 remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
def print_model_list(file_name, st):
    """Render the model ids stored next to an image as an HTML link list.

    The list is read from a JSON file that has the same path as
    ``file_name`` but with its extension replaced by ``.json``. The file
    is expected to contain a JSON array of model id strings.

    Args:
        file_name: Path of the image whose sibling ``.json`` file is read.
        st: Object exposing ``write(body, unsafe_allow_html=...)``; the
            callers in this file pass the ``streamlit`` module or a column.

    Raises:
        FileNotFoundError: If the sibling ``.json`` file does not exist.
        json.JSONDecodeError: If that file is not valid JSON.
    """
    from html import escape

    max_label_len = 35

    # splitext handles extensions of any length; slicing off a fixed four
    # characters turned "x.jpeg" into "x..json".
    file_path = os.path.splitext(file_name)[0] + '.json'

    # JSON is UTF-8 by specification, so do not rely on the locale default.
    with open(file_path, 'r', encoding='utf-8') as file:
        model_ids = json.load(file)

    items = []
    for model_id in model_ids:
        # Long ids keep only their tail, which is the distinguishing part.
        label = model_id
        if len(model_id) > max_label_len:
            label = '...' + model_id[-max_label_len:]
        # The markup is rendered with unsafe_allow_html=True, so both the
        # attribute value and the link text must be escaped.
        items.append(
            f'<li><a href="https://huggingface.co/{escape(model_id)}">'
            f'{escape(label)}</a></li>'
        )

    st.write("<ul>" + "".join(items) + "</ul>", unsafe_allow_html=True)
 st.write("HuggingFace Open LLM leaderboard by Model Size")
 st.image(hf_llm_diagrams[0],use_column_width="auto")
+print_model_list(hf_llm_diagrams[0],st)
 cols = st.columns(2)
 cols[0].image(hf_llm_diagrams[1],caption="Other or commercially permissive licenses only", use_column_width="auto")
+print_model_list(hf_llm_diagrams[1],cols[0])
 cols[1].image(hf_llm_diagrams[2],caption="Commercially permissive license only", use_column_width="auto")
+print_model_list(hf_llm_diagrams[2],cols[1])
 st.divider()
 st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")

data/20230826_0615/hf_llm_diagramv2.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ ["garage-bAInd/Platypus2-70B-instruct", "upstage/llama-65b-instruct", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrca-Platypus2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v0", "Fredithefish/ReasonixPajama-3B-HF", "open-llm-leaderboard/bloomz-1b7-4bit-alpaca-auto-eval-adapter-applied"]

data/20230826_0615/hf_llm_diagramv2.png ADDED Viewed

data/20230826_0615/hf_llm_diagramv2_other_permissive.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ ["psmathur/orca_mini_v3_70b", "TheBloke/gpt4-alpaca-lora_mlp-65B-HF", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrcaxOpenChat-Preview2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v1", "Fredithefish/ReasonixPajama-3B-HF", "aisquared/dlite-v2-774m"]

data/20230826_0615/hf_llm_diagramv2_other_permissive.png ADDED Viewed

data/20230826_0615/hf_llm_diagramv2_permissive.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ ["ehartford/Samantha-1.11-70b", "bavest/fin-llama-33b-merged", "Open-Orca/OpenOrcaxOpenChat-Preview2-13B", "circulus/Llama-2-7b-orca-v1", "togethercomputer/GPT-JT-6B-v1", "Fredithefish/ReasonixPajama-3B-HF", "aisquared/dlite-v2-774m"]

data/20230826_0615/hf_llm_diagramv2_permissive.png ADDED Viewed

data/20230826_0615/hf_llm_diagramv2_rescore.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ ["garage-bAInd/Platypus2-70B-instruct", "upstage/llama-65b-instruct", "ehartford/samantha-1.1-llama-33b", "Open-Orca/OpenOrca-Platypus2-13B", "psmathur/orca_mini_v3_7b", "togethercomputer/GPT-JT-6B-v0", "openlm-research/open_llama_3b_v2", "open-llm-leaderboard/bloomz-1b7-4bit-alpaca-auto-eval-adapter-applied"]

data/20230826_0615/hf_llm_diagramv2_rescore.png ADDED Viewed

data/20230826_0615/hg_average_to_agentbench_compare.png ADDED Viewed

data/20230826_0615/hg_average_to_alpacaeval_compare.png ADDED Viewed

data/20230826_0615/hg_average_to_mosaic_compare.png ADDED Viewed

data/20230826_0615/hg_average_to_mt_bench_compare.png ADDED Viewed

data/20230826_0615/hg_average_to_opencompass_compare.png ADDED Viewed