Spaces:

felixz
/

meta_open_llm_leaderboard

Sleeping

felix committed on Sep 7, 2023

Commit

b9fbf95

•

1 Parent(s): 67e2a45

add

Files changed (6) hide show

app.py CHANGED Viewed

@@ -44,6 +44,7 @@ imgs = glob.glob(os.path.join(data_path, '*.png'))
 # Extracting images that start with "hf_llm_diagram"
 hf_llm_diagrams = [img for img in imgs if 'hf_llm_diagram' in os.path.basename(img)]
 # Getting the remaining images
 remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
@@ -105,6 +106,13 @@ cols[1].image(hf_llm_diagrams[2],caption="Commercially permissive license only",
 print_model_list(hf_llm_diagrams[2],cols[1])
 st.divider()
 st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")
 st.caption("Only models evaluated on both leaderboards are included.")
@@ -130,6 +138,7 @@ st.write(
         <li><a href="https://www.mosaicml.com/llm-evaluation">MosaicML</a> Balanced set of static benchmarks</li>
         <li><a href="https://opencompass.org.cn/leaderboard-llm">OpenCompass</a> Balanced set of static benchmarks</li>
         <li><a href="https://llmbench.ai/data">AgentBench</a> Benchmark evaluating Agent abilities</li>
         </ul>
     """, unsafe_allow_html=True
 )

 # Extracting images that start with "hf_llm_diagram"
 hf_llm_diagrams = [img for img in imgs if 'hf_llm_diagram' in os.path.basename(img)]
+bigcode_diagrams = [img for img in imgs if 'bigcode' in os.path.basename(img)]
 # Getting the remaining images
 remaining_imgs = [img for img in imgs if 'hf_llm_diagram' not in os.path.basename(img)]
 print_model_list(hf_llm_diagrams[2],cols[1])
+st.divider()
+st.write("Big Code Models Leaderboard")
+st.image(bigcode_diagrams[0],use_column_width="auto")
+print_model_list(bigcode_diagrams[0],st,True)
 st.divider()
 st.write("HuggingFace and Other Leaderboards: A Comparative Model Evaluation")
 st.caption("Only models evaluated on both leaderboards are included.")
         <li><a href="https://www.mosaicml.com/llm-evaluation">MosaicML</a> Balanced set of static benchmarks</li>
         <li><a href="https://opencompass.org.cn/leaderboard-llm">OpenCompass</a> Balanced set of static benchmarks</li>
         <li><a href="https://llmbench.ai/data">AgentBench</a> Benchmark evaluating Agent abilities</li>
+        <li><a href="https://huggingface.co/spaces/bigcode/bigcode-models-leaderboard">BigCode</a>  Compare performance of base multilingual code generation models</li>
         </ul>
     """, unsafe_allow_html=True
 )

data/20230820_0354/bigcode_leaderboard.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ []

data/20230823_0545/bigcode_leaderboard.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ []

data/20230824_0626/bigcode_leaderboard.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ []

data/20230825_0828/bigcode_leaderboard.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ []

fix_old_data.py CHANGED Viewed

@@ -6,6 +6,8 @@ data_path = './data/'
 no_generated_image_path = './no_generated_image.png'  # Update this path to the location of no_generated_image.png
 expected_files = [
     'hf_llm_diagramv2.json',
     'hf_llm_diagramv2.png',
     'hf_llm_diagramv2_other_permissive.json',

 no_generated_image_path = './no_generated_image.png'  # Update this path to the location of no_generated_image.png
 expected_files = [
+    'bigcode_leaderboard.json',
+    'bigcode_leaderboard.png',
     'hf_llm_diagramv2.json',
     'hf_llm_diagramv2.png',
     'hf_llm_diagramv2_other_permissive.json',