Ludwig Stumpp committed on
Commit
5a5e2af
2 Parent(s): 2fc8d56 af4ecbe

Merge remote-tracking branch 'origin/main' into hf-launch

Browse files
Files changed (2) hide show
  1. README.md +0 -0
  2. streamlit_app.py +8 -5
README.md CHANGED
The diff for this file is too large to render. See raw diff
 
streamlit_app.py CHANGED
@@ -214,15 +214,17 @@ def setup_leaderboard(readme: str):
214
 
215
  st.markdown("## Leaderboard")
216
  modify = st.checkbox("Add filters")
 
 
217
  if modify:
218
  df_leaderboard = filter_dataframe_by_row_and_columns(df_leaderboard, ignore_columns=NON_BENCHMARK_COLS)
219
  df_leaderboard = filter_dataframe_by_column_values(df_leaderboard)
220
 
221
- df_leaderboard = df_leaderboard.dropna(axis=1, how="all")
222
-
223
- benchmark_columns = [c for c in df_leaderboard.columns if df_leaderboard[c].dtype == float]
224
- rows_wo_any_benchmark = df_leaderboard[benchmark_columns].isna().all(axis=1)
225
- df_leaderboard = df_leaderboard[~rows_wo_any_benchmark]
226
 
227
  st.dataframe(df_leaderboard)
228
 
@@ -273,6 +275,7 @@ def setup_sources():
273
  - [lmsys.org - Chatbot Arena benchmarks](https://lmsys.org/blog/2023-05-03-arena/)
274
  - [Papers With Code](https://paperswithcode.com/)
275
  - [Stanford HELM](https://crfm.stanford.edu/helm/latest/)
 
276
  """
277
  )
278
 
 
214
 
215
  st.markdown("## Leaderboard")
216
  modify = st.checkbox("Add filters")
217
+ clear_empty_entries = st.checkbox("Clear empty entries", value=True)
218
+
219
  if modify:
220
  df_leaderboard = filter_dataframe_by_row_and_columns(df_leaderboard, ignore_columns=NON_BENCHMARK_COLS)
221
  df_leaderboard = filter_dataframe_by_column_values(df_leaderboard)
222
 
223
+ if clear_empty_entries:
224
+ df_leaderboard = df_leaderboard.dropna(axis=1, how="all")
225
+ benchmark_columns = [c for c in df_leaderboard.columns if df_leaderboard[c].dtype == float]
226
+ rows_wo_any_benchmark = df_leaderboard[benchmark_columns].isna().all(axis=1)
227
+ df_leaderboard = df_leaderboard[~rows_wo_any_benchmark]
228
 
229
  st.dataframe(df_leaderboard)
230
 
 
275
  - [lmsys.org - Chatbot Arena benchmarks](https://lmsys.org/blog/2023-05-03-arena/)
276
  - [Papers With Code](https://paperswithcode.com/)
277
  - [Stanford HELM](https://crfm.stanford.edu/helm/latest/)
278
+ - [HF Open LLM Leaderboard](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard)
279
  """
280
  )
281