Spaces:

dimbyTa
/

open-llm-leaderboard-viz

Sleeping

App Files Files Community

dimbyTa committed on Mar 11

Commit

ff0c7de

•

1 Parent(s): 174296d

adding feature of changing the order of the metrics on the circle of the chart

Browse files

Files changed (2) hide show

src/display.py +41 -8
src/load_data.py +31 -1

src/display.py CHANGED Viewed

@@ -1,10 +1,7 @@
-#import streamlit as st
-#from src.load_data import load_dataframe, sort_by
-#from src.plot import plot_radar_chart_index, plot_radar_chart_name
-#from st_aggrid import GridOptionsBuilder, AgGrid
 from st_aggrid import GridOptionsBuilder, AgGrid
 import streamlit as st
-from .load_data import load_dataframe, sort_by, show_dataframe_top, search_by_name
 from .plot import plot_radar_chart_name, plot_radar_chart_rows
@@ -32,8 +29,34 @@ def display_app():
     name = st.text_input(label = ":mag: Search by name")
     selection_mode = st.sidebar.radio(label= "Selection mode for the rows", options = ["single", "multiple"], index=0)
     st.sidebar.write("In multiple mode, you can select up to three models. If you select more than three models, only the first three will be displayed and plotted.")
     len_name_input = len(name)
     if len_name_input > 0:
         dataframe_by_search = search_by_name(name)
@@ -79,12 +102,22 @@ def display_app():
     with column2:
         if grid_response['selected_rows'] is not None and len(grid_response['selected_rows']) > 0:
-            figure = plot_radar_chart_rows(rows=grid_response['selected_rows'][:3])
-            #figure = plot_radar_chart_name(dataframe= dataframe, model_name=grid_response['selected_rows'][0]["model_name"])
             st.plotly_chart(figure, use_container_width=False)
         else:
             if len(subdata)>0:
-                figure = plot_radar_chart_name(dataframe=subdata, model_name=model_name)
                 st.plotly_chart(figure, use_container_width=True)
     if grid_response['selected_rows'] is not None and len(grid_response['selected_rows']) > 1:

 from st_aggrid import GridOptionsBuilder, AgGrid
 import streamlit as st
+from .load_data import load_dataframe, sort_by, show_dataframe_top, search_by_name, validate_categories
 from .plot import plot_radar_chart_name, plot_radar_chart_rows
     name = st.text_input(label = ":mag: Search by name")
+    #Sidebar configurations
     selection_mode = st.sidebar.radio(label= "Selection mode for the rows", options = ["single", "multiple"], index=0)
     st.sidebar.write("In multiple mode, you can select up to three models. If you select more than three models, only the first three will be displayed and plotted.")
+    ordering_metrics = st.sidebar.text_input(label = "Order of the metrics on the circle, counter-clock wise, beginning at 3 o'clock.",
+                                             placeholder = "ARC, GSM8K, TruthfulQA, Winogrande, HellaSwag, MMLU")
+    ordering_metrics = ordering_metrics.replace(" ", "")
+    ordering_metrics = ordering_metrics.split(",")
+    st.sidebar.markdown("""
+                        As a reminder, here are the different metrics:
+                        * ARC
+                        * GSM8K
+                        * TruthfulQA
+                        * Winogrande
+                        * HellaSwag
+                        * MMLU
+                        """)
+    st.sidebar.markdown("""
+                        If there are **typos** in the name of the metrics, or the number of metrics
+                        is **different of six**, there will be no effect on the chart and the
+                        default ordering will be used.
+                         """)
+    valid_categories = validate_categories(ordering_metrics)
+    # Search bar
     len_name_input = len(name)
     if len_name_input > 0:
         dataframe_by_search = search_by_name(name)
     with column2:
         if grid_response['selected_rows'] is not None and len(grid_response['selected_rows']) > 0:
+            figure = None
+            if valid_categories:
+                figure = plot_radar_chart_rows(rows=grid_response['selected_rows'][:3], categories = ordering_metrics)
+            else:
+                figure = plot_radar_chart_rows(rows=grid_response['selected_rows'][:3])
             st.plotly_chart(figure, use_container_width=False)
         else:
             if len(subdata)>0:
+                figure = None
+                if valid_categories:
+                    figure = plot_radar_chart_name(dataframe=subdata, categories = ordering_metrics, model_name=model_name)
+                else:
+                    figure = plot_radar_chart_name(dataframe=subdata, model_name=model_name)
                 st.plotly_chart(figure, use_container_width=True)
     if grid_response['selected_rows'] is not None and len(grid_response['selected_rows']) > 1:

src/load_data.py CHANGED Viewed

@@ -54,4 +54,34 @@ def search_by_name(name: str) -> pd.DataFrame:
     """
     dataframe = load_dataframe()
     indexes = dataframe["model_name"].str.contains(name)
-    return dataframe[indexes]

     """
     dataframe = load_dataframe()
     indexes = dataframe["model_name"].str.contains(name)
+    return dataframe[indexes]
def validate_categories(categories: list) -> bool:
    """
    Check whether a list of metric names is a valid ordering of the six metrics.

    Arguments:
    - categories: a list of metric names giving the desired ordering of the
      columns. It is valid only when it contains each of the following names
      exactly once, in any order (the comparison is case-sensitive):
        - ARC
        - GSM8K
        - TruthfulQA
        - Winogrande
        - HellaSwag
        - MMLU

    Returns
    - True if the list has exactly six elements and every metric name is present
    - False otherwise (wrong number of elements, typo, duplicate or missing name)
    """
    expected_metrics = ("ARC", "GSM8K", "TruthfulQA", "Winogrande", "HellaSwag", "MMLU")
    if len(categories) != len(expected_metrics):
        return False
    # With exactly six entries, containing all six names implies that each one
    # appears once, so no separate duplicate check is needed.
    return all(metric in categories for metric in expected_metrics)