rodrigomasini commited on
Commit
ac08188
1 Parent(s): 3698e25

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +31 -14
app.py CHANGED
@@ -744,15 +744,15 @@ def get_mteb_average():
744
  # Debugging:
745
  # DATA_OVERALL.to_csv("overall.csv")
746
 
747
- DATA_OVERALL.insert(1, f"Average ({len(TASK_LIST_EN)} datasets)", DATA_OVERALL[TASK_LIST_EN].mean(axis=1, skipna=False))
748
- DATA_OVERALL.insert(2, f"Classification Average ({len(TASK_LIST_CLASSIFICATION)} datasets)", DATA_OVERALL[TASK_LIST_CLASSIFICATION].mean(axis=1, skipna=False))
749
- DATA_OVERALL.insert(3, f"Clustering Average ({len(TASK_LIST_CLUSTERING)} datasets)", DATA_OVERALL[TASK_LIST_CLUSTERING].mean(axis=1, skipna=False))
750
- DATA_OVERALL.insert(4, f"Pair Classification Average ({len(TASK_LIST_PAIR_CLASSIFICATION)} datasets)", DATA_OVERALL[TASK_LIST_PAIR_CLASSIFICATION].mean(axis=1, skipna=False))
751
- DATA_OVERALL.insert(5, f"Reranking Average ({len(TASK_LIST_RERANKING)} datasets)", DATA_OVERALL[TASK_LIST_RERANKING].mean(axis=1, skipna=False))
752
- DATA_OVERALL.insert(6, f"Retrieval Average ({len(TASK_LIST_RETRIEVAL)} datasets)", DATA_OVERALL[TASK_LIST_RETRIEVAL].mean(axis=1, skipna=False))
753
- DATA_OVERALL.insert(7, f"STS Average ({len(TASK_LIST_STS)} datasets)", DATA_OVERALL[TASK_LIST_STS].mean(axis=1, skipna=False))
754
- DATA_OVERALL.insert(8, f"Summarization Average ({len(TASK_LIST_SUMMARIZATION)} dataset)", DATA_OVERALL[TASK_LIST_SUMMARIZATION].mean(axis=1, skipna=False))
755
- DATA_OVERALL.sort_values(f"Average ({len(TASK_LIST_EN)} datasets)", ascending=False, inplace=True)
756
  # Start ranking from 1
757
  DATA_OVERALL.insert(0, "Rank", list(range(1, len(DATA_OVERALL) + 1)))
758
 
@@ -769,14 +769,12 @@ def get_mteb_average():
769
  # Fill NaN after averaging
770
  DATA_OVERALL.fillna("", inplace=True)
771
 
772
- DATA_OVERALL = DATA_OVERALL[["Rank", "Model", "Model Size (GB)", "Embedding Dimensions", "Max Tokens", f"Average ({len(TASK_LIST_EN)} datasets)", f"Classification Average ({len(TASK_LIST_CLASSIFICATION)} datasets)", f"Clustering Average ({len(TASK_LIST_CLUSTERING)} datasets)", f"Pair Classification Average ({len(TASK_LIST_PAIR_CLASSIFICATION)} datasets)", f"Reranking Average ({len(TASK_LIST_RERANKING)} datasets)", f"Retrieval Average ({len(TASK_LIST_RETRIEVAL)} datasets)", f"STS Average ({len(TASK_LIST_STS)} datasets)", f"Summarization Average ({len(TASK_LIST_SUMMARIZATION)} dataset)"]]
773
  DATA_OVERALL = DATA_OVERALL[DATA_OVERALL.iloc[:, 5:].ne("").any(axis=1)]
774
 
775
  return DATA_OVERALL
776
 
777
  DATA_OVERALL=get_mteb_average()
778
- print(DATA_OVERALL)
779
- print(DATA_OVERALL.columns)
780
 
781
  import unicodedata
782
 
@@ -798,9 +796,28 @@ for column in DATA_OVERALL.columns:
798
  if DATA_OVERALL[column].dtype == 'object':
799
  DATA_OVERALL[column] = DATA_OVERALL[column].apply(remove_invalid_unicode)
800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
801
  data_overall = gr.components.Dataframe(
802
- headers=DATA_OVERALL.columns.tolist(),
803
- datatype=DATA_OVERALL.values.tolist(),
 
804
  visible=False,
805
  line_breaks=False,
806
  interactive=False
 
744
  # Debugging:
745
  # DATA_OVERALL.to_csv("overall.csv")
746
 
747
+ DATA_OVERALL.insert(1, f"Average", DATA_OVERALL[TASK_LIST_EN].mean(axis=1, skipna=False))
748
+ DATA_OVERALL.insert(2, f"Classification Average", DATA_OVERALL[TASK_LIST_CLASSIFICATION].mean(axis=1, skipna=False))
749
+ DATA_OVERALL.insert(3, f"Clustering Average", DATA_OVERALL[TASK_LIST_CLUSTERING].mean(axis=1, skipna=False))
750
+ DATA_OVERALL.insert(4, f"Pair Classification Average", DATA_OVERALL[TASK_LIST_PAIR_CLASSIFICATION].mean(axis=1, skipna=False))
751
+ DATA_OVERALL.insert(5, f"Reranking Average", DATA_OVERALL[TASK_LIST_RERANKING].mean(axis=1, skipna=False))
752
+ DATA_OVERALL.insert(6, f"Retrieval Average", DATA_OVERALL[TASK_LIST_RETRIEVAL].mean(axis=1, skipna=False))
753
+ DATA_OVERALL.insert(7, f"STS Average", DATA_OVERALL[TASK_LIST_STS].mean(axis=1, skipna=False))
754
+ DATA_OVERALL.insert(8, f"Summarization Average", DATA_OVERALL[TASK_LIST_SUMMARIZATION].mean(axis=1, skipna=False))
755
+ DATA_OVERALL.sort_values(f"Average", ascending=False, inplace=True)
756
  # Start ranking from 1
757
  DATA_OVERALL.insert(0, "Rank", list(range(1, len(DATA_OVERALL) + 1)))
758
 
 
769
  # Fill NaN after averaging
770
  DATA_OVERALL.fillna("", inplace=True)
771
 
772
+ DATA_OVERALL = DATA_OVERALL[["Rank", "Model", "Model Size (GB)", "Embedding Dimensions", "Max Tokens", f"Average", f"Classification Average", f"Clustering Average", f"Pair Classification Average", f"Reranking Average", f"Retrieval Average", f"STS Average", f"Summarization Average"]]
773
  DATA_OVERALL = DATA_OVERALL[DATA_OVERALL.iloc[:, 5:].ne("").any(axis=1)]
774
 
775
  return DATA_OVERALL
776
 
777
  DATA_OVERALL=get_mteb_average()
 
 
778
 
779
  import unicodedata
780
 
 
796
  if DATA_OVERALL[column].dtype == 'object':
797
  DATA_OVERALL[column] = DATA_OVERALL[column].apply(remove_invalid_unicode)
798
 
799
+ DATA_OVERALL_COLUMN_TO_DATATYPE = [
800
+ "Rank", "number",
801
+ "Model Size (GB)", "number",
802
+ "Embedding Dimensions", "number",
803
+ "Max Tokens", "number",
804
+ "Average", "number",
805
+ "Classification Average", "number",
806
+ "Classification Average", "number",
807
+ "Pair Classification Average", "number",
808
+ "Reranking Average", "number",
809
+ "Retrieval Average", "number",
810
+ "STS Average", "number",
811
+ "Summarization Average", "number"
812
+ ]
813
+
814
+ COLS = [col.name for col in DATA_OVERALL_COLUMN_TO_DATATYPE]
815
+ TYPES = [col.type for col in DATA_OVERALL_COLUMN_TO_DATATYPE]
816
+
817
  data_overall = gr.components.Dataframe(
818
+ DATA_OVERALL,
819
+ headers=COLS,
820
+ datatype=TYPES,
821
  visible=False,
822
  line_breaks=False,
823
  interactive=False