Spaces:
Runtime error
Runtime error
rodrigomasini
committed on
Commit
•
ac08188
1
Parent(s):
3698e25
Update app.py
Browse files
app.py
CHANGED
@@ -744,15 +744,15 @@ def get_mteb_average():
|
|
744 |
# Debugging:
|
745 |
# DATA_OVERALL.to_csv("overall.csv")
|
746 |
|
747 |
-
DATA_OVERALL.insert(1, f"Average
|
748 |
-
DATA_OVERALL.insert(2, f"Classification Average
|
749 |
-
DATA_OVERALL.insert(3, f"Clustering Average
|
750 |
-
DATA_OVERALL.insert(4, f"Pair Classification Average
|
751 |
-
DATA_OVERALL.insert(5, f"Reranking Average
|
752 |
-
DATA_OVERALL.insert(6, f"Retrieval Average
|
753 |
-
DATA_OVERALL.insert(7, f"STS Average
|
754 |
-
DATA_OVERALL.insert(8, f"Summarization Average
|
755 |
-
DATA_OVERALL.sort_values(f"Average
|
756 |
# Start ranking from 1
|
757 |
DATA_OVERALL.insert(0, "Rank", list(range(1, len(DATA_OVERALL) + 1)))
|
758 |
|
@@ -769,14 +769,12 @@ def get_mteb_average():
|
|
769 |
# Fill NaN after averaging
|
770 |
DATA_OVERALL.fillna("", inplace=True)
|
771 |
|
772 |
-
DATA_OVERALL = DATA_OVERALL[["Rank", "Model", "Model Size (GB)", "Embedding Dimensions", "Max Tokens", f"Average
|
773 |
DATA_OVERALL = DATA_OVERALL[DATA_OVERALL.iloc[:, 5:].ne("").any(axis=1)]
|
774 |
|
775 |
return DATA_OVERALL
|
776 |
|
777 |
DATA_OVERALL=get_mteb_average()
|
778 |
-
print(DATA_OVERALL)
|
779 |
-
print(DATA_OVERALL.columns)
|
780 |
|
781 |
import unicodedata
|
782 |
|
@@ -798,9 +796,28 @@ for column in DATA_OVERALL.columns:
|
|
798 |
if DATA_OVERALL[column].dtype == 'object':
|
799 |
DATA_OVERALL[column] = DATA_OVERALL[column].apply(remove_invalid_unicode)
|
800 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
801 |
data_overall = gr.components.Dataframe(
|
802 |
-
|
803 |
-
|
|
|
804 |
visible=False,
|
805 |
line_breaks=False,
|
806 |
interactive=False
|
|
|
744 |
# Debugging:
|
745 |
# DATA_OVERALL.to_csv("overall.csv")
|
746 |
|
747 |
+
DATA_OVERALL.insert(1, f"Average", DATA_OVERALL[TASK_LIST_EN].mean(axis=1, skipna=False))
|
748 |
+
DATA_OVERALL.insert(2, f"Classification Average", DATA_OVERALL[TASK_LIST_CLASSIFICATION].mean(axis=1, skipna=False))
|
749 |
+
DATA_OVERALL.insert(3, f"Clustering Average", DATA_OVERALL[TASK_LIST_CLUSTERING].mean(axis=1, skipna=False))
|
750 |
+
DATA_OVERALL.insert(4, f"Pair Classification Average", DATA_OVERALL[TASK_LIST_PAIR_CLASSIFICATION].mean(axis=1, skipna=False))
|
751 |
+
DATA_OVERALL.insert(5, f"Reranking Average", DATA_OVERALL[TASK_LIST_RERANKING].mean(axis=1, skipna=False))
|
752 |
+
DATA_OVERALL.insert(6, f"Retrieval Average", DATA_OVERALL[TASK_LIST_RETRIEVAL].mean(axis=1, skipna=False))
|
753 |
+
DATA_OVERALL.insert(7, f"STS Average", DATA_OVERALL[TASK_LIST_STS].mean(axis=1, skipna=False))
|
754 |
+
DATA_OVERALL.insert(8, f"Summarization Average", DATA_OVERALL[TASK_LIST_SUMMARIZATION].mean(axis=1, skipna=False))
|
755 |
+
DATA_OVERALL.sort_values(f"Average", ascending=False, inplace=True)
|
756 |
# Start ranking from 1
|
757 |
DATA_OVERALL.insert(0, "Rank", list(range(1, len(DATA_OVERALL) + 1)))
|
758 |
|
|
|
769 |
# Fill NaN after averaging
|
770 |
DATA_OVERALL.fillna("", inplace=True)
|
771 |
|
772 |
+
DATA_OVERALL = DATA_OVERALL[["Rank", "Model", "Model Size (GB)", "Embedding Dimensions", "Max Tokens", f"Average", f"Classification Average", f"Clustering Average", f"Pair Classification Average", f"Reranking Average", f"Retrieval Average", f"STS Average", f"Summarization Average"]]
|
773 |
DATA_OVERALL = DATA_OVERALL[DATA_OVERALL.iloc[:, 5:].ne("").any(axis=1)]
|
774 |
|
775 |
return DATA_OVERALL
|
776 |
|
777 |
DATA_OVERALL=get_mteb_average()
|
|
|
|
|
778 |
|
779 |
import unicodedata
|
780 |
|
|
|
796 |
if DATA_OVERALL[column].dtype == 'object':
|
797 |
DATA_OVERALL[column] = DATA_OVERALL[column].apply(remove_invalid_unicode)
|
798 |
|
799 |
+
DATA_OVERALL_COLUMN_TO_DATATYPE = [
|
800 |
+
"Rank", "number",
|
801 |
+
"Model Size (GB)", "number",
|
802 |
+
"Embedding Dimensions", "number",
|
803 |
+
"Max Tokens", "number",
|
804 |
+
"Average", "number",
|
805 |
+
"Classification Average", "number",
|
806 |
+
"Classification Average", "number",
|
807 |
+
"Pair Classification Average", "number",
|
808 |
+
"Reranking Average", "number",
|
809 |
+
"Retrieval Average", "number",
|
810 |
+
"STS Average", "number",
|
811 |
+
"Summarization Average", "number"
|
812 |
+
]
|
813 |
+
|
814 |
+
COLS = [col.name for col in DATA_OVERALL_COLUMN_TO_DATATYPE]
|
815 |
+
TYPES = [col.type for col in DATA_OVERALL_COLUMN_TO_DATATYPE]
|
816 |
+
|
817 |
data_overall = gr.components.Dataframe(
|
818 |
+
DATA_OVERALL,
|
819 |
+
headers=COLS,
|
820 |
+
datatype=TYPES,
|
821 |
visible=False,
|
822 |
line_breaks=False,
|
823 |
interactive=False
|