Spaces:
Runtime error
Runtime error
Santi Diana
committed on
Commit
·
c4a71e3
1
Parent(s):
8a7bf5e
Updated Leaderboard. Added multi-dataset models and dataset-AUGMENTED models; also performed some reproductions.
Browse files
- .DS_Store +0 -0
- add_new_model/mteb_metadata.yaml +0 -114
- data/classification.csv +9 -4
- data/general.csv +9 -4
- data/sts.csv +9 -4
.DS_Store
CHANGED
Binary files a/.DS_Store and b/.DS_Store differ
|
|
add_new_model/mteb_metadata.yaml
DELETED
@@ -1,114 +0,0 @@
|
|
1 |
-
---
|
2 |
-
tags:
|
3 |
-
- mteb
|
4 |
-
model-index:
|
5 |
-
- name: multilingual-e5-large-STSAUGMENTED-b16-e10
|
6 |
-
results:
|
7 |
-
- task:
|
8 |
-
type: Classification
|
9 |
-
dataset:
|
10 |
-
type: mteb/amazon_reviews_multi
|
11 |
-
name: MTEB AmazonReviewsClassification (es)
|
12 |
-
config: es
|
13 |
-
split: test
|
14 |
-
revision: 1399c76144fd37290681b995c656ef9b2e06e26d
|
15 |
-
metrics:
|
16 |
-
- type: accuracy
|
17 |
-
value: 42.114
|
18 |
-
- type: f1
|
19 |
-
value: 40.962817058318876
|
20 |
-
- task:
|
21 |
-
type: Classification
|
22 |
-
dataset:
|
23 |
-
type: mteb/mtop_domain
|
24 |
-
name: MTEB MTOPDomainClassification (es)
|
25 |
-
config: es
|
26 |
-
split: test
|
27 |
-
revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
|
28 |
-
metrics:
|
29 |
-
- type: accuracy
|
30 |
-
value: 80.92394929953302
|
31 |
-
- type: f1
|
32 |
-
value: 80.87019762034018
|
33 |
-
- task:
|
34 |
-
type: Classification
|
35 |
-
dataset:
|
36 |
-
type: mteb/mtop_intent
|
37 |
-
name: MTEB MTOPIntentClassification (es)
|
38 |
-
config: es
|
39 |
-
split: test
|
40 |
-
revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
|
41 |
-
metrics:
|
42 |
-
- type: accuracy
|
43 |
-
value: 53.32555036691128
|
44 |
-
- type: f1
|
45 |
-
value: 37.93993994854238
|
46 |
-
- task:
|
47 |
-
type: Classification
|
48 |
-
dataset:
|
49 |
-
type: mteb/amazon_massive_intent
|
50 |
-
name: MTEB MassiveIntentClassification (es)
|
51 |
-
config: es
|
52 |
-
split: test
|
53 |
-
revision: 31efe3c427b0bae9c22cbb560b8f15491cc6bed7
|
54 |
-
metrics:
|
55 |
-
- type: accuracy
|
56 |
-
value: 60.178211163416286
|
57 |
-
- type: f1
|
58 |
-
value: 60.03972849482204
|
59 |
-
- task:
|
60 |
-
type: Classification
|
61 |
-
dataset:
|
62 |
-
type: mteb/amazon_massive_scenario
|
63 |
-
name: MTEB MassiveScenarioClassification (es)
|
64 |
-
config: es
|
65 |
-
split: test
|
66 |
-
revision: 7d571f92784cd94a019292a1f45445077d0ef634
|
67 |
-
metrics:
|
68 |
-
- type: accuracy
|
69 |
-
value: 64.1930060524546
|
70 |
-
- type: f1
|
71 |
-
value: 64.02551940330545
|
72 |
-
- task:
|
73 |
-
type: STS
|
74 |
-
dataset:
|
75 |
-
type: mteb/sts17-crosslingual-sts
|
76 |
-
name: MTEB STS17 (es-es)
|
77 |
-
config: es-es
|
78 |
-
split: test
|
79 |
-
revision: af5e6fb845001ecf41f4c1e033ce921939a2a68d
|
80 |
-
metrics:
|
81 |
-
- type: cos_sim_pearson
|
82 |
-
value: 88.27146953394649
|
83 |
-
- type: cos_sim_spearman
|
84 |
-
value: 88.57657349986717
|
85 |
-
- type: euclidean_pearson
|
86 |
-
value: 89.07302053356283
|
87 |
-
- type: euclidean_spearman
|
88 |
-
value: 88.57431075359631
|
89 |
-
- type: manhattan_pearson
|
90 |
-
value: 89.11306099359507
|
91 |
-
- type: manhattan_spearman
|
92 |
-
value: 88.61591595032135
|
93 |
-
- task:
|
94 |
-
type: STS
|
95 |
-
dataset:
|
96 |
-
type: mteb/sts22-crosslingual-sts
|
97 |
-
name: MTEB STS22 (es)
|
98 |
-
config: es
|
99 |
-
split: test
|
100 |
-
revision: 6d1ba47164174a496b7fa5d3569dae26a6813b80
|
101 |
-
metrics:
|
102 |
-
- type: cos_sim_pearson
|
103 |
-
value: 65.57570700756301
|
104 |
-
- type: cos_sim_spearman
|
105 |
-
value: 70.33230514473709
|
106 |
-
- type: euclidean_pearson
|
107 |
-
value: 66.56411956377407
|
108 |
-
- type: euclidean_spearman
|
109 |
-
value: 70.33230514473709
|
110 |
-
- type: manhattan_pearson
|
111 |
-
value: 66.32203605146594
|
112 |
-
- type: manhattan_spearman
|
113 |
-
value: 70.34809182527435
|
114 |
-
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
data/classification.csv
CHANGED
@@ -12,8 +12,6 @@ paraphrase-multilingual-mpnet-BASE-v2-ft-stsb_multi_mt-embeddings,64.0,37.25,86.
|
|
12 |
mstsb-paraphrase-multilingual-mpnet-BASE-v2,64.47,38.29,86.04,67.06,63.47,67.53
|
13 |
multilingual-e5-BASE-b16-e10,65.09,43.4,89.02,61.7,63.06,68.25
|
14 |
multilingual-e5-LARGE-stsb-tuned-b32-e10,66.19,43.31,89.3,64.04,64.62,69.69
|
15 |
-
multilingual-e5-LARGE-stsb-tuned-b16-e10,67.1,43.72,90.29,65.51,65.13,70.84
|
16 |
-
multilingual-e5-LARGE-stsb-tuned-b16-e5,66.23,43.62,89.33,62.93,65.11,70.16
|
17 |
multilingual-e5-LARGE-stsb-tuned-b64-e10,64.58,43.71,88.84,60.2,62.74,67.4
|
18 |
LaBSE,61.97,39.39,84.07,64.44,58.32,63.61
|
19 |
multilingual-e5-BASE-stsb-tuned-b16-e10-all-languages,64.39,43.04,88.81,59.25,63.04,67.8
|
@@ -21,5 +19,12 @@ bge-BASE-tuned-b16-e10,50.83,31.34,74.1,45.63,48.72,54.36
|
|
21 |
multilingual-e5-LARGE-stsb-tuned-b16-e10-all-languages,64.93,42.98,87.96,60.91,63.78,69.02
|
22 |
bge-LARGE-tuned-b16-e10,51.67,31.72,76.04,48.01,48.9,53.66
|
23 |
multilingual-e5-LARGE-stsb-tuned-b16-e15,67.56,43.35,90.98,67.27,65.35,70.87
|
24 |
-
|
25 |
-
multilingual-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
mstsb-paraphrase-multilingual-mpnet-BASE-v2,64.47,38.29,86.04,67.06,63.47,67.53
|
13 |
multilingual-e5-BASE-b16-e10,65.09,43.4,89.02,61.7,63.06,68.25
|
14 |
multilingual-e5-LARGE-stsb-tuned-b32-e10,66.19,43.31,89.3,64.04,64.62,69.69
|
|
|
|
|
15 |
multilingual-e5-LARGE-stsb-tuned-b64-e10,64.58,43.71,88.84,60.2,62.74,67.4
|
16 |
LaBSE,61.97,39.39,84.07,64.44,58.32,63.61
|
17 |
multilingual-e5-BASE-stsb-tuned-b16-e10-all-languages,64.39,43.04,88.81,59.25,63.04,67.8
|
|
|
19 |
multilingual-e5-LARGE-stsb-tuned-b16-e10-all-languages,64.93,42.98,87.96,60.91,63.78,69.02
|
20 |
bge-LARGE-tuned-b16-e10,51.67,31.72,76.04,48.01,48.9,53.66
|
21 |
multilingual-e5-LARGE-stsb-tuned-b16-e15,67.56,43.35,90.98,67.27,65.35,70.87
|
22 |
+
text2vec-base-multilingual,58.64,34.82,79.24,58.69,58.28,62.2
|
23 |
+
paraphrase-multilingual-MiniLM-L12-v2,61.1,37.49,83.04,60.28,59.66,65.04
|
24 |
+
text2vec-stsb-tuned-b16-e5,57.19,34.64,77.72,56.46,56.94,60.22
|
25 |
+
paraphrase-multilingual-MiniLM-L12-v2-stsb-tuned-b16-e5,60.41,37.28,82.83,60.45,58.56,62.96
|
26 |
+
multilingual-e5-LARGE-tuned-double-dataset-b16-e5,62.65,42.33,85.21,57.01,62.09,66.61
|
27 |
+
multilingual-e5-LARGE-stsb-tuned-b16-e5,66.33,43.02,89.71,64.4,64.8,69.72
|
28 |
+
multilingual-e5-LARGE-stsb-tuned-b16-e10,66.77,43.86,89.45,64.87,65.13,70.51
|
29 |
+
multilingual-e5-LARGE-STSAUGMENTED-b16-e5,64.23,44.25,86.83,59.76,63.08,67.21
|
30 |
+
multilingual-e5-LARGE-double-finetuning-b16-e5,63.55,44.23,86.21,57.96,62.58,66.75
|
data/general.csv
CHANGED
@@ -12,8 +12,6 @@ paraphrase-multilingual-mpnet-BASE-v2-ft-stsb_multi_mt-embeddings,,,68.62,64.0,,
|
|
12 |
mstsb-paraphrase-multilingual-mpnet-BASE-v2,,,69.39,64.48,,74.29,
|
13 |
multilingual-e5-BASE-b16-e10,,,71.97,65.09,,78.86,
|
14 |
multilingual-e5-LARGE-stsb-tuned-b32-e10,,,72.73,66.19,,79.27,
|
15 |
-
multilingual-e5-LARGE-stsb-tuned-b16-e10,,,73.07,67.1,,79.05,
|
16 |
-
multilingual-e5-LARGE-stsb-tuned-b16-e5,,,72.84,66.23,,79.46,
|
17 |
multilingual-e5-LARGE-stsb-tuned-b64-e10,,,71.83,64.58,,79.08,
|
18 |
LaBSE,,,66.99,61.97,,72.01,
|
19 |
multilingual-e5-BASE-stsb-tuned-b16-e10-all-languages,,,71.88,64.39,,79.38,
|
@@ -21,5 +19,12 @@ bge-BASE-tuned-b16-e10,,,59.69,50.83,,68.55,
|
|
21 |
multilingual-e5-LARGE-stsb-tuned-b16-e10-all-languages,,,72.22,64.93,,79.5,
|
22 |
bge-LARGE-tuned-b16-e10,,,61.5,51.67,,71.34,
|
23 |
multilingual-e5-LARGE-stsb-tuned-b16-e15,,,73.38,67.56,,79.19,
|
24 |
-
|
25 |
-
multilingual-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
mstsb-paraphrase-multilingual-mpnet-BASE-v2,,,69.39,64.48,,74.29,
|
13 |
multilingual-e5-BASE-b16-e10,,,71.97,65.09,,78.86,
|
14 |
multilingual-e5-LARGE-stsb-tuned-b32-e10,,,72.73,66.19,,79.27,
|
|
|
|
|
15 |
multilingual-e5-LARGE-stsb-tuned-b64-e10,,,71.83,64.58,,79.08,
|
16 |
LaBSE,,,66.99,61.97,,72.01,
|
17 |
multilingual-e5-BASE-stsb-tuned-b16-e10-all-languages,,,71.88,64.39,,79.38,
|
|
|
19 |
multilingual-e5-LARGE-stsb-tuned-b16-e10-all-languages,,,72.22,64.93,,79.5,
|
20 |
bge-LARGE-tuned-b16-e10,,,61.5,51.67,,71.34,
|
21 |
multilingual-e5-LARGE-stsb-tuned-b16-e15,,,73.38,67.56,,79.19,
|
22 |
+
text2vec-base-multilingual,,,66.04,58.64,,73.43,
|
23 |
+
paraphrase-multilingual-MiniLM-L12-v2,,,66.08,61.1,,71.06,
|
24 |
+
text2vec-stsb-tuned-b16-e5,,,66.0,57.19,,74.81,
|
25 |
+
paraphrase-multilingual-MiniLM-L12-v2-stsb-tuned-b16-e5,,,68.21,60.41,,76.01,
|
26 |
+
multilingual-e5-LARGE-tuned-double-dataset-b16-e5,,,71.19,62.65,,79.74,
|
27 |
+
multilingual-e5-LARGE-stsb-tuned-b16-e5,,,72.9,66.33,,79.47,
|
28 |
+
multilingual-e5-LARGE-stsb-tuned-b16-e10,,,73.03,66.77,,79.29,
|
29 |
+
multilingual-e5-LARGE-STSAUGMENTED-b16-e5,,,71.84,64.23,,79.44,
|
30 |
+
multilingual-e5-LARGE-double-finetuning-b16-e5,,,71.53,63.55,,79.5,
|
data/sts.csv
CHANGED
@@ -12,8 +12,6 @@ paraphrase-multilingual-mpnet-BASE-v2-ft-stsb_multi_mt-embeddings,73.24,86.89,59
|
|
12 |
mstsb-paraphrase-multilingual-mpnet-BASE-v2,74.28,88.22,60.36
|
13 |
multilingual-e5-BASE-b16-e10,78.86,87.51,70.21
|
14 |
multilingual-e5-LARGE-stsb-tuned-b32-e10,79.27,88.1,70.44
|
15 |
-
multilingual-e5-LARGE-stsb-tuned-b16-e10,79.05,88.53,69.58
|
16 |
-
multilingual-e5-LARGE-stsb-tuned-b16-e5,79.46,88.44,70.48
|
17 |
multilingual-e5-LARGE-stsb-tuned-b64-e10,79.08,88.03,70.12
|
18 |
LaBSE,72.01,80.83,63.18
|
19 |
multilingual-e5-BASE-stsb-tuned-b16-e10-all-languages,79.38,87.77,70.99
|
@@ -21,5 +19,12 @@ bge-BASE-tuned-b16-e10,68.55,82.01,55.08
|
|
21 |
multilingual-e5-LARGE-stsb-tuned-b16-e10-all-languages,79.5,88.66,70.35
|
22 |
bge-LARGE-tuned-b16-e10,71.34,81.57,61.12
|
23 |
multilingual-e5-LARGE-stsb-tuned-b16-e15,79.19,89.04,69.34
|
24 |
-
|
25 |
-
multilingual-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
mstsb-paraphrase-multilingual-mpnet-BASE-v2,74.28,88.22,60.36
|
13 |
multilingual-e5-BASE-b16-e10,78.86,87.51,70.21
|
14 |
multilingual-e5-LARGE-stsb-tuned-b32-e10,79.27,88.1,70.44
|
|
|
|
|
15 |
multilingual-e5-LARGE-stsb-tuned-b64-e10,79.08,88.03,70.12
|
16 |
LaBSE,72.01,80.83,63.18
|
17 |
multilingual-e5-BASE-stsb-tuned-b16-e10-all-languages,79.38,87.77,70.99
|
|
|
19 |
multilingual-e5-LARGE-stsb-tuned-b16-e10-all-languages,79.5,88.66,70.35
|
20 |
bge-LARGE-tuned-b16-e10,71.34,81.57,61.12
|
21 |
multilingual-e5-LARGE-stsb-tuned-b16-e15,79.19,89.04,69.34
|
22 |
+
text2vec-base-multilingual,73.43,87.91,58.94
|
23 |
+
paraphrase-multilingual-MiniLM-L12-v2,71.06,85.56,56.56
|
24 |
+
text2vec-stsb-tuned-b16-e5,74.81,88.28,61.34
|
25 |
+
paraphrase-multilingual-MiniLM-L12-v2-stsb-tuned-b16-e5,76.01,88.03,63.99
|
26 |
+
multilingual-e5-LARGE-tuned-double-dataset-b16-e5,79.74,88.98,70.5
|
27 |
+
multilingual-e5-LARGE-stsb-tuned-b16-e5,79.47,88.72,70.21
|
28 |
+
multilingual-e5-LARGE-stsb-tuned-b16-e10,79.29,89.1,69.48
|
29 |
+
multilingual-e5-LARGE-STSAUGMENTED-b16-e5,79.44,88.78,70.11
|
30 |
+
multilingual-e5-LARGE-double-finetuning-b16-e5,79.5,88.63,70.37
|