metadata
tags:
- mteb
model-index:
- name: xlm_0b6_mixlang_newstep3
results:
- task:
type: Classification
dataset:
type: mteb/amazon_counterfactual
name: MTEB AmazonCounterfactualClassification (en)
config: en
split: test
revision: e8379541af4e31359cca9fbcf4b00f2671dba205
metrics:
- type: accuracy
value: 68.61194029850746
- type: ap
value: 30.653298301473487
- type: f1
value: 62.25241612666261
- task:
type: Classification
dataset:
type: mteb/amazon_polarity
name: MTEB AmazonPolarityClassification
config: default
split: test
revision: e2d317d38cd51312af73b3d32a06d1a08b442046
metrics:
- type: accuracy
value: 93.38145000000002
- type: ap
value: 90.31356902458496
- type: f1
value: 93.37421180090173
- task:
type: Classification
dataset:
type: mteb/amazon_reviews_multi
name: MTEB AmazonReviewsClassification (en)
config: en
split: test
revision: 1399c76144fd37290681b995c656ef9b2e06e26d
metrics:
- type: accuracy
value: 50.64400000000001
- type: f1
value: 48.975535848642295
- task:
type: Retrieval
dataset:
type: arguana
name: MTEB ArguAna
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 18.777
- type: map_at_10
value: 32.274
- type: map_at_100
value: 33.652
- type: map_at_1000
value: 33.669
- type: map_at_3
value: 27.276
- type: map_at_5
value: 29.758000000000003
- type: mrr_at_1
value: 19.63
- type: mrr_at_10
value: 32.573
- type: mrr_at_100
value: 33.951
- type: mrr_at_1000
value: 33.967999999999996
- type: mrr_at_3
value: 27.608
- type: mrr_at_5
value: 30.047
- type: ndcg_at_1
value: 18.777
- type: ndcg_at_10
value: 40.774
- type: ndcg_at_100
value: 46.931
- type: ndcg_at_1000
value: 47.359
- type: ndcg_at_3
value: 30.213
- type: ndcg_at_5
value: 34.705999999999996
- type: precision_at_1
value: 18.777
- type: precision_at_10
value: 6.842
- type: precision_at_100
value: 0.959
- type: precision_at_1000
value: 0.099
- type: precision_at_3
value: 12.921
- type: precision_at_5
value: 9.943
- type: recall_at_1
value: 18.777
- type: recall_at_10
value: 68.42099999999999
- type: recall_at_100
value: 95.946
- type: recall_at_1000
value: 99.289
- type: recall_at_3
value: 38.762
- type: recall_at_5
value: 49.716
- task:
type: Clustering
dataset:
type: mteb/arxiv-clustering-p2p
name: MTEB ArxivClusteringP2P
config: default
split: test
revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
metrics:
- type: v_measure
value: 45.53512209912995
- task:
type: Clustering
dataset:
type: mteb/arxiv-clustering-s2s
name: MTEB ArxivClusteringS2S
config: default
split: test
revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
metrics:
- type: v_measure
value: 38.432491784931464
- task:
type: Reranking
dataset:
type: mteb/askubuntudupquestions-reranking
name: MTEB AskUbuntuDupQuestions
config: default
split: test
revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
metrics:
- type: map
value: 61.11465519830743
- type: mrr
value: 74.41509475442992
- task:
type: STS
dataset:
type: mteb/biosses-sts
name: MTEB BIOSSES
config: default
split: test
revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
metrics:
- type: cos_sim_pearson
value: 82.1318467537697
- type: cos_sim_spearman
value: 80.25062374562512
- type: euclidean_pearson
value: 81.08228995090938
- type: euclidean_spearman
value: 80.25062374562512
- type: manhattan_pearson
value: 80.69075497902021
- type: manhattan_spearman
value: 79.63916402996817
- task:
type: Classification
dataset:
type: mteb/banking77
name: MTEB Banking77Classification
config: default
split: test
revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
metrics:
- type: accuracy
value: 78.50324675324674
- type: f1
value: 77.34014983227601
- task:
type: Clustering
dataset:
type: mteb/biorxiv-clustering-p2p
name: MTEB BiorxivClusteringP2P
config: default
split: test
revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
metrics:
- type: v_measure
value: 39.3047565513338
- task:
type: Clustering
dataset:
type: mteb/biorxiv-clustering-s2s
name: MTEB BiorxivClusteringS2S
config: default
split: test
revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
metrics:
- type: v_measure
value: 35.114800929695775
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackAndroidRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 31.757
- type: map_at_10
value: 43.443
- type: map_at_100
value: 44.972
- type: map_at_1000
value: 45.092999999999996
- type: map_at_3
value: 39.566
- type: map_at_5
value: 41.628
- type: mrr_at_1
value: 39.485
- type: mrr_at_10
value: 49.597
- type: mrr_at_100
value: 50.275999999999996
- type: mrr_at_1000
value: 50.312999999999995
- type: mrr_at_3
value: 46.876
- type: mrr_at_5
value: 48.35
- type: ndcg_at_1
value: 39.485
- type: ndcg_at_10
value: 50.11600000000001
- type: ndcg_at_100
value: 55.469
- type: ndcg_at_1000
value: 57.253
- type: ndcg_at_3
value: 44.695
- type: ndcg_at_5
value: 46.963
- type: precision_at_1
value: 39.485
- type: precision_at_10
value: 9.8
- type: precision_at_100
value: 1.5789999999999997
- type: precision_at_1000
value: 0.20400000000000001
- type: precision_at_3
value: 21.793000000000003
- type: precision_at_5
value: 15.651000000000002
- type: recall_at_1
value: 31.757
- type: recall_at_10
value: 62.861
- type: recall_at_100
value: 85.09
- type: recall_at_1000
value: 96.54
- type: recall_at_3
value: 46.981
- type: recall_at_5
value: 53.488
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackEnglishRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 24.616
- type: map_at_10
value: 33.999
- type: map_at_100
value: 35.299
- type: map_at_1000
value: 35.44
- type: map_at_3
value: 31.283
- type: map_at_5
value: 32.71
- type: mrr_at_1
value: 30.701
- type: mrr_at_10
value: 39.115
- type: mrr_at_100
value: 39.912
- type: mrr_at_1000
value: 39.963
- type: mrr_at_3
value: 36.975
- type: mrr_at_5
value: 38.118
- type: ndcg_at_1
value: 30.701
- type: ndcg_at_10
value: 39.454
- type: ndcg_at_100
value: 44.393
- type: ndcg_at_1000
value: 46.822
- type: ndcg_at_3
value: 35.317
- type: ndcg_at_5
value: 37.066
- type: precision_at_1
value: 30.701
- type: precision_at_10
value: 7.661999999999999
- type: precision_at_100
value: 1.308
- type: precision_at_1000
value: 0.185
- type: precision_at_3
value: 17.346
- type: precision_at_5
value: 12.203999999999999
- type: recall_at_1
value: 24.616
- type: recall_at_10
value: 49.681
- type: recall_at_100
value: 70.729
- type: recall_at_1000
value: 86.361
- type: recall_at_3
value: 37.677
- type: recall_at_5
value: 42.713
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackGamingRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 36.11
- type: map_at_10
value: 47.619
- type: map_at_100
value: 48.758
- type: map_at_1000
value: 48.818
- type: map_at_3
value: 44.354
- type: map_at_5
value: 46.192
- type: mrr_at_1
value: 41.379
- type: mrr_at_10
value: 51.075
- type: mrr_at_100
value: 51.807
- type: mrr_at_1000
value: 51.842
- type: mrr_at_3
value: 48.464
- type: mrr_at_5
value: 49.944
- type: ndcg_at_1
value: 41.379
- type: ndcg_at_10
value: 53.510999999999996
- type: ndcg_at_100
value: 57.981
- type: ndcg_at_1000
value: 59.245999999999995
- type: ndcg_at_3
value: 47.915
- type: ndcg_at_5
value: 50.586
- type: precision_at_1
value: 41.379
- type: precision_at_10
value: 8.770999999999999
- type: precision_at_100
value: 1.193
- type: precision_at_1000
value: 0.134
- type: precision_at_3
value: 21.587999999999997
- type: precision_at_5
value: 14.934
- type: recall_at_1
value: 36.11
- type: recall_at_10
value: 67.539
- type: recall_at_100
value: 86.803
- type: recall_at_1000
value: 95.889
- type: recall_at_3
value: 52.312999999999995
- type: recall_at_5
value: 58.967999999999996
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackGisRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 16.831
- type: map_at_10
value: 24.314
- type: map_at_100
value: 25.374999999999996
- type: map_at_1000
value: 25.474000000000004
- type: map_at_3
value: 21.884
- type: map_at_5
value: 23.203
- type: mrr_at_1
value: 18.079
- type: mrr_at_10
value: 25.741000000000003
- type: mrr_at_100
value: 26.728
- type: mrr_at_1000
value: 26.808
- type: mrr_at_3
value: 23.39
- type: mrr_at_5
value: 24.684
- type: ndcg_at_1
value: 18.079
- type: ndcg_at_10
value: 28.738000000000003
- type: ndcg_at_100
value: 34.408
- type: ndcg_at_1000
value: 37.129
- type: ndcg_at_3
value: 23.921999999999997
- type: ndcg_at_5
value: 26.151000000000003
- type: precision_at_1
value: 18.079
- type: precision_at_10
value: 4.768
- type: precision_at_100
value: 0.8089999999999999
- type: precision_at_1000
value: 0.109
- type: precision_at_3
value: 10.508000000000001
- type: precision_at_5
value: 7.661
- type: recall_at_1
value: 16.831
- type: recall_at_10
value: 40.967
- type: recall_at_100
value: 68.059
- type: recall_at_1000
value: 88.836
- type: recall_at_3
value: 27.927999999999997
- type: recall_at_5
value: 33.201
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackMathematicaRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 8.937000000000001
- type: map_at_10
value: 15.146
- type: map_at_100
value: 16.29
- type: map_at_1000
value: 16.441
- type: map_at_3
value: 13.014999999999999
- type: map_at_5
value: 14.088999999999999
- type: mrr_at_1
value: 11.193999999999999
- type: mrr_at_10
value: 18.199
- type: mrr_at_100
value: 19.278000000000002
- type: mrr_at_1000
value: 19.378
- type: mrr_at_3
value: 15.878999999999998
- type: mrr_at_5
value: 17.141000000000002
- type: ndcg_at_1
value: 11.193999999999999
- type: ndcg_at_10
value: 19.286
- type: ndcg_at_100
value: 25.291999999999998
- type: ndcg_at_1000
value: 29.012999999999998
- type: ndcg_at_3
value: 15.129999999999999
- type: ndcg_at_5
value: 16.926
- type: precision_at_1
value: 11.193999999999999
- type: precision_at_10
value: 3.918
- type: precision_at_100
value: 0.803
- type: precision_at_1000
value: 0.128
- type: precision_at_3
value: 7.587000000000001
- type: precision_at_5
value: 5.8709999999999996
- type: recall_at_1
value: 8.937000000000001
- type: recall_at_10
value: 28.89
- type: recall_at_100
value: 56.12200000000001
- type: recall_at_1000
value: 82.749
- type: recall_at_3
value: 17.748
- type: recall_at_5
value: 22.042
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackPhysicsRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 19.559
- type: map_at_10
value: 28.77
- type: map_at_100
value: 30.144
- type: map_at_1000
value: 30.270999999999997
- type: map_at_3
value: 25.456
- type: map_at_5
value: 27.351999999999997
- type: mrr_at_1
value: 24.062
- type: mrr_at_10
value: 33.409
- type: mrr_at_100
value: 34.369
- type: mrr_at_1000
value: 34.434
- type: mrr_at_3
value: 30.574
- type: mrr_at_5
value: 32.287
- type: ndcg_at_1
value: 24.062
- type: ndcg_at_10
value: 34.537
- type: ndcg_at_100
value: 40.542
- type: ndcg_at_1000
value: 43.208999999999996
- type: ndcg_at_3
value: 29.032000000000004
- type: ndcg_at_5
value: 31.838
- type: precision_at_1
value: 24.062
- type: precision_at_10
value: 6.814000000000001
- type: precision_at_100
value: 1.167
- type: precision_at_1000
value: 0.161
- type: precision_at_3
value: 14.244000000000002
- type: precision_at_5
value: 10.837
- type: recall_at_1
value: 19.559
- type: recall_at_10
value: 47.175
- type: recall_at_100
value: 73.11
- type: recall_at_1000
value: 91.144
- type: recall_at_3
value: 31.895
- type: recall_at_5
value: 38.978
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackProgrammersRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 18.828
- type: map_at_10
value: 27.664
- type: map_at_100
value: 29.099999999999998
- type: map_at_1000
value: 29.220000000000002
- type: map_at_3
value: 24.779
- type: map_at_5
value: 26.227
- type: mrr_at_1
value: 23.744
- type: mrr_at_10
value: 32.11
- type: mrr_at_100
value: 33.152
- type: mrr_at_1000
value: 33.215
- type: mrr_at_3
value: 29.604000000000003
- type: mrr_at_5
value: 30.894
- type: ndcg_at_1
value: 23.744
- type: ndcg_at_10
value: 33.047
- type: ndcg_at_100
value: 39.354
- type: ndcg_at_1000
value: 41.967999999999996
- type: ndcg_at_3
value: 28.133999999999997
- type: ndcg_at_5
value: 30.097
- type: precision_at_1
value: 23.744
- type: precision_at_10
value: 6.381
- type: precision_at_100
value: 1.135
- type: precision_at_1000
value: 0.155
- type: precision_at_3
value: 13.699
- type: precision_at_5
value: 9.932
- type: recall_at_1
value: 18.828
- type: recall_at_10
value: 44.777
- type: recall_at_100
value: 72.02499999999999
- type: recall_at_1000
value: 89.883
- type: recall_at_3
value: 30.881999999999998
- type: recall_at_5
value: 36.15
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 19.89466666666667
- type: map_at_10
value: 28.13191666666667
- type: map_at_100
value: 29.374083333333335
- type: map_at_1000
value: 29.501999999999995
- type: map_at_3
value: 25.450666666666667
- type: map_at_5
value: 26.862083333333338
- type: mrr_at_1
value: 23.87775
- type: mrr_at_10
value: 31.796833333333336
- type: mrr_at_100
value: 32.70425
- type: mrr_at_1000
value: 32.774
- type: mrr_at_3
value: 29.411000000000005
- type: mrr_at_5
value: 30.71525
- type: ndcg_at_1
value: 23.87775
- type: ndcg_at_10
value: 33.14725
- type: ndcg_at_100
value: 38.63300000000001
- type: ndcg_at_1000
value: 41.29166666666668
- type: ndcg_at_3
value: 28.504250000000003
- type: ndcg_at_5
value: 30.546250000000004
- type: precision_at_1
value: 23.87775
- type: precision_at_10
value: 6.143166666666667
- type: precision_at_100
value: 1.0658333333333332
- type: precision_at_1000
value: 0.1495
- type: precision_at_3
value: 13.468083333333333
- type: precision_at_5
value: 9.763416666666664
- type: recall_at_1
value: 19.89466666666667
- type: recall_at_10
value: 44.33358333333333
- type: recall_at_100
value: 68.79966666666667
- type: recall_at_1000
value: 87.5325
- type: recall_at_3
value: 31.34816666666667
- type: recall_at_5
value: 36.612833333333334
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackStatsRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 11.779
- type: map_at_10
value: 16.581000000000003
- type: map_at_100
value: 17.374000000000002
- type: map_at_1000
value: 17.48
- type: map_at_3
value: 14.777000000000001
- type: map_at_5
value: 15.654000000000002
- type: mrr_at_1
value: 13.497
- type: mrr_at_10
value: 18.192
- type: mrr_at_100
value: 18.929000000000002
- type: mrr_at_1000
value: 19.014
- type: mrr_at_3
value: 16.488
- type: mrr_at_5
value: 17.285
- type: ndcg_at_1
value: 13.497
- type: ndcg_at_10
value: 19.676
- type: ndcg_at_100
value: 24.081
- type: ndcg_at_1000
value: 27.012000000000004
- type: ndcg_at_3
value: 16.179
- type: ndcg_at_5
value: 17.573
- type: precision_at_1
value: 13.497
- type: precision_at_10
value: 3.512
- type: precision_at_100
value: 0.632
- type: precision_at_1000
value: 0.095
- type: precision_at_3
value: 7.362
- type: precision_at_5
value: 5.367999999999999
- type: recall_at_1
value: 11.779
- type: recall_at_10
value: 27.613
- type: recall_at_100
value: 48.829
- type: recall_at_1000
value: 71.025
- type: recall_at_3
value: 17.815
- type: recall_at_5
value: 21.279999999999998
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackTexRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 11.181000000000001
- type: map_at_10
value: 16.724
- type: map_at_100
value: 17.806
- type: map_at_1000
value: 17.946
- type: map_at_3
value: 14.718
- type: map_at_5
value: 15.848
- type: mrr_at_1
value: 13.971
- type: mrr_at_10
value: 19.716
- type: mrr_at_100
value: 20.71
- type: mrr_at_1000
value: 20.804000000000002
- type: mrr_at_3
value: 17.727999999999998
- type: mrr_at_5
value: 18.862000000000002
- type: ndcg_at_1
value: 13.971
- type: ndcg_at_10
value: 20.531
- type: ndcg_at_100
value: 25.901000000000003
- type: ndcg_at_1000
value: 29.317999999999998
- type: ndcg_at_3
value: 16.828000000000003
- type: ndcg_at_5
value: 18.576
- type: precision_at_1
value: 13.971
- type: precision_at_10
value: 4.04
- type: precision_at_100
value: 0.803
- type: precision_at_1000
value: 0.129
- type: precision_at_3
value: 8.305
- type: precision_at_5
value: 6.29
- type: recall_at_1
value: 11.181000000000001
- type: recall_at_10
value: 29.042
- type: recall_at_100
value: 53.342
- type: recall_at_1000
value: 78.117
- type: recall_at_3
value: 18.804000000000002
- type: recall_at_5
value: 23.22
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackUnixRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 23.046
- type: map_at_10
value: 30.702
- type: map_at_100
value: 31.961000000000002
- type: map_at_1000
value: 32.077
- type: map_at_3
value: 28.083000000000002
- type: map_at_5
value: 29.391000000000002
- type: mrr_at_1
value: 27.239
- type: mrr_at_10
value: 34.472
- type: mrr_at_100
value: 35.485
- type: mrr_at_1000
value: 35.558
- type: mrr_at_3
value: 32.245000000000005
- type: mrr_at_5
value: 33.42
- type: ndcg_at_1
value: 27.239
- type: ndcg_at_10
value: 35.453
- type: ndcg_at_100
value: 41.347
- type: ndcg_at_1000
value: 43.986
- type: ndcg_at_3
value: 30.768
- type: ndcg_at_5
value: 32.694
- type: precision_at_1
value: 27.239
- type: precision_at_10
value: 6.138
- type: precision_at_100
value: 1.014
- type: precision_at_1000
value: 0.136
- type: precision_at_3
value: 13.775
- type: precision_at_5
value: 9.776
- type: recall_at_1
value: 23.046
- type: recall_at_10
value: 46.178999999999995
- type: recall_at_100
value: 72.366
- type: recall_at_1000
value: 90.713
- type: recall_at_3
value: 33.214
- type: recall_at_5
value: 38.186
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackWebmastersRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 22.006999999999998
- type: map_at_10
value: 30.791
- type: map_at_100
value: 32.495000000000005
- type: map_at_1000
value: 32.731
- type: map_at_3
value: 27.738000000000003
- type: map_at_5
value: 29.115000000000002
- type: mrr_at_1
value: 27.47
- type: mrr_at_10
value: 36.355
- type: mrr_at_100
value: 37.207
- type: mrr_at_1000
value: 37.262
- type: mrr_at_3
value: 33.267
- type: mrr_at_5
value: 34.918
- type: ndcg_at_1
value: 27.47
- type: ndcg_at_10
value: 37.314
- type: ndcg_at_100
value: 43.228
- type: ndcg_at_1000
value: 45.789
- type: ndcg_at_3
value: 32.178000000000004
- type: ndcg_at_5
value: 34.082
- type: precision_at_1
value: 27.47
- type: precision_at_10
value: 7.5889999999999995
- type: precision_at_100
value: 1.587
- type: precision_at_1000
value: 0.245
- type: precision_at_3
value: 15.613
- type: precision_at_5
value: 11.501999999999999
- type: recall_at_1
value: 22.006999999999998
- type: recall_at_10
value: 49.811
- type: recall_at_100
value: 76.175
- type: recall_at_1000
value: 92.432
- type: recall_at_3
value: 34.445
- type: recall_at_5
value: 39.834
- task:
type: Retrieval
dataset:
type: BeIR/cqadupstack
name: MTEB CQADupstackWordpressRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 14.085
- type: map_at_10
value: 21.83
- type: map_at_100
value: 22.915
- type: map_at_1000
value: 23.033
- type: map_at_3
value: 19.755
- type: map_at_5
value: 20.936
- type: mrr_at_1
value: 15.712000000000002
- type: mrr_at_10
value: 23.581
- type: mrr_at_100
value: 24.598
- type: mrr_at_1000
value: 24.697
- type: mrr_at_3
value: 21.442
- type: mrr_at_5
value: 22.68
- type: ndcg_at_1
value: 15.712000000000002
- type: ndcg_at_10
value: 26.104
- type: ndcg_at_100
value: 31.6
- type: ndcg_at_1000
value: 34.755
- type: ndcg_at_3
value: 21.953
- type: ndcg_at_5
value: 24.003
- type: precision_at_1
value: 15.712000000000002
- type: precision_at_10
value: 4.324999999999999
- type: precision_at_100
value: 0.76
- type: precision_at_1000
value: 0.11299999999999999
- type: precision_at_3
value: 9.797
- type: precision_at_5
value: 7.135
- type: recall_at_1
value: 14.085
- type: recall_at_10
value: 37.468
- type: recall_at_100
value: 62.946000000000005
- type: recall_at_1000
value: 86.701
- type: recall_at_3
value: 26.476
- type: recall_at_5
value: 31.294
- task:
type: Retrieval
dataset:
type: climate-fever
name: MTEB ClimateFEVER
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 8.305
- type: map_at_10
value: 14.971
- type: map_at_100
value: 16.634999999999998
- type: map_at_1000
value: 16.842
- type: map_at_3
value: 12.281
- type: map_at_5
value: 13.608
- type: mrr_at_1
value: 18.958
- type: mrr_at_10
value: 29.104000000000003
- type: mrr_at_100
value: 30.198000000000004
- type: mrr_at_1000
value: 30.264999999999997
- type: mrr_at_3
value: 25.548
- type: mrr_at_5
value: 27.805999999999997
- type: ndcg_at_1
value: 18.958
- type: ndcg_at_10
value: 21.84
- type: ndcg_at_100
value: 28.871999999999996
- type: ndcg_at_1000
value: 32.868
- type: ndcg_at_3
value: 16.991
- type: ndcg_at_5
value: 18.859
- type: precision_at_1
value: 18.958
- type: precision_at_10
value: 7.002999999999999
- type: precision_at_100
value: 1.4409999999999998
- type: precision_at_1000
value: 0.218
- type: precision_at_3
value: 12.681999999999999
- type: precision_at_5
value: 10.176
- type: recall_at_1
value: 8.305
- type: recall_at_10
value: 27.492
- type: recall_at_100
value: 52.053000000000004
- type: recall_at_1000
value: 74.52600000000001
- type: recall_at_3
value: 15.931999999999999
- type: recall_at_5
value: 20.71
- task:
type: Retrieval
dataset:
type: dbpedia-entity
name: MTEB DBPedia
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 7.928
- type: map_at_10
value: 17.128
- type: map_at_100
value: 23.657
- type: map_at_1000
value: 25.28
- type: map_at_3
value: 12.623999999999999
- type: map_at_5
value: 14.536999999999999
- type: mrr_at_1
value: 60.25
- type: mrr_at_10
value: 70.391
- type: mrr_at_100
value: 70.87
- type: mrr_at_1000
value: 70.879
- type: mrr_at_3
value: 69.125
- type: mrr_at_5
value: 69.85
- type: ndcg_at_1
value: 49.75
- type: ndcg_at_10
value: 37.473
- type: ndcg_at_100
value: 41.569
- type: ndcg_at_1000
value: 49.318
- type: ndcg_at_3
value: 42.791000000000004
- type: ndcg_at_5
value: 39.568999999999996
- type: precision_at_1
value: 60.25
- type: precision_at_10
value: 29.4
- type: precision_at_100
value: 9.468
- type: precision_at_1000
value: 2.077
- type: precision_at_3
value: 46.417
- type: precision_at_5
value: 37.95
- type: recall_at_1
value: 7.928
- type: recall_at_10
value: 22.603
- type: recall_at_100
value: 47.193000000000005
- type: recall_at_1000
value: 71.346
- type: recall_at_3
value: 14.472
- type: recall_at_5
value: 17.485999999999997
- task:
type: Classification
dataset:
type: mteb/emotion
name: MTEB EmotionClassification
config: default
split: test
revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
metrics:
- type: accuracy
value: 46.37
- type: f1
value: 40.27549527082307
- task:
type: Retrieval
dataset:
type: fever
name: MTEB FEVER
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 40.849999999999994
- type: map_at_10
value: 54.54
- type: map_at_100
value: 55.143
- type: map_at_1000
value: 55.16799999999999
- type: map_at_3
value: 51.318
- type: map_at_5
value: 53.403999999999996
- type: mrr_at_1
value: 43.984
- type: mrr_at_10
value: 58.07600000000001
- type: mrr_at_100
value: 58.605
- type: mrr_at_1000
value: 58.620000000000005
- type: mrr_at_3
value: 54.918
- type: mrr_at_5
value: 56.974999999999994
- type: ndcg_at_1
value: 43.984
- type: ndcg_at_10
value: 61.768
- type: ndcg_at_100
value: 64.42099999999999
- type: ndcg_at_1000
value: 64.97800000000001
- type: ndcg_at_3
value: 55.533
- type: ndcg_at_5
value: 59.14
- type: precision_at_1
value: 43.984
- type: precision_at_10
value: 8.822000000000001
- type: precision_at_100
value: 1.0250000000000001
- type: precision_at_1000
value: 0.109
- type: precision_at_3
value: 23.172
- type: precision_at_5
value: 15.857
- type: recall_at_1
value: 40.849999999999994
- type: recall_at_10
value: 80.663
- type: recall_at_100
value: 92.29899999999999
- type: recall_at_1000
value: 96.233
- type: recall_at_3
value: 64.031
- type: recall_at_5
value: 72.764
- task:
type: Retrieval
dataset:
type: fiqa
name: MTEB FiQA2018
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 18.852
- type: map_at_10
value: 31.392999999999997
- type: map_at_100
value: 33.324999999999996
- type: map_at_1000
value: 33.5
- type: map_at_3
value: 27.249000000000002
- type: map_at_5
value: 29.401
- type: mrr_at_1
value: 38.272
- type: mrr_at_10
value: 47.076
- type: mrr_at_100
value: 47.902
- type: mrr_at_1000
value: 47.942
- type: mrr_at_3
value: 44.624
- type: mrr_at_5
value: 46.098
- type: ndcg_at_1
value: 38.272
- type: ndcg_at_10
value: 39.214
- type: ndcg_at_100
value: 46.341
- type: ndcg_at_1000
value: 49.282
- type: ndcg_at_3
value: 35.757
- type: ndcg_at_5
value: 36.669000000000004
- type: precision_at_1
value: 38.272
- type: precision_at_10
value: 11.219
- type: precision_at_100
value: 1.8599999999999999
- type: precision_at_1000
value: 0.23800000000000002
- type: precision_at_3
value: 24.331
- type: precision_at_5
value: 17.87
- type: recall_at_1
value: 18.852
- type: recall_at_10
value: 46.078
- type: recall_at_100
value: 72.898
- type: recall_at_1000
value: 90.644
- type: recall_at_3
value: 32.221
- type: recall_at_5
value: 37.894
- task:
type: Retrieval
dataset:
type: hotpotqa
name: MTEB HotpotQA
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 32.714
- type: map_at_10
value: 46.743
- type: map_at_100
value: 47.64
- type: map_at_1000
value: 47.717999999999996
- type: map_at_3
value: 43.872
- type: map_at_5
value: 45.629
- type: mrr_at_1
value: 65.429
- type: mrr_at_10
value: 72.507
- type: mrr_at_100
value: 72.80799999999999
- type: mrr_at_1000
value: 72.82600000000001
- type: mrr_at_3
value: 70.98100000000001
- type: mrr_at_5
value: 71.967
- type: ndcg_at_1
value: 65.429
- type: ndcg_at_10
value: 55.84
- type: ndcg_at_100
value: 59.183
- type: ndcg_at_1000
value: 60.81100000000001
- type: ndcg_at_3
value: 51.327
- type: ndcg_at_5
value: 53.803
- type: precision_at_1
value: 65.429
- type: precision_at_10
value: 11.620999999999999
- type: precision_at_100
value: 1.425
- type: precision_at_1000
value: 0.164
- type: precision_at_3
value: 32.077
- type: precision_at_5
value: 21.199
- type: recall_at_1
value: 32.714
- type: recall_at_10
value: 58.103
- type: recall_at_100
value: 71.269
- type: recall_at_1000
value: 82.073
- type: recall_at_3
value: 48.116
- type: recall_at_5
value: 52.998
- task:
type: Classification
dataset:
type: mteb/imdb
name: MTEB ImdbClassification
config: default
split: test
revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
metrics:
- type: accuracy
value: 88.5384
- type: ap
value: 84.07244605493386
- type: f1
value: 88.51724847689141
- task:
type: Retrieval
dataset:
type: msmarco
name: MTEB MSMARCO
config: default
split: dev
revision: None
metrics:
- type: map_at_1
value: 17.169999999999998
- type: map_at_10
value: 28.601
- type: map_at_100
value: 29.869
- type: map_at_1000
value: 29.929
- type: map_at_3
value: 24.69
- type: map_at_5
value: 26.929
- type: mrr_at_1
value: 17.622
- type: mrr_at_10
value: 29.079
- type: mrr_at_100
value: 30.301000000000002
- type: mrr_at_1000
value: 30.354
- type: mrr_at_3
value: 25.232
- type: mrr_at_5
value: 27.458
- type: ndcg_at_1
value: 17.622
- type: ndcg_at_10
value: 35.357
- type: ndcg_at_100
value: 41.623
- type: ndcg_at_1000
value: 43.119
- type: ndcg_at_3
value: 27.344
- type: ndcg_at_5
value: 31.367
- type: precision_at_1
value: 17.622
- type: precision_at_10
value: 5.891
- type: precision_at_100
value: 0.9039999999999999
- type: precision_at_1000
value: 0.10300000000000001
- type: precision_at_3
value: 11.91
- type: precision_at_5
value: 9.189
- type: recall_at_1
value: 17.169999999999998
- type: recall_at_10
value: 56.369
- type: recall_at_100
value: 85.649
- type: recall_at_1000
value: 97.096
- type: recall_at_3
value: 34.499
- type: recall_at_5
value: 44.194
- task:
type: Classification
dataset:
type: mteb/mtop_domain
name: MTEB MTOPDomainClassification (en)
config: en
split: test
revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
metrics:
- type: accuracy
value: 90.4810761513908
- type: f1
value: 90.43983880684412
- task:
type: Classification
dataset:
type: mteb/mtop_intent
name: MTEB MTOPIntentClassification (en)
config: en
split: test
revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
metrics:
- type: accuracy
value: 59.824441404468764
- type: f1
value: 41.140870725364245
- task:
type: Classification
dataset:
type: mteb/amazon_massive_intent
name: MTEB MassiveIntentClassification (en)
config: en
split: test
revision: 31efe3c427b0bae9c22cbb560b8f15491cc6bed7
metrics:
- type: accuracy
value: 67.23940820443846
- type: f1
value: 63.866444501622254
- task:
type: Classification
dataset:
type: mteb/amazon_massive_scenario
name: MTEB MassiveScenarioClassification (en)
config: en
split: test
revision: 7d571f92784cd94a019292a1f45445077d0ef634
metrics:
- type: accuracy
value: 72.98251513113652
- type: f1
value: 72.26944666028224
- task:
type: Clustering
dataset:
type: mteb/medrxiv-clustering-p2p
name: MTEB MedrxivClusteringP2P
config: default
split: test
revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
metrics:
- type: v_measure
value: 34.7972586123168
- task:
type: Clustering
dataset:
type: mteb/medrxiv-clustering-s2s
name: MTEB MedrxivClusteringS2S
config: default
split: test
revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
metrics:
- type: v_measure
value: 32.77986542120405
- task:
type: Reranking
dataset:
type: mteb/mind_small
name: MTEB MindSmallReranking
config: default
split: test
revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
metrics:
- type: map
value: 28.827020967264875
- type: mrr
value: 29.491954633310463
- task:
type: Retrieval
dataset:
type: nfcorpus
name: MTEB NFCorpus
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 5.099
- type: map_at_10
value: 11.205
- type: map_at_100
value: 14.533999999999999
- type: map_at_1000
value: 16.012999999999998
- type: map_at_3
value: 8.074
- type: map_at_5
value: 9.515
- type: mrr_at_1
value: 43.034
- type: mrr_at_10
value: 50.903
- type: mrr_at_100
value: 51.62
- type: mrr_at_1000
value: 51.661
- type: mrr_at_3
value: 48.71
- type: mrr_at_5
value: 49.886
- type: ndcg_at_1
value: 39.938
- type: ndcg_at_10
value: 31.572
- type: ndcg_at_100
value: 29.652
- type: ndcg_at_1000
value: 38.971000000000004
- type: ndcg_at_3
value: 36.758
- type: ndcg_at_5
value: 34.481
- type: precision_at_1
value: 42.105
- type: precision_at_10
value: 24.056
- type: precision_at_100
value: 7.666
- type: precision_at_1000
value: 2.11
- type: precision_at_3
value: 35.088
- type: precision_at_5
value: 30.402
- type: recall_at_1
value: 5.099
- type: recall_at_10
value: 14.780999999999999
- type: recall_at_100
value: 31.653
- type: recall_at_1000
value: 63.724000000000004
- type: recall_at_3
value: 8.933
- type: recall_at_5
value: 11.413
- task:
type: Retrieval
dataset:
type: nq
name: MTEB NQ
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 25.232
- type: map_at_10
value: 39.704
- type: map_at_100
value: 40.93
- type: map_at_1000
value: 40.963
- type: map_at_3
value: 34.882999999999996
- type: map_at_5
value: 37.597
- type: mrr_at_1
value: 28.853
- type: mrr_at_10
value: 42.218
- type: mrr_at_100
value: 43.179
- type: mrr_at_1000
value: 43.202
- type: mrr_at_3
value: 38.157000000000004
- type: mrr_at_5
value: 40.483000000000004
- type: ndcg_at_1
value: 28.823999999999998
- type: ndcg_at_10
value: 47.729
- type: ndcg_at_100
value: 52.898999999999994
- type: ndcg_at_1000
value: 53.686
- type: ndcg_at_3
value: 38.548
- type: ndcg_at_5
value: 43.119
- type: precision_at_1
value: 28.823999999999998
- type: precision_at_10
value: 8.34
- type: precision_at_100
value: 1.1199999999999999
- type: precision_at_1000
value: 0.11900000000000001
- type: precision_at_3
value: 17.922
- type: precision_at_5
value: 13.331000000000001
- type: recall_at_1
value: 25.232
- type: recall_at_10
value: 69.95
- type: recall_at_100
value: 92.333
- type: recall_at_1000
value: 98.218
- type: recall_at_3
value: 45.946999999999996
- type: recall_at_5
value: 56.598000000000006
- task:
type: Retrieval
dataset:
type: quora
name: MTEB QuoraRetrieval
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 70.083
- type: map_at_10
value: 84.16
- type: map_at_100
value: 84.807
- type: map_at_1000
value: 84.822
- type: map_at_3
value: 81.181
- type: map_at_5
value: 83.094
- type: mrr_at_1
value: 80.83
- type: mrr_at_10
value: 87.173
- type: mrr_at_100
value: 87.28399999999999
- type: mrr_at_1000
value: 87.285
- type: mrr_at_3
value: 86.21
- type: mrr_at_5
value: 86.886
- type: ndcg_at_1
value: 80.85
- type: ndcg_at_10
value: 87.96199999999999
- type: ndcg_at_100
value: 89.225
- type: ndcg_at_1000
value: 89.32900000000001
- type: ndcg_at_3
value: 85.101
- type: ndcg_at_5
value: 86.74
- type: precision_at_1
value: 80.85
- type: precision_at_10
value: 13.378
- type: precision_at_100
value: 1.5310000000000001
- type: precision_at_1000
value: 0.157
- type: precision_at_3
value: 37.269999999999996
- type: precision_at_5
value: 24.568
- type: recall_at_1
value: 70.083
- type: recall_at_10
value: 95.194
- type: recall_at_100
value: 99.51100000000001
- type: recall_at_1000
value: 99.991
- type: recall_at_3
value: 87.027
- type: recall_at_5
value: 91.604
- task:
type: Clustering
dataset:
type: mteb/reddit-clustering
name: MTEB RedditClustering
config: default
split: test
revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
metrics:
- type: v_measure
value: 49.23995527989351
- task:
type: Clustering
dataset:
type: mteb/reddit-clustering-p2p
name: MTEB RedditClusteringP2P
config: default
split: test
revision: 282350215ef01743dc01b456c7f5241fa8937f16
metrics:
- type: v_measure
value: 58.81838285815132
- task:
type: Retrieval
dataset:
type: scidocs
name: MTEB SCIDOCS
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 4.463
- type: map_at_10
value: 11.387
- type: map_at_100
value: 13.621
- type: map_at_1000
value: 13.982
- type: map_at_3
value: 8.022
- type: map_at_5
value: 9.464
- type: mrr_at_1
value: 22
- type: mrr_at_10
value: 32.902
- type: mrr_at_100
value: 34.036
- type: mrr_at_1000
value: 34.093
- type: mrr_at_3
value: 29.317
- type: mrr_at_5
value: 31.141999999999996
- type: ndcg_at_1
value: 22
- type: ndcg_at_10
value: 19.483
- type: ndcg_at_100
value: 28.118
- type: ndcg_at_1000
value: 34.355999999999995
- type: ndcg_at_3
value: 18.032999999999998
- type: ndcg_at_5
value: 15.613
- type: precision_at_1
value: 22
- type: precision_at_10
value: 10.35
- type: precision_at_100
value: 2.282
- type: precision_at_1000
value: 0.378
- type: precision_at_3
value: 16.967
- type: precision_at_5
value: 13.719999999999999
- type: recall_at_1
value: 4.463
- type: recall_at_10
value: 20.963
- type: recall_at_100
value: 46.322
- type: recall_at_1000
value: 76.713
- type: recall_at_3
value: 10.308
- type: recall_at_5
value: 13.888
- task:
type: STS
dataset:
type: mteb/sickr-sts
name: MTEB SICK-R
config: default
split: test
revision: a6ea5a8cab320b040a23452cc28066d9beae2cee
metrics:
- type: cos_sim_pearson
value: 84.84563850617418
- type: cos_sim_spearman
value: 79.68400149970968
- type: euclidean_pearson
value: 82.75837054306935
- type: euclidean_spearman
value: 79.6840247099308
- type: manhattan_pearson
value: 82.73540970661433
- type: manhattan_spearman
value: 79.66844192381396
- task:
type: STS
dataset:
type: mteb/sts12-sts
name: MTEB STS12
config: default
split: test
revision: a0d554a64d88156834ff5ae9920b964011b16384
metrics:
- type: cos_sim_pearson
value: 77.81430060207765
- type: cos_sim_spearman
value: 69.94012785669503
- type: euclidean_pearson
value: 74.59541033717807
- type: euclidean_spearman
value: 69.94010426360558
- type: manhattan_pearson
value: 74.56400760328428
- type: manhattan_spearman
value: 69.92806341709132
- task:
type: STS
dataset:
type: mteb/sts13-sts
name: MTEB STS13
config: default
split: test
revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
metrics:
- type: cos_sim_pearson
value: 74.81511131302516
- type: cos_sim_spearman
value: 79.62625737683277
- type: euclidean_pearson
value: 77.45706601071352
- type: euclidean_spearman
value: 79.62625730605384
- type: manhattan_pearson
value: 77.3334919461798
- type: manhattan_spearman
value: 79.46650568750321
- task:
type: STS
dataset:
type: mteb/sts14-sts
name: MTEB STS14
config: default
split: test
revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
metrics:
- type: cos_sim_pearson
value: 73.43273002333167
- type: cos_sim_spearman
value: 71.34169412319034
- type: euclidean_pearson
value: 73.58628382548541
- type: euclidean_spearman
value: 71.3417253984979
- type: manhattan_pearson
value: 73.528660458135
- type: manhattan_spearman
value: 71.29492315680972
- task:
type: STS
dataset:
type: mteb/sts15-sts
name: MTEB STS15
config: default
split: test
revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
metrics:
- type: cos_sim_pearson
value: 79.7528032458892
- type: cos_sim_spearman
value: 82.80881645241301
- type: euclidean_pearson
value: 81.49065539033161
- type: euclidean_spearman
value: 82.80881911292607
- type: manhattan_pearson
value: 81.48964007971324
- type: manhattan_spearman
value: 82.82325035979333
- task:
type: STS
dataset:
type: mteb/sts16-sts
name: MTEB STS16
config: default
split: test
revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
metrics:
- type: cos_sim_pearson
value: 77.46090733936299
- type: cos_sim_spearman
value: 82.65342321085096
- type: euclidean_pearson
value: 81.6531230438912
- type: euclidean_spearman
value: 82.65342321085096
- type: manhattan_pearson
value: 81.6092667285348
- type: manhattan_spearman
value: 82.63811888178375
- task:
type: STS
dataset:
type: mteb/sts17-crosslingual-sts
name: MTEB STS17 (en-en)
config: en-en
split: test
revision: af5e6fb845001ecf41f4c1e033ce921939a2a68d
metrics:
- type: cos_sim_pearson
value: 88.36545028139912
- type: cos_sim_spearman
value: 88.8877047117119
- type: euclidean_pearson
value: 89.26155338214109
- type: euclidean_spearman
value: 88.8877047117119
- type: manhattan_pearson
value: 89.18322803188939
- type: manhattan_spearman
value: 88.74063459127103
- task:
type: STS
dataset:
type: mteb/sts22-crosslingual-sts
name: MTEB STS22 (en)
config: en
split: test
revision: 6d1ba47164174a496b7fa5d3569dae26a6813b80
metrics:
- type: cos_sim_pearson
value: 68.11778566972097
- type: cos_sim_spearman
value: 68.4773054255333
- type: euclidean_pearson
value: 69.06680343994812
- type: euclidean_spearman
value: 68.4773054255333
- type: manhattan_pearson
value: 68.866622017307
- type: manhattan_spearman
value: 68.15156375349754
- task:
type: STS
dataset:
type: mteb/stsbenchmark-sts
name: MTEB STSBenchmark
config: default
split: test
revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
metrics:
- type: cos_sim_pearson
value: 84.64200346870874
- type: cos_sim_spearman
value: 86.5043271353841
- type: euclidean_pearson
value: 86.36114472174944
- type: euclidean_spearman
value: 86.50433264867542
- type: manhattan_pearson
value: 86.29057032602698
- type: manhattan_spearman
value: 86.45171993846006
- task:
type: Reranking
dataset:
type: mteb/scidocs-reranking
name: MTEB SciDocsRR
config: default
split: test
revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
metrics:
- type: map
value: 85.9286721127671
- type: mrr
value: 95.76535029966404
- task:
type: Retrieval
dataset:
type: scifact
name: MTEB SciFact
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 53.067
- type: map_at_10
value: 63.580000000000005
- type: map_at_100
value: 64.238
- type: map_at_1000
value: 64.265
- type: map_at_3
value: 60.402
- type: map_at_5
value: 62.456999999999994
- type: mrr_at_1
value: 55.667
- type: mrr_at_10
value: 64.566
- type: mrr_at_100
value: 65.054
- type: mrr_at_1000
value: 65.08
- type: mrr_at_3
value: 61.944
- type: mrr_at_5
value: 63.761
- type: ndcg_at_1
value: 55.667
- type: ndcg_at_10
value: 68.354
- type: ndcg_at_100
value: 70.94
- type: ndcg_at_1000
value: 71.759
- type: ndcg_at_3
value: 62.814
- type: ndcg_at_5
value: 66.084
- type: precision_at_1
value: 55.667
- type: precision_at_10
value: 9.232999999999999
- type: precision_at_100
value: 1.06
- type: precision_at_1000
value: 0.11299999999999999
- type: precision_at_3
value: 24.444
- type: precision_at_5
value: 16.667
- type: recall_at_1
value: 53.067
- type: recall_at_10
value: 81.89999999999999
- type: recall_at_100
value: 93
- type: recall_at_1000
value: 99.667
- type: recall_at_3
value: 67.589
- type: recall_at_5
value: 75.506
- task:
type: PairClassification
dataset:
type: mteb/sprintduplicatequestions-pairclassification
name: MTEB SprintDuplicateQuestions
config: default
split: test
revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
metrics:
- type: cos_sim_accuracy
value: 99.61287128712871
- type: cos_sim_ap
value: 88.21320824985605
- type: cos_sim_f1
value: 80.15451472718492
- type: cos_sim_precision
value: 77.49766573295986
- type: cos_sim_recall
value: 83
- type: dot_accuracy
value: 99.61287128712871
- type: dot_ap
value: 88.21329368452164
- type: dot_f1
value: 80.15451472718492
- type: dot_precision
value: 77.49766573295986
- type: dot_recall
value: 83
- type: euclidean_accuracy
value: 99.61287128712871
- type: euclidean_ap
value: 88.21328696557586
- type: euclidean_f1
value: 80.15451472718492
- type: euclidean_precision
value: 77.49766573295986
- type: euclidean_recall
value: 83
- type: manhattan_accuracy
value: 99.61287128712871
- type: manhattan_ap
value: 88.26324850748259
- type: manhattan_f1
value: 80.36839554047503
- type: manhattan_precision
value: 77.9868297271872
- type: manhattan_recall
value: 82.89999999999999
- type: max_accuracy
value: 99.61287128712871
- type: max_ap
value: 88.26324850748259
- type: max_f1
value: 80.36839554047503
- task:
type: Clustering
dataset:
type: mteb/stackexchange-clustering
name: MTEB StackExchangeClustering
config: default
split: test
revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
metrics:
- type: v_measure
value: 58.88814718001269
- task:
type: Clustering
dataset:
type: mteb/stackexchange-clustering-p2p
name: MTEB StackExchangeClusteringP2P
config: default
split: test
revision: 815ca46b2622cec33ccafc3735d572c266efdb44
metrics:
- type: v_measure
value: 33.6023610692526
- task:
type: Reranking
dataset:
type: mteb/stackoverflowdupquestions-reranking
name: MTEB StackOverflowDupQuestions
config: default
split: test
revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
metrics:
- type: map
value: 46.52388882316049
- type: mrr
value: 46.98781406501995
- task:
type: Summarization
dataset:
type: mteb/summeval
name: MTEB SummEval
config: default
split: test
revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
metrics:
- type: cos_sim_pearson
value: 27.06710433803873
- type: cos_sim_spearman
value: 30.251609255580625
- type: dot_pearson
value: 27.0671067449827
- type: dot_spearman
value: 30.251609255580625
- task:
type: Retrieval
dataset:
type: trec-covid
name: MTEB TRECCOVID
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 0.16999999999999998
- type: map_at_10
value: 1.204
- type: map_at_100
value: 6.800000000000001
- type: map_at_1000
value: 16.753999999999998
- type: map_at_3
value: 0.441
- type: map_at_5
value: 0.692
- type: mrr_at_1
value: 64
- type: mrr_at_10
value: 75.5
- type: mrr_at_100
value: 75.667
- type: mrr_at_1000
value: 75.667
- type: mrr_at_3
value: 72.333
- type: mrr_at_5
value: 74.63300000000001
- type: ndcg_at_1
value: 60
- type: ndcg_at_10
value: 55.074
- type: ndcg_at_100
value: 43.342999999999996
- type: ndcg_at_1000
value: 40.217999999999996
- type: ndcg_at_3
value: 56.754000000000005
- type: ndcg_at_5
value: 56.267999999999994
- type: precision_at_1
value: 64
- type: precision_at_10
value: 57.8
- type: precision_at_100
value: 44.34
- type: precision_at_1000
value: 17.791999999999998
- type: precision_at_3
value: 59.333000000000006
- type: precision_at_5
value: 59.199999999999996
- type: recall_at_1
value: 0.16999999999999998
- type: recall_at_10
value: 1.522
- type: recall_at_100
value: 10.52
- type: recall_at_1000
value: 38.324999999999996
- type: recall_at_3
value: 0.48
- type: recall_at_5
value: 0.792
- task:
type: Retrieval
dataset:
type: webis-touche2020
name: MTEB Touche2020
config: default
split: test
revision: None
metrics:
- type: map_at_1
value: 1.078
- type: map_at_10
value: 5.463
- type: map_at_100
value: 9.914000000000001
- type: map_at_1000
value: 11.285
- type: map_at_3
value: 2.467
- type: map_at_5
value: 3.277
- type: mrr_at_1
value: 12.245000000000001
- type: mrr_at_10
value: 26.708
- type: mrr_at_100
value: 28.303
- type: mrr_at_1000
value: 28.321
- type: mrr_at_3
value: 23.128999999999998
- type: mrr_at_5
value: 24.558
- type: ndcg_at_1
value: 11.224
- type: ndcg_at_10
value: 15.221000000000002
- type: ndcg_at_100
value: 26.346999999999998
- type: ndcg_at_1000
value: 37.969
- type: ndcg_at_3
value: 13.318
- type: ndcg_at_5
value: 12.576
- type: precision_at_1
value: 12.245000000000001
- type: precision_at_10
value: 15.101999999999999
- type: precision_at_100
value: 5.9799999999999995
- type: precision_at_1000
value: 1.367
- type: precision_at_3
value: 14.966
- type: precision_at_5
value: 13.469000000000001
- type: recall_at_1
value: 1.078
- type: recall_at_10
value: 11.157
- type: recall_at_100
value: 38.190000000000005
- type: recall_at_1000
value: 73.831
- type: recall_at_3
value: 3.598
- type: recall_at_5
value: 5.122999999999999
- task:
type: Classification
dataset:
type: mteb/toxic_conversations_50k
name: MTEB ToxicConversationsClassification
config: default
split: test
revision: d7c0de2777da35d6aae2200a62c6e0e5af397c4c
metrics:
- type: accuracy
value: 71.1582
- type: ap
value: 14.92669801560963
- type: f1
value: 55.12856312799308
- task:
type: Classification
dataset:
type: mteb/tweet_sentiment_extraction
name: MTEB TweetSentimentExtractionClassification
config: default
split: test
revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
metrics:
- type: accuracy
value: 58.88511601584606
- type: f1
value: 58.85264576560652
- task:
type: Clustering
dataset:
type: mteb/twentynewsgroups-clustering
name: MTEB TwentyNewsgroupsClustering
config: default
split: test
revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
metrics:
- type: v_measure
value: 46.12909899358978
- task:
type: PairClassification
dataset:
type: mteb/twittersemeval2015-pairclassification
name: MTEB TwitterSemEval2015
config: default
split: test
revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
metrics:
- type: cos_sim_accuracy
value: 83.26876080348096
- type: cos_sim_ap
value: 64.7970240303098
- type: cos_sim_f1
value: 60.64945026847354
- type: cos_sim_precision
value: 58.82936507936508
- type: cos_sim_recall
value: 62.58575197889182
- type: dot_accuracy
value: 83.26876080348096
- type: dot_ap
value: 64.7970187478589
- type: dot_f1
value: 60.64945026847354
- type: dot_precision
value: 58.82936507936508
- type: dot_recall
value: 62.58575197889182
- type: euclidean_accuracy
value: 83.26876080348096
- type: euclidean_ap
value: 64.7970350594888
- type: euclidean_f1
value: 60.64945026847354
- type: euclidean_precision
value: 58.82936507936508
- type: euclidean_recall
value: 62.58575197889182
- type: manhattan_accuracy
value: 83.22703701496096
- type: manhattan_ap
value: 64.77489173378227
- type: manhattan_f1
value: 60.60833646263612
- type: manhattan_precision
value: 57.65658490116694
- type: manhattan_recall
value: 63.87862796833773
- type: max_accuracy
value: 83.26876080348096
- type: max_ap
value: 64.7970350594888
- type: max_f1
value: 60.64945026847354
- task:
type: PairClassification
dataset:
type: mteb/twitterurlcorpus-pairclassification
name: MTEB TwitterURLCorpus
config: default
split: test
revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
metrics:
- type: cos_sim_accuracy
value: 86.43613924787519
- type: cos_sim_ap
value: 80.48760161140632
- type: cos_sim_f1
value: 73.17976287962401
- type: cos_sim_precision
value: 68.0641102059739
- type: cos_sim_recall
value: 79.12688635663689
- type: dot_accuracy
value: 86.43613924787519
- type: dot_ap
value: 80.487599095952
- type: dot_f1
value: 73.17976287962401
- type: dot_precision
value: 68.0641102059739
- type: dot_recall
value: 79.12688635663689
- type: euclidean_accuracy
value: 86.43613924787519
- type: euclidean_ap
value: 80.48760636334994
- type: euclidean_f1
value: 73.17976287962401
- type: euclidean_precision
value: 68.0641102059739
- type: euclidean_recall
value: 79.12688635663689
- type: manhattan_accuracy
value: 86.41673458299375
- type: manhattan_ap
value: 80.47462765492928
- type: manhattan_f1
value: 73.16093396936981
- type: manhattan_precision
value: 68.48183710468005
- type: manhattan_recall
value: 78.5263319987681
- type: max_accuracy
value: 86.43613924787519
- type: max_ap
value: 80.48760636334994
- type: max_f1
value: 73.17976287962401