rodrigomasini committed on
Commit
38d0600
1 Parent(s): f8805de

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -120
app.py CHANGED
@@ -280,23 +280,14 @@ EXTERNAL_MODELS = [
280
  "all-mpnet-base-v2",
281
  "allenai-specter",
282
  "Baichuan-text-embedding",
283
- "bert-base-swedish-cased",
284
  "bert-base-uncased",
285
- "bge-base-zh-v1.5",
286
- "bge-large-zh-v1.5",
287
- "bge-large-zh-noinstruct",
288
- "bge-small-zh-v1.5",
289
  "contriever-base-msmarco",
290
- "cross-en-de-roberta-sentence-transformer",
291
  "dfm-encoder-large-v1",
292
  "dfm-sentence-encoder-large-1",
293
  "distiluse-base-multilingual-cased-v2",
294
- "DanskBERT",
295
  "e5-base",
296
  "e5-large",
297
  "e5-small",
298
- "electra-small-nordic",
299
- "electra-small-swedish-cased-discriminator",
300
  "gbert-base",
301
  "gbert-large",
302
  "gelectra-base",
@@ -324,29 +315,14 @@ EXTERNAL_MODELS = [
324
  "norbert3-large",
325
  "paraphrase-multilingual-MiniLM-L12-v2",
326
  "paraphrase-multilingual-mpnet-base-v2",
327
- "sentence-bert-swedish-cased",
328
  "sentence-t5-base",
329
  "sentence-t5-large",
330
  "sentence-t5-xl",
331
  "sentence-t5-xxl",
332
  "sup-simcse-bert-base-uncased",
333
- "st-polish-paraphrase-from-distilroberta",
334
- "st-polish-paraphrase-from-mpnet",
335
- "text2vec-base-chinese",
336
- "text2vec-large-chinese",
337
  "text-embedding-3-small",
338
  "text-embedding-3-large",
339
  "text-embedding-3-large-256",
340
- "text-embedding-ada-002",
341
- "text-similarity-ada-001",
342
- "text-similarity-babbage-001",
343
- "text-similarity-curie-001",
344
- "text-similarity-davinci-001",
345
- "text-search-ada-doc-001",
346
- "text-search-ada-001",
347
- "text-search-babbage-001",
348
- "text-search-curie-001",
349
- "text-search-davinci-001",
350
  "titan-embed-text-v1",
351
  "unsup-simcse-bert-base-uncased",
352
  "use-cmlm-multilingual",
@@ -362,24 +338,14 @@ EXTERNAL_MODEL_TO_LINK = {
362
  "all-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2",
363
  "all-MiniLM-L6-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2",
364
  "all-mpnet-base-v2": "https://huggingface.co/sentence-transformers/all-mpnet-base-v2",
365
- "Baichuan-text-embedding": "https://platform.baichuan-ai.com/docs/text-Embedding",
366
- "bert-base-swedish-cased": "https://huggingface.co/KB/bert-base-swedish-cased",
367
  "bert-base-uncased": "https://huggingface.co/bert-base-uncased",
368
- "bge-base-zh-v1.5": "https://huggingface.co/BAAI/bge-base-zh-v1.5",
369
- "bge-large-zh-v1.5": "https://huggingface.co/BAAI/bge-large-zh-v1.5",
370
- "bge-large-zh-noinstruct": "https://huggingface.co/BAAI/bge-large-zh-noinstruct",
371
- "bge-small-zh-v1.5": "https://huggingface.co/BAAI/bge-small-zh-v1.5",
372
  "contriever-base-msmarco": "https://huggingface.co/nthakur/contriever-base-msmarco",
373
- "cross-en-de-roberta-sentence-transformer": "https://huggingface.co/T-Systems-onsite/cross-en-de-roberta-sentence-transformer",
374
- "DanskBERT": "https://huggingface.co/vesteinn/DanskBERT",
375
  "distiluse-base-multilingual-cased-v2": "https://huggingface.co/sentence-transformers/distiluse-base-multilingual-cased-v2",
376
  "dfm-encoder-large-v1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
377
  "dfm-sentence-encoder-large-1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
378
  "e5-base": "https://huggingface.co/intfloat/e5-base",
379
  "e5-large": "https://huggingface.co/intfloat/e5-large",
380
  "e5-small": "https://huggingface.co/intfloat/e5-small",
381
- "electra-small-nordic": "https://huggingface.co/jonfd/electra-small-nordic",
382
- "electra-small-swedish-cased-discriminator": "https://huggingface.co/KBLab/electra-small-swedish-cased-discriminator",
383
  "gbert-base": "https://huggingface.co/deepset/gbert-base",
384
  "gbert-large": "https://huggingface.co/deepset/gbert-large",
385
  "gelectra-base": "https://huggingface.co/deepset/gelectra-base",
@@ -407,30 +373,14 @@ EXTERNAL_MODEL_TO_LINK = {
407
  "norbert3-large": "https://huggingface.co/ltg/norbert3-large",
408
  "paraphrase-multilingual-mpnet-base-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2",
409
  "paraphrase-multilingual-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2",
410
- "sentence-bert-swedish-cased": "https://huggingface.co/KBLab/sentence-bert-swedish-cased",
411
  "sentence-t5-base": "https://huggingface.co/sentence-transformers/sentence-t5-base",
412
  "sentence-t5-large": "https://huggingface.co/sentence-transformers/sentence-t5-large",
413
  "sentence-t5-xl": "https://huggingface.co/sentence-transformers/sentence-t5-xl",
414
  "sentence-t5-xxl": "https://huggingface.co/sentence-transformers/sentence-t5-xxl",
415
  "sup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased",
416
- "st-polish-paraphrase-from-distilroberta": "https://huggingface.co/sdadas/st-polish-paraphrase-from-distilroberta",
417
- "st-polish-paraphrase-from-mpnet": "https://huggingface.co/sdadas/st-polish-paraphrase-from-mpnet",
418
- "text2vec-base-chinese": "https://huggingface.co/shibing624/text2vec-base-chinese",
419
- "text2vec-large-chinese": "https://huggingface.co/GanymedeNil/text2vec-large-chinese",
420
  "text-embedding-3-small": "https://openai.com/blog/new-embedding-models-and-api-updates",
421
  "text-embedding-3-large": "https://openai.com/blog/new-embedding-models-and-api-updates",
422
  "text-embedding-3-large-256": "https://openai.com/blog/new-embedding-models-and-api-updates",
423
- "text-embedding-ada-002": "https://openai.com/blog/new-and-improved-embedding-model",
424
- "text-similarity-ada-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
425
- "text-similarity-babbage-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
426
- "text-similarity-curie-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
427
- "text-similarity-davinci-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
428
- "text-search-ada-doc-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
429
- "text-search-ada-query-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
430
- "text-search-ada-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
431
- "text-search-curie-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
432
- "text-search-babbage-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
433
- "text-search-davinci-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
434
  "titan-embed-text-v1": "https://docs.aws.amazon.com/bedrock/latest/userguide/embeddings.html",
435
  "unsup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/unsup-simcse-bert-base-uncased",
436
  "use-cmlm-multilingual": "https://huggingface.co/sentence-transformers/use-cmlm-multilingual",
@@ -445,24 +395,14 @@ EXTERNAL_MODEL_TO_DIM = {
445
  "all-MiniLM-L6-v2": 384,
446
  "all-mpnet-base-v2": 768,
447
  "allenai-specter": 768,
448
- "Baichuan-text-embedding": 1024,
449
- "bert-base-swedish-cased": 768,
450
  "bert-base-uncased": 768,
451
- "bge-base-zh-v1.5": 768,
452
- "bge-large-zh-v1.5": 1024,
453
- "bge-large-zh-noinstruct": 1024,
454
- "bge-small-zh-v1.5": 512,
455
  "contriever-base-msmarco": 768,
456
- "cross-en-de-roberta-sentence-transformer": 768,
457
- "DanskBERT": 768,
458
  "distiluse-base-multilingual-cased-v2": 512,
459
  "dfm-encoder-large-v1": 1024,
460
  "dfm-sentence-encoder-large-1": 1024,
461
  "e5-base": 768,
462
  "e5-small": 384,
463
  "e5-large": 1024,
464
- "electra-small-nordic": 256,
465
- "electra-small-swedish-cased-discriminator": 256,
466
  "luotuo-bert-medium": 768,
467
  "LASER2": 1024,
468
  "LaBSE": 768,
@@ -490,30 +430,14 @@ EXTERNAL_MODEL_TO_DIM = {
490
  "norbert3-large": 1024,
491
  "paraphrase-multilingual-MiniLM-L12-v2": 384,
492
  "paraphrase-multilingual-mpnet-base-v2": 768,
493
- "sentence-bert-swedish-cased": 768,
494
  "sentence-t5-base": 768,
495
  "sentence-t5-large": 768,
496
  "sentence-t5-xl": 768,
497
  "sentence-t5-xxl": 768,
498
  "sup-simcse-bert-base-uncased": 768,
499
- "st-polish-paraphrase-from-distilroberta": 768,
500
- "st-polish-paraphrase-from-mpnet": 768,
501
- "text2vec-base-chinese": 768,
502
- "text2vec-large-chinese": 1024,
503
  "text-embedding-3-large": 3072,
504
  "text-embedding-3-large-256": 256,
505
  "text-embedding-3-small": 1536,
506
- "text-embedding-ada-002": 1536,
507
- "text-similarity-ada-001": 1024,
508
- "text-similarity-babbage-001": 2048,
509
- "text-similarity-curie-001": 4096,
510
- "text-similarity-davinci-001": 12288,
511
- "text-search-ada-doc-001": 1024,
512
- "text-search-ada-query-001": 1024,
513
- "text-search-ada-001": 1024,
514
- "text-search-babbage-001": 2048,
515
- "text-search-curie-001": 4096,
516
- "text-search-davinci-001": 12288,
517
  "titan-embed-text-v1": 1536,
518
  "unsup-simcse-bert-base-uncased": 768,
519
  "use-cmlm-multilingual": 768,
@@ -528,24 +452,14 @@ EXTERNAL_MODEL_TO_SEQLEN = {
528
  "all-MiniLM-L6-v2": 512,
529
  "all-mpnet-base-v2": 514,
530
  "allenai-specter": 512,
531
- "Baichuan-text-embedding": 512,
532
- "bert-base-swedish-cased": 512,
533
- "bert-base-uncased": 512,
534
- "bge-base-zh-v1.5": 512,
535
- "bge-large-zh-v1.5": 512,
536
- "bge-large-zh-noinstruct": 512,
537
- "bge-small-zh-v1.5": 512,
538
- "contriever-base-msmarco": 512,
539
- "cross-en-de-roberta-sentence-transformer": 514,
540
- "DanskBERT": 514,
541
  "dfm-encoder-large-v1": 512,
542
  "dfm-sentence-encoder-large-1": 512,
543
  "distiluse-base-multilingual-cased-v2": 512,
544
  "e5-base": 512,
545
  "e5-large": 512,
546
  "e5-small": 512,
547
- "electra-small-nordic": 512,
548
- "electra-small-swedish-cased-discriminator": 512,
549
  "gbert-base": 512,
550
  "gbert-large": 512,
551
  "gelectra-base": 512,
@@ -573,30 +487,14 @@ EXTERNAL_MODEL_TO_SEQLEN = {
573
  "norbert3-large": 512,
574
  "paraphrase-multilingual-MiniLM-L12-v2": 512,
575
  "paraphrase-multilingual-mpnet-base-v2": 514,
576
- "sentence-bert-swedish-cased": 512,
577
  "sentence-t5-base": 512,
578
  "sentence-t5-large": 512,
579
  "sentence-t5-xl": 512,
580
  "sentence-t5-xxl": 512,
581
  "sup-simcse-bert-base-uncased": 512,
582
- "st-polish-paraphrase-from-distilroberta": 514,
583
- "st-polish-paraphrase-from-mpnet": 514,
584
- "text2vec-base-chinese": 512,
585
- "text2vec-large-chinese": 512,
586
  "text-embedding-3-large": 8191,
587
  "text-embedding-3-large-256": 8191,
588
  "text-embedding-3-small": 8191,
589
- "text-embedding-ada-002": 8191,
590
- "text-similarity-ada-001": 2046,
591
- "text-similarity-babbage-001": 2046,
592
- "text-similarity-curie-001": 2046,
593
- "text-similarity-davinci-001": 2046,
594
- "text-search-ada-doc-001": 2046,
595
- "text-search-ada-query-001": 2046,
596
- "text-search-ada-001": 2046,
597
- "text-search-babbage-001": 2046,
598
- "text-search-curie-001": 2046,
599
- "text-search-davinci-001": 2046,
600
  "titan-embed-text-v1": 8000,
601
  "use-cmlm-multilingual": 512,
602
  "unsup-simcse-bert-base-uncased": 512,
@@ -611,23 +509,14 @@ EXTERNAL_MODEL_TO_SIZE = {
611
  "all-MiniLM-L12-v2": 0.13,
612
  "all-MiniLM-L6-v2": 0.09,
613
  "all-mpnet-base-v2": 0.44,
614
- "bert-base-uncased": 0.44,
615
- "bert-base-swedish-cased": 0.50,
616
- "bge-base-zh-v1.5": 0.41,
617
- "bge-large-zh-v1.5": 1.30,
618
- "bge-large-zh-noinstruct": 1.30,
619
- "bge-small-zh-v1.5": 0.10,
620
- "cross-en-de-roberta-sentence-transformer": 1.11,
621
  "contriever-base-msmarco": 0.44,
622
- "DanskBERT": 0.50,
623
  "distiluse-base-multilingual-cased-v2": 0.54,
624
  "dfm-encoder-large-v1": 1.42,
625
  "dfm-sentence-encoder-large-1": 1.63,
626
  "e5-base": 0.44,
627
  "e5-small": 0.13,
628
  "e5-large": 1.34,
629
- "electra-small-nordic": 0.09,
630
- "electra-small-swedish-cased-discriminator": 0.06,
631
  "gbert-base": 0.44,
632
  "gbert-large": 1.35,
633
  "gelectra-base": 0.44,
@@ -655,16 +544,11 @@ EXTERNAL_MODEL_TO_SIZE = {
655
  "norbert3-large": 1.47,
656
  "paraphrase-multilingual-mpnet-base-v2": 1.11,
657
  "paraphrase-multilingual-MiniLM-L12-v2": 0.47,
658
- "sentence-bert-swedish-cased": 0.50,
659
  "sentence-t5-base": 0.22,
660
  "sentence-t5-large": 0.67,
661
  "sentence-t5-xl": 2.48,
662
  "sentence-t5-xxl": 9.73,
663
- "sup-simcse-bert-base-uncased": 0.44,
664
- "st-polish-paraphrase-from-distilroberta": 0.50,
665
- "st-polish-paraphrase-from-mpnet": 0.50,
666
- "text2vec-base-chinese": 0.41,
667
- "text2vec-large-chinese": 1.30,
668
  "unsup-simcse-bert-base-uncased": 0.44,
669
  "use-cmlm-multilingual": 1.89,
670
  "xlm-roberta-base": 1.12,
 
280
  "all-mpnet-base-v2",
281
  "allenai-specter",
282
  "Baichuan-text-embedding",
 
283
  "bert-base-uncased",
 
 
 
 
284
  "contriever-base-msmarco",
 
285
  "dfm-encoder-large-v1",
286
  "dfm-sentence-encoder-large-1",
287
  "distiluse-base-multilingual-cased-v2",
 
288
  "e5-base",
289
  "e5-large",
290
  "e5-small",
 
 
291
  "gbert-base",
292
  "gbert-large",
293
  "gelectra-base",
 
315
  "norbert3-large",
316
  "paraphrase-multilingual-MiniLM-L12-v2",
317
  "paraphrase-multilingual-mpnet-base-v2",
 
318
  "sentence-t5-base",
319
  "sentence-t5-large",
320
  "sentence-t5-xl",
321
  "sentence-t5-xxl",
322
  "sup-simcse-bert-base-uncased",
 
 
 
 
323
  "text-embedding-3-small",
324
  "text-embedding-3-large",
325
  "text-embedding-3-large-256",
 
 
 
 
 
 
 
 
 
 
326
  "titan-embed-text-v1",
327
  "unsup-simcse-bert-base-uncased",
328
  "use-cmlm-multilingual",
 
338
  "all-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2",
339
  "all-MiniLM-L6-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2",
340
  "all-mpnet-base-v2": "https://huggingface.co/sentence-transformers/all-mpnet-base-v2",
 
 
341
  "bert-base-uncased": "https://huggingface.co/bert-base-uncased",
 
 
 
 
342
  "contriever-base-msmarco": "https://huggingface.co/nthakur/contriever-base-msmarco",
 
 
343
  "distiluse-base-multilingual-cased-v2": "https://huggingface.co/sentence-transformers/distiluse-base-multilingual-cased-v2",
344
  "dfm-encoder-large-v1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
345
  "dfm-sentence-encoder-large-1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
346
  "e5-base": "https://huggingface.co/intfloat/e5-base",
347
  "e5-large": "https://huggingface.co/intfloat/e5-large",
348
  "e5-small": "https://huggingface.co/intfloat/e5-small",
 
 
349
  "gbert-base": "https://huggingface.co/deepset/gbert-base",
350
  "gbert-large": "https://huggingface.co/deepset/gbert-large",
351
  "gelectra-base": "https://huggingface.co/deepset/gelectra-base",
 
373
  "norbert3-large": "https://huggingface.co/ltg/norbert3-large",
374
  "paraphrase-multilingual-mpnet-base-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2",
375
  "paraphrase-multilingual-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2",
 
376
  "sentence-t5-base": "https://huggingface.co/sentence-transformers/sentence-t5-base",
377
  "sentence-t5-large": "https://huggingface.co/sentence-transformers/sentence-t5-large",
378
  "sentence-t5-xl": "https://huggingface.co/sentence-transformers/sentence-t5-xl",
379
  "sentence-t5-xxl": "https://huggingface.co/sentence-transformers/sentence-t5-xxl",
380
  "sup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased",
 
 
 
 
381
  "text-embedding-3-small": "https://openai.com/blog/new-embedding-models-and-api-updates",
382
  "text-embedding-3-large": "https://openai.com/blog/new-embedding-models-and-api-updates",
383
  "text-embedding-3-large-256": "https://openai.com/blog/new-embedding-models-and-api-updates",
 
 
 
 
 
 
 
 
 
 
 
384
  "titan-embed-text-v1": "https://docs.aws.amazon.com/bedrock/latest/userguide/embeddings.html",
385
  "unsup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/unsup-simcse-bert-base-uncased",
386
  "use-cmlm-multilingual": "https://huggingface.co/sentence-transformers/use-cmlm-multilingual",
 
395
  "all-MiniLM-L6-v2": 384,
396
  "all-mpnet-base-v2": 768,
397
  "allenai-specter": 768,
 
 
398
  "bert-base-uncased": 768,
 
 
 
 
399
  "contriever-base-msmarco": 768,
 
 
400
  "distiluse-base-multilingual-cased-v2": 512,
401
  "dfm-encoder-large-v1": 1024,
402
  "dfm-sentence-encoder-large-1": 1024,
403
  "e5-base": 768,
404
  "e5-small": 384,
405
  "e5-large": 1024,
 
 
406
  "luotuo-bert-medium": 768,
407
  "LASER2": 1024,
408
  "LaBSE": 768,
 
430
  "norbert3-large": 1024,
431
  "paraphrase-multilingual-MiniLM-L12-v2": 384,
432
  "paraphrase-multilingual-mpnet-base-v2": 768,
 
433
  "sentence-t5-base": 768,
434
  "sentence-t5-large": 768,
435
  "sentence-t5-xl": 768,
436
  "sentence-t5-xxl": 768,
437
  "sup-simcse-bert-base-uncased": 768,
 
 
 
 
438
  "text-embedding-3-large": 3072,
439
  "text-embedding-3-large-256": 256,
440
  "text-embedding-3-small": 1536,
 
 
 
 
 
 
 
 
 
 
 
441
  "titan-embed-text-v1": 1536,
442
  "unsup-simcse-bert-base-uncased": 768,
443
  "use-cmlm-multilingual": 768,
 
452
  "all-MiniLM-L6-v2": 512,
453
  "all-mpnet-base-v2": 514,
454
  "allenai-specter": 512,
455
+ "bert-base-uncased": 512,
456
+ "contriever-base-msmarco": 512,
 
 
 
 
 
 
 
 
457
  "dfm-encoder-large-v1": 512,
458
  "dfm-sentence-encoder-large-1": 512,
459
  "distiluse-base-multilingual-cased-v2": 512,
460
  "e5-base": 512,
461
  "e5-large": 512,
462
  "e5-small": 512,
 
 
463
  "gbert-base": 512,
464
  "gbert-large": 512,
465
  "gelectra-base": 512,
 
487
  "norbert3-large": 512,
488
  "paraphrase-multilingual-MiniLM-L12-v2": 512,
489
  "paraphrase-multilingual-mpnet-base-v2": 514,
 
490
  "sentence-t5-base": 512,
491
  "sentence-t5-large": 512,
492
  "sentence-t5-xl": 512,
493
  "sentence-t5-xxl": 512,
494
  "sup-simcse-bert-base-uncased": 512,
 
 
 
 
495
  "text-embedding-3-large": 8191,
496
  "text-embedding-3-large-256": 8191,
497
  "text-embedding-3-small": 8191,
 
 
 
 
 
 
 
 
 
 
 
498
  "titan-embed-text-v1": 8000,
499
  "use-cmlm-multilingual": 512,
500
  "unsup-simcse-bert-base-uncased": 512,
 
509
  "all-MiniLM-L12-v2": 0.13,
510
  "all-MiniLM-L6-v2": 0.09,
511
  "all-mpnet-base-v2": 0.44,
512
+ "bert-base-uncased": 0.44,
 
 
 
 
 
 
513
  "contriever-base-msmarco": 0.44,
 
514
  "distiluse-base-multilingual-cased-v2": 0.54,
515
  "dfm-encoder-large-v1": 1.42,
516
  "dfm-sentence-encoder-large-1": 1.63,
517
  "e5-base": 0.44,
518
  "e5-small": 0.13,
519
  "e5-large": 1.34,
 
 
520
  "gbert-base": 0.44,
521
  "gbert-large": 1.35,
522
  "gelectra-base": 0.44,
 
544
  "norbert3-large": 1.47,
545
  "paraphrase-multilingual-mpnet-base-v2": 1.11,
546
  "paraphrase-multilingual-MiniLM-L12-v2": 0.47,
 
547
  "sentence-t5-base": 0.22,
548
  "sentence-t5-large": 0.67,
549
  "sentence-t5-xl": 2.48,
550
  "sentence-t5-xxl": 9.73,
551
+ "sup-simcse-bert-base-uncased": 0.44,
 
 
 
 
552
  "unsup-simcse-bert-base-uncased": 0.44,
553
  "use-cmlm-multilingual": 1.89,
554
  "xlm-roberta-base": 1.12,