Spaces:
Runtime error
Runtime error
Commit
•
38d0600
1
Parent(s):
f8805de
Update app.py
Browse files
app.py
CHANGED
@@ -280,23 +280,14 @@ EXTERNAL_MODELS = [
|
|
280 |
"all-mpnet-base-v2",
|
281 |
"allenai-specter",
|
282 |
"Baichuan-text-embedding",
|
283 |
-
"bert-base-swedish-cased",
|
284 |
"bert-base-uncased",
|
285 |
-
"bge-base-zh-v1.5",
|
286 |
-
"bge-large-zh-v1.5",
|
287 |
-
"bge-large-zh-noinstruct",
|
288 |
-
"bge-small-zh-v1.5",
|
289 |
"contriever-base-msmarco",
|
290 |
-
"cross-en-de-roberta-sentence-transformer",
|
291 |
"dfm-encoder-large-v1",
|
292 |
"dfm-sentence-encoder-large-1",
|
293 |
"distiluse-base-multilingual-cased-v2",
|
294 |
-
"DanskBERT",
|
295 |
"e5-base",
|
296 |
"e5-large",
|
297 |
"e5-small",
|
298 |
-
"electra-small-nordic",
|
299 |
-
"electra-small-swedish-cased-discriminator",
|
300 |
"gbert-base",
|
301 |
"gbert-large",
|
302 |
"gelectra-base",
|
@@ -324,29 +315,14 @@ EXTERNAL_MODELS = [
|
|
324 |
"norbert3-large",
|
325 |
"paraphrase-multilingual-MiniLM-L12-v2",
|
326 |
"paraphrase-multilingual-mpnet-base-v2",
|
327 |
-
"sentence-bert-swedish-cased",
|
328 |
"sentence-t5-base",
|
329 |
"sentence-t5-large",
|
330 |
"sentence-t5-xl",
|
331 |
"sentence-t5-xxl",
|
332 |
"sup-simcse-bert-base-uncased",
|
333 |
-
"st-polish-paraphrase-from-distilroberta",
|
334 |
-
"st-polish-paraphrase-from-mpnet",
|
335 |
-
"text2vec-base-chinese",
|
336 |
-
"text2vec-large-chinese",
|
337 |
"text-embedding-3-small",
|
338 |
"text-embedding-3-large",
|
339 |
"text-embedding-3-large-256",
|
340 |
-
"text-embedding-ada-002",
|
341 |
-
"text-similarity-ada-001",
|
342 |
-
"text-similarity-babbage-001",
|
343 |
-
"text-similarity-curie-001",
|
344 |
-
"text-similarity-davinci-001",
|
345 |
-
"text-search-ada-doc-001",
|
346 |
-
"text-search-ada-001",
|
347 |
-
"text-search-babbage-001",
|
348 |
-
"text-search-curie-001",
|
349 |
-
"text-search-davinci-001",
|
350 |
"titan-embed-text-v1",
|
351 |
"unsup-simcse-bert-base-uncased",
|
352 |
"use-cmlm-multilingual",
|
@@ -362,24 +338,14 @@ EXTERNAL_MODEL_TO_LINK = {
|
|
362 |
"all-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2",
|
363 |
"all-MiniLM-L6-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2",
|
364 |
"all-mpnet-base-v2": "https://huggingface.co/sentence-transformers/all-mpnet-base-v2",
|
365 |
-
"Baichuan-text-embedding": "https://platform.baichuan-ai.com/docs/text-Embedding",
|
366 |
-
"bert-base-swedish-cased": "https://huggingface.co/KB/bert-base-swedish-cased",
|
367 |
"bert-base-uncased": "https://huggingface.co/bert-base-uncased",
|
368 |
-
"bge-base-zh-v1.5": "https://huggingface.co/BAAI/bge-base-zh-v1.5",
|
369 |
-
"bge-large-zh-v1.5": "https://huggingface.co/BAAI/bge-large-zh-v1.5",
|
370 |
-
"bge-large-zh-noinstruct": "https://huggingface.co/BAAI/bge-large-zh-noinstruct",
|
371 |
-
"bge-small-zh-v1.5": "https://huggingface.co/BAAI/bge-small-zh-v1.5",
|
372 |
"contriever-base-msmarco": "https://huggingface.co/nthakur/contriever-base-msmarco",
|
373 |
-
"cross-en-de-roberta-sentence-transformer": "https://huggingface.co/T-Systems-onsite/cross-en-de-roberta-sentence-transformer",
|
374 |
-
"DanskBERT": "https://huggingface.co/vesteinn/DanskBERT",
|
375 |
"distiluse-base-multilingual-cased-v2": "https://huggingface.co/sentence-transformers/distiluse-base-multilingual-cased-v2",
|
376 |
"dfm-encoder-large-v1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
|
377 |
"dfm-sentence-encoder-large-1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
|
378 |
"e5-base": "https://huggingface.co/intfloat/e5-base",
|
379 |
"e5-large": "https://huggingface.co/intfloat/e5-large",
|
380 |
"e5-small": "https://huggingface.co/intfloat/e5-small",
|
381 |
-
"electra-small-nordic": "https://huggingface.co/jonfd/electra-small-nordic",
|
382 |
-
"electra-small-swedish-cased-discriminator": "https://huggingface.co/KBLab/electra-small-swedish-cased-discriminator",
|
383 |
"gbert-base": "https://huggingface.co/deepset/gbert-base",
|
384 |
"gbert-large": "https://huggingface.co/deepset/gbert-large",
|
385 |
"gelectra-base": "https://huggingface.co/deepset/gelectra-base",
|
@@ -407,30 +373,14 @@ EXTERNAL_MODEL_TO_LINK = {
|
|
407 |
"norbert3-large": "https://huggingface.co/ltg/norbert3-large",
|
408 |
"paraphrase-multilingual-mpnet-base-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2",
|
409 |
"paraphrase-multilingual-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2",
|
410 |
-
"sentence-bert-swedish-cased": "https://huggingface.co/KBLab/sentence-bert-swedish-cased",
|
411 |
"sentence-t5-base": "https://huggingface.co/sentence-transformers/sentence-t5-base",
|
412 |
"sentence-t5-large": "https://huggingface.co/sentence-transformers/sentence-t5-large",
|
413 |
"sentence-t5-xl": "https://huggingface.co/sentence-transformers/sentence-t5-xl",
|
414 |
"sentence-t5-xxl": "https://huggingface.co/sentence-transformers/sentence-t5-xxl",
|
415 |
"sup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased",
|
416 |
-
"st-polish-paraphrase-from-distilroberta": "https://huggingface.co/sdadas/st-polish-paraphrase-from-distilroberta",
|
417 |
-
"st-polish-paraphrase-from-mpnet": "https://huggingface.co/sdadas/st-polish-paraphrase-from-mpnet",
|
418 |
-
"text2vec-base-chinese": "https://huggingface.co/shibing624/text2vec-base-chinese",
|
419 |
-
"text2vec-large-chinese": "https://huggingface.co/GanymedeNil/text2vec-large-chinese",
|
420 |
"text-embedding-3-small": "https://openai.com/blog/new-embedding-models-and-api-updates",
|
421 |
"text-embedding-3-large": "https://openai.com/blog/new-embedding-models-and-api-updates",
|
422 |
"text-embedding-3-large-256": "https://openai.com/blog/new-embedding-models-and-api-updates",
|
423 |
-
"text-embedding-ada-002": "https://openai.com/blog/new-and-improved-embedding-model",
|
424 |
-
"text-similarity-ada-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
425 |
-
"text-similarity-babbage-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
426 |
-
"text-similarity-curie-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
427 |
-
"text-similarity-davinci-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
428 |
-
"text-search-ada-doc-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
429 |
-
"text-search-ada-query-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
430 |
-
"text-search-ada-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
431 |
-
"text-search-curie-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
432 |
-
"text-search-babbage-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
433 |
-
"text-search-davinci-001": "https://openai.com/blog/introducing-text-and-code-embeddings",
|
434 |
"titan-embed-text-v1": "https://docs.aws.amazon.com/bedrock/latest/userguide/embeddings.html",
|
435 |
"unsup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/unsup-simcse-bert-base-uncased",
|
436 |
"use-cmlm-multilingual": "https://huggingface.co/sentence-transformers/use-cmlm-multilingual",
|
@@ -445,24 +395,14 @@ EXTERNAL_MODEL_TO_DIM = {
|
|
445 |
"all-MiniLM-L6-v2": 384,
|
446 |
"all-mpnet-base-v2": 768,
|
447 |
"allenai-specter": 768,
|
448 |
-
"Baichuan-text-embedding": 1024,
|
449 |
-
"bert-base-swedish-cased": 768,
|
450 |
"bert-base-uncased": 768,
|
451 |
-
"bge-base-zh-v1.5": 768,
|
452 |
-
"bge-large-zh-v1.5": 1024,
|
453 |
-
"bge-large-zh-noinstruct": 1024,
|
454 |
-
"bge-small-zh-v1.5": 512,
|
455 |
"contriever-base-msmarco": 768,
|
456 |
-
"cross-en-de-roberta-sentence-transformer": 768,
|
457 |
-
"DanskBERT": 768,
|
458 |
"distiluse-base-multilingual-cased-v2": 512,
|
459 |
"dfm-encoder-large-v1": 1024,
|
460 |
"dfm-sentence-encoder-large-1": 1024,
|
461 |
"e5-base": 768,
|
462 |
"e5-small": 384,
|
463 |
"e5-large": 1024,
|
464 |
-
"electra-small-nordic": 256,
|
465 |
-
"electra-small-swedish-cased-discriminator": 256,
|
466 |
"luotuo-bert-medium": 768,
|
467 |
"LASER2": 1024,
|
468 |
"LaBSE": 768,
|
@@ -490,30 +430,14 @@ EXTERNAL_MODEL_TO_DIM = {
|
|
490 |
"norbert3-large": 1024,
|
491 |
"paraphrase-multilingual-MiniLM-L12-v2": 384,
|
492 |
"paraphrase-multilingual-mpnet-base-v2": 768,
|
493 |
-
"sentence-bert-swedish-cased": 768,
|
494 |
"sentence-t5-base": 768,
|
495 |
"sentence-t5-large": 768,
|
496 |
"sentence-t5-xl": 768,
|
497 |
"sentence-t5-xxl": 768,
|
498 |
"sup-simcse-bert-base-uncased": 768,
|
499 |
-
"st-polish-paraphrase-from-distilroberta": 768,
|
500 |
-
"st-polish-paraphrase-from-mpnet": 768,
|
501 |
-
"text2vec-base-chinese": 768,
|
502 |
-
"text2vec-large-chinese": 1024,
|
503 |
"text-embedding-3-large": 3072,
|
504 |
"text-embedding-3-large-256": 256,
|
505 |
"text-embedding-3-small": 1536,
|
506 |
-
"text-embedding-ada-002": 1536,
|
507 |
-
"text-similarity-ada-001": 1024,
|
508 |
-
"text-similarity-babbage-001": 2048,
|
509 |
-
"text-similarity-curie-001": 4096,
|
510 |
-
"text-similarity-davinci-001": 12288,
|
511 |
-
"text-search-ada-doc-001": 1024,
|
512 |
-
"text-search-ada-query-001": 1024,
|
513 |
-
"text-search-ada-001": 1024,
|
514 |
-
"text-search-babbage-001": 2048,
|
515 |
-
"text-search-curie-001": 4096,
|
516 |
-
"text-search-davinci-001": 12288,
|
517 |
"titan-embed-text-v1": 1536,
|
518 |
"unsup-simcse-bert-base-uncased": 768,
|
519 |
"use-cmlm-multilingual": 768,
|
@@ -528,24 +452,14 @@ EXTERNAL_MODEL_TO_SEQLEN = {
|
|
528 |
"all-MiniLM-L6-v2": 512,
|
529 |
"all-mpnet-base-v2": 514,
|
530 |
"allenai-specter": 512,
|
531 |
-
"
|
532 |
-
"
|
533 |
-
"bert-base-uncased": 512,
|
534 |
-
"bge-base-zh-v1.5": 512,
|
535 |
-
"bge-large-zh-v1.5": 512,
|
536 |
-
"bge-large-zh-noinstruct": 512,
|
537 |
-
"bge-small-zh-v1.5": 512,
|
538 |
-
"contriever-base-msmarco": 512,
|
539 |
-
"cross-en-de-roberta-sentence-transformer": 514,
|
540 |
-
"DanskBERT": 514,
|
541 |
"dfm-encoder-large-v1": 512,
|
542 |
"dfm-sentence-encoder-large-1": 512,
|
543 |
"distiluse-base-multilingual-cased-v2": 512,
|
544 |
"e5-base": 512,
|
545 |
"e5-large": 512,
|
546 |
"e5-small": 512,
|
547 |
-
"electra-small-nordic": 512,
|
548 |
-
"electra-small-swedish-cased-discriminator": 512,
|
549 |
"gbert-base": 512,
|
550 |
"gbert-large": 512,
|
551 |
"gelectra-base": 512,
|
@@ -573,30 +487,14 @@ EXTERNAL_MODEL_TO_SEQLEN = {
|
|
573 |
"norbert3-large": 512,
|
574 |
"paraphrase-multilingual-MiniLM-L12-v2": 512,
|
575 |
"paraphrase-multilingual-mpnet-base-v2": 514,
|
576 |
-
"sentence-bert-swedish-cased": 512,
|
577 |
"sentence-t5-base": 512,
|
578 |
"sentence-t5-large": 512,
|
579 |
"sentence-t5-xl": 512,
|
580 |
"sentence-t5-xxl": 512,
|
581 |
"sup-simcse-bert-base-uncased": 512,
|
582 |
-
"st-polish-paraphrase-from-distilroberta": 514,
|
583 |
-
"st-polish-paraphrase-from-mpnet": 514,
|
584 |
-
"text2vec-base-chinese": 512,
|
585 |
-
"text2vec-large-chinese": 512,
|
586 |
"text-embedding-3-large": 8191,
|
587 |
"text-embedding-3-large-256": 8191,
|
588 |
"text-embedding-3-small": 8191,
|
589 |
-
"text-embedding-ada-002": 8191,
|
590 |
-
"text-similarity-ada-001": 2046,
|
591 |
-
"text-similarity-babbage-001": 2046,
|
592 |
-
"text-similarity-curie-001": 2046,
|
593 |
-
"text-similarity-davinci-001": 2046,
|
594 |
-
"text-search-ada-doc-001": 2046,
|
595 |
-
"text-search-ada-query-001": 2046,
|
596 |
-
"text-search-ada-001": 2046,
|
597 |
-
"text-search-babbage-001": 2046,
|
598 |
-
"text-search-curie-001": 2046,
|
599 |
-
"text-search-davinci-001": 2046,
|
600 |
"titan-embed-text-v1": 8000,
|
601 |
"use-cmlm-multilingual": 512,
|
602 |
"unsup-simcse-bert-base-uncased": 512,
|
@@ -611,23 +509,14 @@ EXTERNAL_MODEL_TO_SIZE = {
|
|
611 |
"all-MiniLM-L12-v2": 0.13,
|
612 |
"all-MiniLM-L6-v2": 0.09,
|
613 |
"all-mpnet-base-v2": 0.44,
|
614 |
-
"bert-base-uncased": 0.44,
|
615 |
-
"bert-base-swedish-cased": 0.50,
|
616 |
-
"bge-base-zh-v1.5": 0.41,
|
617 |
-
"bge-large-zh-v1.5": 1.30,
|
618 |
-
"bge-large-zh-noinstruct": 1.30,
|
619 |
-
"bge-small-zh-v1.5": 0.10,
|
620 |
-
"cross-en-de-roberta-sentence-transformer": 1.11,
|
621 |
"contriever-base-msmarco": 0.44,
|
622 |
-
"DanskBERT": 0.50,
|
623 |
"distiluse-base-multilingual-cased-v2": 0.54,
|
624 |
"dfm-encoder-large-v1": 1.42,
|
625 |
"dfm-sentence-encoder-large-1": 1.63,
|
626 |
"e5-base": 0.44,
|
627 |
"e5-small": 0.13,
|
628 |
"e5-large": 1.34,
|
629 |
-
"electra-small-nordic": 0.09,
|
630 |
-
"electra-small-swedish-cased-discriminator": 0.06,
|
631 |
"gbert-base": 0.44,
|
632 |
"gbert-large": 1.35,
|
633 |
"gelectra-base": 0.44,
|
@@ -655,16 +544,11 @@ EXTERNAL_MODEL_TO_SIZE = {
|
|
655 |
"norbert3-large": 1.47,
|
656 |
"paraphrase-multilingual-mpnet-base-v2": 1.11,
|
657 |
"paraphrase-multilingual-MiniLM-L12-v2": 0.47,
|
658 |
-
"sentence-bert-swedish-cased": 0.50,
|
659 |
"sentence-t5-base": 0.22,
|
660 |
"sentence-t5-large": 0.67,
|
661 |
"sentence-t5-xl": 2.48,
|
662 |
"sentence-t5-xxl": 9.73,
|
663 |
-
"sup-simcse-bert-base-uncased": 0.44,
|
664 |
-
"st-polish-paraphrase-from-distilroberta": 0.50,
|
665 |
-
"st-polish-paraphrase-from-mpnet": 0.50,
|
666 |
-
"text2vec-base-chinese": 0.41,
|
667 |
-
"text2vec-large-chinese": 1.30,
|
668 |
"unsup-simcse-bert-base-uncased": 0.44,
|
669 |
"use-cmlm-multilingual": 1.89,
|
670 |
"xlm-roberta-base": 1.12,
|
|
|
280 |
"all-mpnet-base-v2",
|
281 |
"allenai-specter",
|
282 |
"Baichuan-text-embedding",
|
|
|
283 |
"bert-base-uncased",
|
|
|
|
|
|
|
|
|
284 |
"contriever-base-msmarco",
|
|
|
285 |
"dfm-encoder-large-v1",
|
286 |
"dfm-sentence-encoder-large-1",
|
287 |
"distiluse-base-multilingual-cased-v2",
|
|
|
288 |
"e5-base",
|
289 |
"e5-large",
|
290 |
"e5-small",
|
|
|
|
|
291 |
"gbert-base",
|
292 |
"gbert-large",
|
293 |
"gelectra-base",
|
|
|
315 |
"norbert3-large",
|
316 |
"paraphrase-multilingual-MiniLM-L12-v2",
|
317 |
"paraphrase-multilingual-mpnet-base-v2",
|
|
|
318 |
"sentence-t5-base",
|
319 |
"sentence-t5-large",
|
320 |
"sentence-t5-xl",
|
321 |
"sentence-t5-xxl",
|
322 |
"sup-simcse-bert-base-uncased",
|
|
|
|
|
|
|
|
|
323 |
"text-embedding-3-small",
|
324 |
"text-embedding-3-large",
|
325 |
"text-embedding-3-large-256",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
326 |
"titan-embed-text-v1",
|
327 |
"unsup-simcse-bert-base-uncased",
|
328 |
"use-cmlm-multilingual",
|
|
|
338 |
"all-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2",
|
339 |
"all-MiniLM-L6-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2",
|
340 |
"all-mpnet-base-v2": "https://huggingface.co/sentence-transformers/all-mpnet-base-v2",
|
|
|
|
|
341 |
"bert-base-uncased": "https://huggingface.co/bert-base-uncased",
|
|
|
|
|
|
|
|
|
342 |
"contriever-base-msmarco": "https://huggingface.co/nthakur/contriever-base-msmarco",
|
|
|
|
|
343 |
"distiluse-base-multilingual-cased-v2": "https://huggingface.co/sentence-transformers/distiluse-base-multilingual-cased-v2",
|
344 |
"dfm-encoder-large-v1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
|
345 |
"dfm-sentence-encoder-large-1": "https://huggingface.co/chcaa/dfm-encoder-large-v1",
|
346 |
"e5-base": "https://huggingface.co/intfloat/e5-base",
|
347 |
"e5-large": "https://huggingface.co/intfloat/e5-large",
|
348 |
"e5-small": "https://huggingface.co/intfloat/e5-small",
|
|
|
|
|
349 |
"gbert-base": "https://huggingface.co/deepset/gbert-base",
|
350 |
"gbert-large": "https://huggingface.co/deepset/gbert-large",
|
351 |
"gelectra-base": "https://huggingface.co/deepset/gelectra-base",
|
|
|
373 |
"norbert3-large": "https://huggingface.co/ltg/norbert3-large",
|
374 |
"paraphrase-multilingual-mpnet-base-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2",
|
375 |
"paraphrase-multilingual-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2",
|
|
|
376 |
"sentence-t5-base": "https://huggingface.co/sentence-transformers/sentence-t5-base",
|
377 |
"sentence-t5-large": "https://huggingface.co/sentence-transformers/sentence-t5-large",
|
378 |
"sentence-t5-xl": "https://huggingface.co/sentence-transformers/sentence-t5-xl",
|
379 |
"sentence-t5-xxl": "https://huggingface.co/sentence-transformers/sentence-t5-xxl",
|
380 |
"sup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/sup-simcse-bert-base-uncased",
|
|
|
|
|
|
|
|
|
381 |
"text-embedding-3-small": "https://openai.com/blog/new-embedding-models-and-api-updates",
|
382 |
"text-embedding-3-large": "https://openai.com/blog/new-embedding-models-and-api-updates",
|
383 |
"text-embedding-3-large-256": "https://openai.com/blog/new-embedding-models-and-api-updates",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
384 |
"titan-embed-text-v1": "https://docs.aws.amazon.com/bedrock/latest/userguide/embeddings.html",
|
385 |
"unsup-simcse-bert-base-uncased": "https://huggingface.co/princeton-nlp/unsup-simcse-bert-base-uncased",
|
386 |
"use-cmlm-multilingual": "https://huggingface.co/sentence-transformers/use-cmlm-multilingual",
|
|
|
395 |
"all-MiniLM-L6-v2": 384,
|
396 |
"all-mpnet-base-v2": 768,
|
397 |
"allenai-specter": 768,
|
|
|
|
|
398 |
"bert-base-uncased": 768,
|
|
|
|
|
|
|
|
|
399 |
"contriever-base-msmarco": 768,
|
|
|
|
|
400 |
"distiluse-base-multilingual-cased-v2": 512,
|
401 |
"dfm-encoder-large-v1": 1024,
|
402 |
"dfm-sentence-encoder-large-1": 1024,
|
403 |
"e5-base": 768,
|
404 |
"e5-small": 384,
|
405 |
"e5-large": 1024,
|
|
|
|
|
406 |
"luotuo-bert-medium": 768,
|
407 |
"LASER2": 1024,
|
408 |
"LaBSE": 768,
|
|
|
430 |
"norbert3-large": 1024,
|
431 |
"paraphrase-multilingual-MiniLM-L12-v2": 384,
|
432 |
"paraphrase-multilingual-mpnet-base-v2": 768,
|
|
|
433 |
"sentence-t5-base": 768,
|
434 |
"sentence-t5-large": 768,
|
435 |
"sentence-t5-xl": 768,
|
436 |
"sentence-t5-xxl": 768,
|
437 |
"sup-simcse-bert-base-uncased": 768,
|
|
|
|
|
|
|
|
|
438 |
"text-embedding-3-large": 3072,
|
439 |
"text-embedding-3-large-256": 256,
|
440 |
"text-embedding-3-small": 1536,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
441 |
"titan-embed-text-v1": 1536,
|
442 |
"unsup-simcse-bert-base-uncased": 768,
|
443 |
"use-cmlm-multilingual": 768,
|
|
|
452 |
"all-MiniLM-L6-v2": 512,
|
453 |
"all-mpnet-base-v2": 514,
|
454 |
"allenai-specter": 512,
|
455 |
+
"bert-base-uncased": 512,
|
456 |
+
"contriever-base-msmarco": 512,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
457 |
"dfm-encoder-large-v1": 512,
|
458 |
"dfm-sentence-encoder-large-1": 512,
|
459 |
"distiluse-base-multilingual-cased-v2": 512,
|
460 |
"e5-base": 512,
|
461 |
"e5-large": 512,
|
462 |
"e5-small": 512,
|
|
|
|
|
463 |
"gbert-base": 512,
|
464 |
"gbert-large": 512,
|
465 |
"gelectra-base": 512,
|
|
|
487 |
"norbert3-large": 512,
|
488 |
"paraphrase-multilingual-MiniLM-L12-v2": 512,
|
489 |
"paraphrase-multilingual-mpnet-base-v2": 514,
|
|
|
490 |
"sentence-t5-base": 512,
|
491 |
"sentence-t5-large": 512,
|
492 |
"sentence-t5-xl": 512,
|
493 |
"sentence-t5-xxl": 512,
|
494 |
"sup-simcse-bert-base-uncased": 512,
|
|
|
|
|
|
|
|
|
495 |
"text-embedding-3-large": 8191,
|
496 |
"text-embedding-3-large-256": 8191,
|
497 |
"text-embedding-3-small": 8191,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
498 |
"titan-embed-text-v1": 8000,
|
499 |
"use-cmlm-multilingual": 512,
|
500 |
"unsup-simcse-bert-base-uncased": 512,
|
|
|
509 |
"all-MiniLM-L12-v2": 0.13,
|
510 |
"all-MiniLM-L6-v2": 0.09,
|
511 |
"all-mpnet-base-v2": 0.44,
|
512 |
+
"bert-base-uncased": 0.44,
|
|
|
|
|
|
|
|
|
|
|
|
|
513 |
"contriever-base-msmarco": 0.44,
|
|
|
514 |
"distiluse-base-multilingual-cased-v2": 0.54,
|
515 |
"dfm-encoder-large-v1": 1.42,
|
516 |
"dfm-sentence-encoder-large-1": 1.63,
|
517 |
"e5-base": 0.44,
|
518 |
"e5-small": 0.13,
|
519 |
"e5-large": 1.34,
|
|
|
|
|
520 |
"gbert-base": 0.44,
|
521 |
"gbert-large": 1.35,
|
522 |
"gelectra-base": 0.44,
|
|
|
544 |
"norbert3-large": 1.47,
|
545 |
"paraphrase-multilingual-mpnet-base-v2": 1.11,
|
546 |
"paraphrase-multilingual-MiniLM-L12-v2": 0.47,
|
|
|
547 |
"sentence-t5-base": 0.22,
|
548 |
"sentence-t5-large": 0.67,
|
549 |
"sentence-t5-xl": 2.48,
|
550 |
"sentence-t5-xxl": 9.73,
|
551 |
+
"sup-simcse-bert-base-uncased": 0.44,
|
|
|
|
|
|
|
|
|
552 |
"unsup-simcse-bert-base-uncased": 0.44,
|
553 |
"use-cmlm-multilingual": 1.89,
|
554 |
"xlm-roberta-base": 1.12,
|