Upload ONNX weights (+ Transformers.js integration)

by Xenova HF staff - opened Jun 25

base: refs/heads/main

←

from: refs/pr/9

Discussion Files changed

+83

-0

Files changed (8) hide show

README.md +62 -0
onnx/model.onnx +3 -0
onnx/model_bnb4.onnx +3 -0
onnx/model_fp16.onnx +3 -0
onnx/model_int8.onnx +3 -0
onnx/model_q4.onnx +3 -0
onnx/model_quantized.onnx +3 -0
onnx/model_uint8.onnx +3 -0

README.md CHANGED Viewed

@@ -4,6 +4,7 @@ tags:
 - transformers
 - reranker
 - cross-encoder
 language:
 - multilingual
 inference: false
@@ -127,6 +128,67 @@ pip install flash-attn --no-build-isolation
 ```
 Enjoy the 3x-6x speedup with flash attention! ⚡️⚡️⚡️
 That's it! You can now use the `jina-reranker-v2-base-multilingual` model in your projects.

 - transformers
 - reranker
 - cross-encoder
+- transformers.js
 language:
 - multilingual
 inference: false
 ```
 Enjoy the 3x-6x speedup with flash attention! ⚡️⚡️⚡️
+3. You can also use the `transformers.js` library to run the model directly in JavaScript (in-browser, Node.js, Deno, etc.)!
+If you haven't already, you can install the [Transformers.js](https://huggingface.co/docs/transformers.js) JavaScript library (v3) using:
+```bash
+npm i xenova/transformers.js#v3
+```
+Then, you can use the following code to interact with the model:
+```js
+import { AutoTokenizer, XLMRobertaModel } from '@xenova/transformers';
+const model_id = 'jinaai/jina-reranker-v2-base-multilingual';
+const model = await XLMRobertaModel.from_pretrained(model_id, { dtype: 'fp32' });
+const tokenizer = await AutoTokenizer.from_pretrained(model_id);
+/**
+ * Performs ranking with the CrossEncoder on the given query and documents. Returns a sorted list with the document indices and scores.
+ * @param {string} query A single query
+ * @param {string[]} documents A list of documents
+ * @param {Object} options Options for ranking
+ * @param {number} [options.top_k=undefined] Return the top-k documents. If undefined, all documents are returned.
+ * @param {boolean} [options.return_documents=false] If true, also returns the documents. If false, only returns the indices and scores.
+ */
+async function rank(query, documents, {
+    top_k = undefined,
+    return_documents = false,
+} = {}) {
+    const inputs = tokenizer(
+        new Array(documents.length).fill(query),
+        { text_pair: documents, padding: true, truncation: true }
+    )
+    const { logits } = await model(inputs);
+    return logits.sigmoid().tolist()
+        .map(([score], i) => ({
+            corpus_id: i,
+            score,
+            ...(return_documents ? { text: documents[i] } : {})
+        })).sort((a, b) => b.score - a.score).slice(0, top_k);
+}
+// Example usage:
+const query = "Organic skincare products for sensitive skin"
+const documents = [
+    "Organic skincare for sensitive skin with aloe vera and chamomile.",
+    "New makeup trends focus on bold colors and innovative techniques",
+    "Bio-Hautpflege für empfindliche Haut mit Aloe Vera und Kamille",
+    "Neue Make-up-Trends setzen auf kräftige Farben und innovative Techniken",
+    "Cuidado de la piel orgánico para piel sensible con aloe vera y manzanilla",
+    "Las nuevas tendencias de maquillaje se centran en colores vivos y técnicas innovadoras",
+    "针对敏感肌专门设计的天然有机护肤产品",
+    "新的化妆趋势注重鲜艳的颜色和创新的技巧",
+    "敏感肌のために特別に設計された天然有機スキンケア製品",
+    "新しいメイクのトレンドは鮮やかな色と革新的な技術に焦点を当てています",
+]
+const results = await rank(query, documents, { return_documents: true, top_k: 3 });
+console.log(results);
+```
 That's it! You can now use the `jina-reranker-v2-base-multilingual` model in your projects.

onnx/model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ef3f7978f7bc52360864d74edc1a0e03d159af770a7767c4d5943496e616012
+size 1114040223

onnx/model_bnb4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df70759eb3ebb4e96b7d82e9af1e99c4979f76b96205ea18dddb101d32b07f80
+size 822084838

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ad94bcc1d7313ec5f76e18de8ffa7469e3f34b76810b8fd7206619b9cde1bc4
+size 557164815

onnx/model_int8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5220cf8fe023f8aa0ed2a3eb787d4451a7f17cf53f6b787e35718dd4b8815c3
+size 279577152

onnx/model_q4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a3744ee702adeb08230fba13258cc4ad441b73310a1060df2066bebbda080de7
+size 827392882

onnx/model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5220cf8fe023f8aa0ed2a3eb787d4451a7f17cf53f6b787e35718dd4b8815c3
+size 279577152

onnx/model_uint8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9498f606988b84e23b98d04101f3623c084baf3f1e16fd43a46ea6259b4f5924
+size 279577151