lv12 committed
Commit b9d6070
1 Parent(s): 66df9c3

Add new SentenceTransformer model.

Files changed (3):
  1. README.md +117 -177
  2. config.json +1 -1
  3. model.safetensors +1 -1
README.md CHANGED
@@ -5,67 +5,36 @@ tags:
  - sentence-transformers
  - sentence-similarity
  - feature-extraction
- - dataset_size:1K<n<10K
+ - dataset_size:1M<n<10M
  - loss:CachedGISTEmbedLoss
  base_model: nomic-ai/nomic-embed-text-v1.5
- metrics:
- - cosine_accuracy
- - dot_accuracy
- - manhattan_accuracy
- - euclidean_accuracy
- - max_accuracy
  widget:
- - source_sentence: Pilot
+ - source_sentence: 'search_query: 楢崎壮太'
    sentences:
-   - Episode Two
-   - dog dinosaur bone
-   - 10' x 12' gazebo
+   - 'search_query: 野崎萌香'
+   - 'search_query: ps4 slim 1tb'
+   - 'search_query: toy story 4 on dvd'
- - source_sentence: skull
+ - source_sentence: 'search_query: テプラ'
    sentences:
-   - cool head s
-   - trunk bike rack 4
-   - bread without gluten
+   - 'search_query: 携帯デコシール'
+   - 'search_query: womens boots'
+   - 'search_query: nfl gift'
- - source_sentence: pipes
+ - source_sentence: 'search_query: 扇子 布'
    sentences:
-   - chillum pipe
-   - Deckle Edge Ruler
-   - dog collar for boxer
+   - 'search_query: 天気の子'
+   - 'search_query: 登山ぐつ メンズ 紐なし'
+   - 'search_query: 10gbe switch'
- - source_sentence: ddj400
+ - source_sentence: 'search_query: リング棒'
    sentences:
-   - lc27h711qenxza
-   - bed frame for full
-   - chicago bears gifts
+   - 'search_query: ライトショアジギング'
+   - 'search_query: auvハンガーすべらない'
+   - 'search_query: plastic drum lid'
- - source_sentence: primes
+ - source_sentence: 'search_query: 聖 龍人'
    sentences:
-   - Newton
-   - big boys sneakers
-   - large dog clothes
+   - 'search_query: 越前かに職人甲羅組'
+   - 'search_query: tea tree oil'
+   - 'search_query: lift storage bed'
  pipeline_tag: sentence-similarity
- model-index:
- - name: SentenceTransformer based on nomic-ai/nomic-embed-text-v1.5
-   results:
-   - task:
-       type: triplet
-       name: Triplet
-     dataset:
-       name: esci dev
-       type: esci-dev
-     metrics:
-     - type: cosine_accuracy
-       value: 0.6414052697616061
-       name: Cosine Accuracy
-     - type: dot_accuracy
-       value: 0.36637390213299875
-       name: Dot Accuracy
-     - type: manhattan_accuracy
-       value: 0.6404015056461732
-       name: Manhattan Accuracy
-     - type: euclidean_accuracy
-       value: 0.6406524466750314
-       name: Euclidean Accuracy
-     - type: max_accuracy
-       value: 0.6414052697616061
-       name: Max Accuracy
  ---

  # SentenceTransformer based on nomic-ai/nomic-embed-text-v1.5
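Note: the new widget entries bake the nomic-style `search_query: ` prefix into every string, replacing the old raw ESCI queries. As a hedged aside (this wiring is not shown in the card itself), recent sentence-transformers releases can also attach such prefixes as named prompts at load time, so callers do not concatenate them by hand; the model id below is the card's own placeholder:

```python
from sentence_transformers import SentenceTransformer

# Placeholder id, as in the card's usage snippet; trust_remote_code is
# typically required for the custom NomicBertModel code.
model = SentenceTransformer(
    "sentence_transformers_model_id",
    trust_remote_code=True,
    prompts={
        "query": "search_query: ",
        "document": "search_document: ",
    },
)

# The "query" prompt prepends "search_query: " before encoding.
embeddings = model.encode(["ps4 slim 1tb"], prompt_name="query")
print(embeddings.shape)
```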
@@ -117,9 +86,9 @@ from sentence_transformers import SentenceTransformer
  model = SentenceTransformer("sentence_transformers_model_id")
  # Run inference
  sentences = [
-     'primes',
-     'Newton',
-     'big boys sneakers',
+     'search_query: 聖 龍人',
+     'search_query: 越前かに職人甲羅組',
+     'search_query: tea tree oil',
  ]
  embeddings = model.encode(sentences)
  print(embeddings.shape)
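After encoding, stock sentence-transformers cards score the embeddings against each other. A minimal continuation of the snippet above, assuming sentence-transformers v3+ where `SentenceTransformer.similarity` is available:

```python
# Pairwise scores for the three prefixed queries, using the model's
# configured similarity function (cosine by default).
similarities = model.similarity(embeddings, embeddings)
print(similarities.shape)  # (3, 3)
```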
@@ -155,22 +124,6 @@ You can finetune this model on your own dataset.
  *List how the model may foreseeably be misused and address what users ought not to do with the model.*
  -->

- ## Evaluation
-
- ### Metrics
-
- #### Triplet
- * Dataset: `esci-dev`
- * Evaluated with [<code>TripletEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.TripletEvaluator)
-
- | Metric             | Value      |
- |:-------------------|:-----------|
- | cosine_accuracy    | 0.6414     |
- | dot_accuracy       | 0.3664     |
- | manhattan_accuracy | 0.6404     |
- | euclidean_accuracy | 0.6407     |
- | **max_accuracy**   | **0.6414** |
-
  <!--
  ## Bias, Risks and Limitations

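This removes the Evaluation section that matched the deleted `model-index` block above. For context, those numbers come from `TripletEvaluator`, which reports the fraction of triplets where the anchor embeds closer to the positive than to the negative under each distance function. A sketch with hypothetical dev triplets (the real esci-dev split is not included in the card):

```python
from sentence_transformers import SentenceTransformer
from sentence_transformers.evaluation import TripletEvaluator

model = SentenceTransformer("sentence_transformers_model_id", trust_remote_code=True)

# Hypothetical triplets in the card's query/pos/neg format.
evaluator = TripletEvaluator(
    anchors=["search_query: womens boots"],
    positives=["search_document: Women's Leather Ankle Boot, Black, Size 8"],
    negatives=["search_document: Deckle Edge Ruler, 18 Inch"],
    name="esci-dev",
)
results = evaluator(model)  # accuracy per distance function
print(results)
```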
@@ -190,46 +143,19 @@ You can finetune this model on your own dataset.
  #### Unnamed Dataset


- * Size: 9,090 training samples
- * Columns: <code>query</code>, <code>pos</code>, and <code>neg</code>
- * Approximate statistics based on the first 1000 samples:
-   |         | query | pos | neg |
-   |:--------|:------|:----|:----|
-   | type    | string | string | string |
-   | details | <ul><li>min: 3 tokens</li><li>mean: 7.42 tokens</li><li>max: 30 tokens</li></ul> | <ul><li>min: 3 tokens</li><li>mean: 29.27 tokens</li><li>max: 87 tokens</li></ul> | <ul><li>min: 4 tokens</li><li>mean: 29.8 tokens</li><li>max: 82 tokens</li></ul> |
- * Samples:
-   | query | pos | neg |
-   |:------|:----|:----|
-   | <code>1 3/4 inch tooled belt strap without belt buckle</code> | <code>BS3501 Solid Brass Leaf Belt Buckle Fits 1-3/4"(45mm) Wide Belt</code> | <code>Nocona Men's Hired Brown Floral Eagle, 40</code> |
-   | <code>7edge phone case peacock</code> | <code>Galaxy S7 Edge Case for Girls Women Clear with Flowers Design Shockproof Protective Cell Phone Cases for Samsung Galaxy S7 Edge 5.5 Inch Cute Floral Pattern Print Flexible Slim Fit Bumper Rubber Cover</code> | <code>Galaxy S7 Case, Galaxy S7 Phone Case with HD Screen Protector for Girls Women, Gritup Cute Clear Gradient Glitter Liquid TPU Slim Phone Case for Samsung Galaxy S7 Teal/Purple</code> |
-   | <code>girls white shoes</code> | <code>adidas Women's Coast Star Shoes, ftwr White/Silver Met./ core Black, 6 M US</code> | <code>Converse Optical White M7650 - HI TOP Size 6 M US Women / 4 M US Men</code> |
- * Loss: [<code>CachedGISTEmbedLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cachedgistembedloss) with these parameters:
-   ```json
-   {'guide': SentenceTransformer(
-     (0): Transformer({'max_seq_length': 256, 'do_lower_case': False}) with Transformer model: BertModel
-     (1): Pooling({'word_embedding_dimension': 384, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
-     (2): Normalize()
-   ), 'temperature': 0.01}
-   ```
-
- ### Evaluation Dataset
-
- #### Unnamed Dataset
-
-
- * Size: 3,985 evaluation samples
- * Columns: <code>query</code>, <code>pos</code>, and <code>neg</code>
+ * Size: 1,767,572 training samples
+ * Columns: <code>anchor</code>, <code>positive</code>, and <code>negative</code>
  * Approximate statistics based on the first 1000 samples:
-   |         | query | pos | neg |
-   |:--------|:------|:----|:----|
-   | type    | string | string | string |
-   | details | <ul><li>min: 3 tokens</li><li>mean: 7.28 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 3 tokens</li><li>mean: 28.58 tokens</li><li>max: 116 tokens</li></ul> | <ul><li>min: 3 tokens</li><li>mean: 29.26 tokens</li><li>max: 79 tokens</li></ul> |
+   |         | anchor | positive | negative |
+   |:--------|:-------|:---------|:---------|
+   | type    | string | string | string |
+   | details | <ul><li>min: 7 tokens</li><li>mean: 12.26 tokens</li><li>max: 59 tokens</li></ul> | <ul><li>min: 7 tokens</li><li>mean: 31.93 tokens</li><li>max: 140 tokens</li></ul> | <ul><li>min: 7 tokens</li><li>mean: 34.3 tokens</li><li>max: 157 tokens</li></ul> |
  * Samples:
-   | query | pos | neg |
-   |:------|:----|:----|
-   | <code>colors for dining room</code> | <code>AOOS CUSTOM Dimmable LED Neon Signs for Home Bedroom Salon Dining Room Wall Decor (Customization: Texts, Designs, Logos, Languages, Colors, Sizes, Fonts, Color-Changing) (24" / 1 Line Text)</code> | <code>Jetec 5 Pieces EAT Sign Kitchen Wood Rustic Sign Arrow Wall Decor EAT Farmhouse Decoration Hanging Arrow Wooden Sign for Kitchen Wall Home Dining Room (Charming Color)</code> |
-   | <code>mix no 6 heels for women</code> | <code>DREAM PAIRS Women's Hi-Chunk Gold Glitter High Heel Pump Sandals - 6 M US</code> | <code>Fashare Womens High Heels Pointed Toe Bowtie Back Ankle Buckle Strap Wedding Evening Party Dress Pumps Shoes</code> |
-   | <code>goxlrmini</code> | <code>Singing Machine SMM-205 Unidirectional Dynamic Microphone with 10 Ft. Cord,Black, one size</code> | <code>Behringer U-Phoria Studio Pro Complete Recording Bundle with UMC202HD USB Audio Interface - With 20' 6mm Rubber XLR Microphone Cable, On-Stage MBS5000 Broadcast/Webcast Boom Arm with XLR Cable</code> |
+   | anchor | positive | negative |
+   |:-------|:---------|:---------|
+   | <code>search_query: plus tops for women</code> | <code>search_document:Just My Size Women's Plus-Size Graphic Short Sleeve V-Neck T-Shirt, White-Y07188, 5X, JUST MY SIZE, White-y07188</code> | <code>search_document:Calvin Klein Women's Regular Modern Cotton Bralette, Nymph's Thigh, S, Calvin Klein, Nymph's Thigh</code> |
+   | <code>search_query: mens black wallet trifold</code> | <code>search_document:Stealth Mode Trifold RFID Blocking Leather Wallet for Men (Black), Stealth Mode, Black</code> | <code>search_document:RFID Trifold Canvas Outdoor Sports Wallet for Kids - Front Pocket Wallet with Magic Sticker (Black), AI-DEE, Black</code> |
+   | <code>search_query: ipad pro reacondicionado 12,9</code> | <code>search_document:Apple iPad Pro (12.9 Pouces, Wi-FI, 64Go) 2018 - Gray (Renewed), Apple, Gris Espacial</code> | <code>search_document:Apple iPad Pro 3rd Generation (11-Inch, Wi-FI Only 64GB) - Space Gray (Renewed), Apple, Gris Espacial</code> |
  * Loss: [<code>CachedGISTEmbedLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cachedgistembedloss) with these parameters:
    ```json
    {'guide': SentenceTransformer(
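Both runs keep the same loss: `CachedGISTEmbedLoss` uses a small guide model to discard in-batch negatives that the guide scores as near-positives, while gradient caching keeps memory flat at large effective batch sizes. The serialized guide above (a 384-dimension, mean-pooled BertModel) is consistent with a MiniLM-class encoder, but the card does not name the checkpoint, so the one below is an assumption:

```python
from sentence_transformers import SentenceTransformer
from sentence_transformers.losses import CachedGISTEmbedLoss

model = SentenceTransformer("nomic-ai/nomic-embed-text-v1.5", trust_remote_code=True)

# Assumed guide checkpoint; the card only serializes its architecture
# (BertModel, 384-dim word embeddings, mean pooling, normalize).
guide = SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2")

loss = CachedGISTEmbedLoss(model, guide, temperature=0.01)
```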
@@ -242,9 +168,10 @@ You can finetune this model on your own dataset.
  ### Training Hyperparameters
  #### Non-Default Hyperparameters

- - `per_device_train_batch_size`: 16
- - `per_device_eval_batch_size`: 16
- - `num_train_epochs`: 10
+ - `per_device_eval_batch_size`: 2
+ - `gradient_accumulation_steps`: 2
+ - `learning_rate`: 1e-05
+ - `lr_scheduler_type`: cosine_with_restarts
  - `warmup_ratio`: 0.1
  - `fp16`: True
  - `batch_sampler`: no_duplicates
@@ -255,21 +182,21 @@ You can finetune this model on your own dataset.
  - `overwrite_output_dir`: False
  - `do_predict`: False
  - `prediction_loss_only`: True
- - `per_device_train_batch_size`: 16
- - `per_device_eval_batch_size`: 16
+ - `per_device_train_batch_size`: 8
+ - `per_device_eval_batch_size`: 2
  - `per_gpu_train_batch_size`: None
  - `per_gpu_eval_batch_size`: None
- - `gradient_accumulation_steps`: 1
+ - `gradient_accumulation_steps`: 2
  - `eval_accumulation_steps`: None
- - `learning_rate`: 5e-05
+ - `learning_rate`: 1e-05
  - `weight_decay`: 0.0
  - `adam_beta1`: 0.9
  - `adam_beta2`: 0.999
  - `adam_epsilon`: 1e-08
  - `max_grad_norm`: 1.0
- - `num_train_epochs`: 10
+ - `num_train_epochs`: 3
  - `max_steps`: -1
- - `lr_scheduler_type`: linear
+ - `lr_scheduler_type`: cosine_with_restarts
  - `lr_scheduler_kwargs`: {}
  - `warmup_ratio`: 0.1
  - `warmup_steps`: 0
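Net effect of the hyperparameter changes: the new run trains for 3 epochs instead of 10, at an effective batch size of 16 (8 per device × 2 accumulation steps), with the learning rate lowered from 5e-05 to 1e-05 and a cosine-with-restarts schedule instead of linear. A sketch of the equivalent v3 training arguments; `output_dir` is inferred from the checkpoint path visible in config.json below:

```python
from sentence_transformers import SentenceTransformerTrainingArguments
from sentence_transformers.training_args import BatchSamplers

args = SentenceTransformerTrainingArguments(
    output_dir="models/nomic-embed-text-esci",  # per config.json _name_or_path
    num_train_epochs=3,
    per_device_train_batch_size=8,
    per_device_eval_batch_size=2,
    gradient_accumulation_steps=2,
    learning_rate=1e-5,
    lr_scheduler_type="cosine_with_restarts",
    warmup_ratio=0.1,
    fp16=True,
    batch_sampler=BatchSamplers.NO_DUPLICATES,  # `no_duplicates` above
)
```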
@@ -359,65 +286,78 @@ You can finetune this model on your own dataset.
  </details>

  ### Training Logs
- | Epoch | Step | Training Loss | esci-dev_max_accuracy |
- |:------:|:----:|:-------------:|:---------------------:|
- | 0 | 0 | - | 0.6414 |
- | 0.1757 | 100 | 0.8875 | - |
- | 0.3515 | 200 | 0.5281 | - |
- | 0.5272 | 300 | 0.4621 | - |
- | 0.7030 | 400 | 0.4669 | - |
- | 0.8787 | 500 | 0.4501 | - |
- | 1.0545 | 600 | 0.5379 | - |
- | 1.2302 | 700 | 0.4288 | - |
- | 1.4060 | 800 | 0.2112 | - |
- | 1.5817 | 900 | 0.1508 | - |
- | 1.7575 | 1000 | 0.1133 | - |
- | 1.9332 | 1100 | 0.1312 | - |
- | 2.1090 | 1200 | 0.0784 | - |
- | 2.2847 | 1300 | 0.0983 | - |
- | 2.4605 | 1400 | 0.106 | - |
- | 2.6362 | 1500 | 0.1058 | - |
- | 2.8120 | 1600 | 0.0673 | - |
- | 2.9877 | 1700 | 0.0355 | - |
- | 3.1634 | 1800 | 0.0175 | - |
- | 3.3392 | 1900 | 0.0366 | - |
- | 3.5149 | 2000 | 0.0332 | - |
- | 3.6907 | 2100 | 0.0682 | - |
- | 3.8664 | 2200 | 0.0378 | - |
- | 4.0422 | 2300 | 0.0239 | - |
- | 4.2179 | 2400 | 0.0282 | - |
- | 4.3937 | 2500 | 0.0401 | - |
- | 4.5694 | 2600 | 0.0268 | - |
- | 4.7452 | 2700 | 0.0208 | - |
- | 4.9209 | 2800 | 0.0117 | - |
- | 5.0967 | 2900 | 0.0045 | - |
- | 5.2724 | 3000 | 0.0145 | - |
- | 5.4482 | 3100 | 0.029 | - |
- | 5.6239 | 3200 | 0.0009 | - |
- | 5.7996 | 3300 | 0.0033 | - |
- | 5.9754 | 3400 | 0.0088 | - |
- | 6.1511 | 3500 | 0.0014 | - |
- | 6.3269 | 3600 | 0.0027 | - |
- | 6.5026 | 3700 | 0.0021 | - |
- | 6.6784 | 3800 | 0.0001 | - |
- | 6.8541 | 3900 | 0.0025 | - |
- | 7.0299 | 4000 | 0.0059 | - |
- | 7.2056 | 4100 | 0.0025 | - |
- | 7.3814 | 4200 | 0.0029 | - |
- | 7.5571 | 4300 | 0.0007 | - |
- | 7.7329 | 4400 | 0.0018 | - |
- | 7.9086 | 4500 | 0.0032 | - |
- | 8.0844 | 4600 | 0.0007 | - |
- | 8.2601 | 4700 | 0.0027 | - |
- | 8.4359 | 4800 | 0.0027 | - |
- | 8.6116 | 4900 | 0.0 | - |
- | 8.7873 | 5000 | 0.0025 | - |
- | 8.9631 | 5100 | 0.0025 | - |
- | 9.1388 | 5200 | 0.0014 | - |
- | 9.3146 | 5300 | 0.0027 | - |
- | 9.4903 | 5400 | 0.0021 | - |
- | 9.6661 | 5500 | 0.0 | - |
- | 9.8418 | 5600 | 0.0025 | - |
+ | Epoch | Step | Training Loss |
+ |:------:|:----:|:-------------:|
+ | 0.0009 | 100 | 3.7009 |
+ | 0.0018 | 200 | 3.3796 |
+ | 0.0027 | 300 | 2.8348 |
+ | 0.0036 | 400 | 2.1803 |
+ | 0.0045 | 500 | 1.8272 |
+ | 0.0054 | 600 | 1.4715 |
+ | 0.0063 | 700 | 1.0056 |
+ | 0.0072 | 800 | 0.7984 |
+ | 0.0081 | 900 | 0.6925 |
+ | 0.0091 | 1000 | 0.6552 |
+ | 0.0100 | 1100 | 0.6054 |
+ | 0.0109 | 1200 | 0.5874 |
+ | 0.0118 | 1300 | 0.5641 |
+ | 0.0127 | 1400 | 0.528 |
+ | 0.0136 | 1500 | 0.5285 |
+ | 0.0145 | 1600 | 0.5032 |
+ | 0.0154 | 1700 | 0.5238 |
+ | 0.0163 | 1800 | 0.4565 |
+ | 0.0172 | 1900 | 0.4739 |
+ | 0.0181 | 2000 | 0.4614 |
+ | 0.0190 | 2100 | 0.4334 |
+ | 0.0199 | 2200 | 0.4217 |
+ | 0.0208 | 2300 | 0.3931 |
+ | 0.0217 | 2400 | 0.4102 |
+ | 0.0226 | 2500 | 0.3936 |
+ | 0.0235 | 2600 | 0.415 |
+ | 0.0244 | 2700 | 0.4462 |
+ | 0.0253 | 2800 | 0.3886 |
+ | 0.0263 | 2900 | 0.3887 |
+ | 0.0272 | 3000 | 0.3629 |
+ | 0.0281 | 3100 | 0.37 |
+ | 0.0290 | 3200 | 0.3861 |
+ | 0.0299 | 3300 | 0.3813 |
+ | 0.0308 | 3400 | 0.3348 |
+ | 0.0317 | 3500 | 0.3566 |
+ | 0.0326 | 3600 | 0.3674 |
+ | 0.0335 | 3700 | 0.3421 |
+ | 0.0344 | 3800 | 0.3225 |
+ | 0.0353 | 3900 | 0.406 |
+ | 0.0362 | 4000 | 0.3975 |
+ | 0.0371 | 4100 | 0.368 |
+ | 0.0380 | 4200 | 0.3481 |
+ | 0.0389 | 4300 | 0.3405 |
+ | 0.0398 | 4400 | 0.3529 |
+ | 0.0407 | 4500 | 0.3968 |
+ | 0.0416 | 4600 | 0.3634 |
+ | 0.0425 | 4700 | 0.3518 |
+ | 0.0434 | 4800 | 0.383 |
+ | 0.0444 | 4900 | 0.3261 |
+ | 0.0453 | 5000 | 0.323 |
+ | 0.0462 | 5100 | 0.3372 |
+ | 0.0471 | 5200 | 0.358 |
+ | 0.0480 | 5300 | 0.3207 |
+ | 0.0489 | 5400 | 0.341 |
+ | 0.0498 | 5500 | 0.3146 |
+ | 0.0507 | 5600 | 0.3065 |
+ | 0.0516 | 5700 | 0.3597 |
+ | 0.0525 | 5800 | 0.3352 |
+ | 0.0534 | 5900 | 0.3212 |
+ | 0.0543 | 6000 | 0.316 |
+ | 0.0552 | 6100 | 0.3405 |
+ | 0.0561 | 6200 | 0.3416 |
+ | 0.0570 | 6300 | 0.3124 |
+ | 0.0579 | 6400 | 0.3146 |
+ | 0.0588 | 6500 | 0.3043 |
+ | 0.0597 | 6600 | 0.3687 |
+ | 0.0606 | 6700 | 0.3359 |
+ | 0.0616 | 6800 | 0.3414 |
+ | 0.0625 | 6900 | 0.3161 |
+ | 0.0634 | 7000 | 0.3266 |


  ### Framework Versions
 
config.json CHANGED
@@ -1,5 +1,5 @@
  {
-   "_name_or_path": "models/nomic-embed-text-esci/checkpoint-5600",
+   "_name_or_path": "models/nomic-embed-text-esci/checkpoint-7000",
    "activation_function": "swiglu",
    "architectures": [
      "NomicBertModel"
model.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:85c0ee2699043dfafce03c1ee919a4bf7ef793421919aeb9892d0f41a6b7de62
+ oid sha256:5d84393e7281f9fa1749b614ba8833b120c31a65d73fe00f693417d03f68231c
  size 546938168