alixnaveed committed on
Commit
795c6c6
1 Parent(s): a5e85a8

Add new SentenceTransformer model.

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. config.json +1 -1
  3. model.safetensors +1 -1
  4. tokenizer_config.json +7 -0
README.md CHANGED
@@ -47,9 +47,9 @@ The model was trained with the parameters:
47
 
48
  **DataLoader**:
49
 
50
- `torch.utils.data.dataloader.DataLoader` of length 4612 with parameters:
51
  ```
52
- {'batch_size': 2, 'sampler': 'torch.utils.data.sampler.RandomSampler', 'batch_sampler': 'torch.utils.data.sampler.BatchSampler'}
53
  ```
54
 
55
  **Loss**:
@@ -72,7 +72,7 @@ Parameters of the fit()-Method:
72
  },
73
  "scheduler": "WarmupLinear",
74
  "steps_per_epoch": null,
75
- "warmup_steps": 46120,
76
  "weight_decay": 0.01
77
  }
78
  ```
 
47
 
48
  **DataLoader**:
49
 
50
+ `torch.utils.data.dataloader.DataLoader` of length 1153 with parameters:
51
  ```
52
+ {'batch_size': 8, 'sampler': 'torch.utils.data.sampler.RandomSampler', 'batch_sampler': 'torch.utils.data.sampler.BatchSampler'}
53
  ```
54
 
55
  **Loss**:
 
72
  },
73
  "scheduler": "WarmupLinear",
74
  "steps_per_epoch": null,
75
+ "warmup_steps": 11530,
76
  "weight_decay": 0.01
77
  }
78
  ```
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "intfloat/multilingual-e5-base",
3
  "architectures": [
4
  "XLMRobertaModel"
5
  ],
 
1
  {
2
+ "_name_or_path": "alixnaveed/MERGEDMODELV1",
3
  "architectures": [
4
  "XLMRobertaModel"
5
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:046a3d93889f2b0cf41c0bc4ad87b55420047c896cf9c1eccdd49ba2c44e7f81
3
  size 1112197096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2446871b3ba7dc244657e8c12717aba6ccc3ee0ef333c8b4b32d3e30e25b8c5
3
  size 1112197096
tokenizer_config.json CHANGED
@@ -46,9 +46,16 @@
46
  "cls_token": "<s>",
47
  "eos_token": "</s>",
48
  "mask_token": "<mask>",
 
49
  "model_max_length": 512,
 
50
  "pad_token": "<pad>",
 
 
51
  "sep_token": "</s>",
 
52
  "tokenizer_class": "XLMRobertaTokenizer",
 
 
53
  "unk_token": "<unk>"
54
  }
 
46
  "cls_token": "<s>",
47
  "eos_token": "</s>",
48
  "mask_token": "<mask>",
49
+ "max_length": 512,
50
  "model_max_length": 512,
51
+ "pad_to_multiple_of": null,
52
  "pad_token": "<pad>",
53
+ "pad_token_type_id": 0,
54
+ "padding_side": "right",
55
  "sep_token": "</s>",
56
+ "stride": 0,
57
  "tokenizer_class": "XLMRobertaTokenizer",
58
+ "truncation_side": "right",
59
+ "truncation_strategy": "longest_first",
60
  "unk_token": "<unk>"
61
  }