Make compatible with sentence-transformers (#10)
Browse files
- Create 1_Pooling/config.json (0f70498f958347edab17f3b8779f9ecdcd1eeadc)
- Update 1_Pooling/config.json (a67fee46332d9fdc30942ae03ed1f6b0b032547a)
- Create sentence_bert_config.json (a2d0739b4e768032c2d0d1829ad1d5379bdda27c)
- Create modules.json (be17b6f9ac568ce4a977495f80968e53b999c3a8)
- Update sentence_bert_config.json (0eb14a491b64ce772c9def7f0ef3087b9f7e4588)
- Update tokenizer_config.json (d1a50b3624e901f12f9f4808126c30f6b01247a0)
- Update modules.json (807090377c246ba0eb0c6340fb6bbf7cca224a8a)
Co-authored-by: Michael <michaelfeil@users.noreply.huggingface.co>
- 1_Pooling/config.json +10 -0
- modules.json +14 -0
- sentence_bert_config.json +4 -0
- tokenizer_config.json +1 -1
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 4096,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": false,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": true,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 32768,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
tokenizer_config.json
CHANGED
@@ -61,7 +61,7 @@
|
|
61 |
"clean_up_tokenization_spaces": false,
|
62 |
"eos_token": "</s>",
|
63 |
"legacy": true,
|
64 |
-
"model_max_length":
|
65 |
"pad_token": "<unk>",
|
66 |
"sp_model_kwargs": {},
|
67 |
"spaces_between_special_tokens": false,
|
|
|
61 |
"clean_up_tokenization_spaces": false,
|
62 |
"eos_token": "</s>",
|
63 |
"legacy": true,
|
64 |
+
"model_max_length": 32768,
|
65 |
"pad_token": "<unk>",
|
66 |
"sp_model_kwargs": {},
|
67 |
"spaces_between_special_tokens": false,
|