Merge branch 'main' of https://huggingface.co/togethercomputer/m2-bert-80M-2k-retrieval into main
Browse files
- README.md +2 -2
- config.json +1 -1
README.md
CHANGED
@@ -2,7 +2,7 @@
|
|
2 |
license: apache-2.0
|
3 |
language:
|
4 |
- en
|
5 |
-
pipeline_tag:
|
6 |
inference: false
|
7 |
---
|
8 |
|
@@ -104,4 +104,4 @@ If you use this model, or otherwise found our work valuable, you can cite us as
|
|
104 |
booktitle={Advances in Neural Information Processing Systems},
|
105 |
year={2023}
|
106 |
}
|
107 |
-
```
|
|
|
2 |
license: apache-2.0
|
3 |
language:
|
4 |
- en
|
5 |
+
pipeline_tag: sentence-similarity
|
6 |
inference: false
|
7 |
---
|
8 |
|
|
|
104 |
booktitle={Advances in Neural Information Processing Systems},
|
105 |
year={2023}
|
106 |
}
|
107 |
+
```
|
config.json
CHANGED
@@ -30,7 +30,7 @@
|
|
30 |
"long_conv_kernel_learning_rate": 0.001,
|
31 |
"long_conv_l_max": 2048,
|
32 |
"max_position_embeddings": 2048,
|
33 |
-
"model_type": "
|
34 |
"monarch_mlp_nblocks": 4,
|
35 |
"num_attention_heads": 12,
|
36 |
"num_hidden_layers": 12,
|
|
|
30 |
"long_conv_kernel_learning_rate": 0.001,
|
31 |
"long_conv_l_max": 2048,
|
32 |
"max_position_embeddings": 2048,
|
33 |
+
"model_type": "m2_bert",
|
34 |
"monarch_mlp_nblocks": 4,
|
35 |
"num_attention_heads": 12,
|
36 |
"num_hidden_layers": 12,
|