Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +40 -0
- added_tokens.json +4 -0
- config.json +26 -0
- mergekit_config.yml +7 -0
- model-00001-of-00165.safetensors +3 -0
- model-00002-of-00165.safetensors +3 -0
- model-00003-of-00165.safetensors +3 -0
- model-00004-of-00165.safetensors +3 -0
- model-00005-of-00165.safetensors +3 -0
- model-00006-of-00165.safetensors +3 -0
- model-00007-of-00165.safetensors +3 -0
- model-00008-of-00165.safetensors +3 -0
- model-00009-of-00165.safetensors +3 -0
- model-00010-of-00165.safetensors +3 -0
- model-00011-of-00165.safetensors +3 -0
- model-00012-of-00165.safetensors +3 -0
- model-00013-of-00165.safetensors +3 -0
- model-00014-of-00165.safetensors +3 -0
- model-00015-of-00165.safetensors +3 -0
- model-00016-of-00165.safetensors +3 -0
- model-00017-of-00165.safetensors +3 -0
- model-00018-of-00165.safetensors +3 -0
- model-00019-of-00165.safetensors +3 -0
- model-00020-of-00165.safetensors +3 -0
- model-00021-of-00165.safetensors +3 -0
- model-00022-of-00165.safetensors +3 -0
- model-00023-of-00165.safetensors +3 -0
- model-00024-of-00165.safetensors +3 -0
- model-00025-of-00165.safetensors +3 -0
- model-00026-of-00165.safetensors +3 -0
- model-00027-of-00165.safetensors +3 -0
- model-00028-of-00165.safetensors +3 -0
- model-00029-of-00165.safetensors +3 -0
- model-00030-of-00165.safetensors +3 -0
- model-00031-of-00165.safetensors +3 -0
- model-00032-of-00165.safetensors +3 -0
- model-00033-of-00165.safetensors +3 -0
- model-00034-of-00165.safetensors +3 -0
- model-00035-of-00165.safetensors +3 -0
- model-00036-of-00165.safetensors +3 -0
- model-00037-of-00165.safetensors +3 -0
- model-00038-of-00165.safetensors +3 -0
- model-00039-of-00165.safetensors +3 -0
- model-00040-of-00165.safetensors +3 -0
- model-00041-of-00165.safetensors +3 -0
- model-00042-of-00165.safetensors +3 -0
- model-00043-of-00165.safetensors +3 -0
- model-00044-of-00165.safetensors +3 -0
- model-00045-of-00165.safetensors +3 -0
- model-00046-of-00165.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model:
|
3 |
+
- FuseAI/OpenChat-3.5-7B-Mixtral
|
4 |
+
- openchat/openchat_3.5
|
5 |
+
- FuseAI/OpenChat-3.5-7B-Solar
|
6 |
+
library_name: transformers
|
7 |
+
tags:
|
8 |
+
- mergekit
|
9 |
+
- merge
|
10 |
+
|
11 |
+
---
|
12 |
+
# merge
|
13 |
+
|
14 |
+
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
15 |
+
|
16 |
+
## Merge Details
|
17 |
+
### Merge Method
|
18 |
+
|
19 |
+
This model was merged using the [Model Stock](https://arxiv.org/abs/2403.19522) merge method, with [openchat/openchat_3.5](https://huggingface.co/openchat/openchat_3.5) as the base model.
|
20 |
+
|
21 |
+
### Models Merged
|
22 |
+
|
23 |
+
The following models were included in the merge:
|
24 |
+
* [FuseAI/OpenChat-3.5-7B-Mixtral](https://huggingface.co/FuseAI/OpenChat-3.5-7B-Mixtral)
|
25 |
+
* [FuseAI/OpenChat-3.5-7B-Solar](https://huggingface.co/FuseAI/OpenChat-3.5-7B-Solar)
|
26 |
+
|
27 |
+
### Configuration
|
28 |
+
|
29 |
+
The following YAML configuration was used to produce this model:
|
30 |
+
|
31 |
+
```yaml
|
32 |
+
models:
|
33 |
+
- model: openchat/openchat_3.5
|
34 |
+
- model: FuseAI/OpenChat-3.5-7B-Mixtral
|
35 |
+
- model: FuseAI/OpenChat-3.5-7B-Solar
|
36 |
+
merge_method: model_stock
|
37 |
+
base_model: openchat/openchat_3.5
|
38 |
+
dtype: bfloat16
|
39 |
+
|
40 |
+
```
|
added_tokens.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|end_of_turn|>": 32000,
|
3 |
+
"<|pad_0|>": 32001
|
4 |
+
}
|
config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "openchat/openchat_3.5",
|
3 |
+
"architectures": [
|
4 |
+
"MistralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 32000,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 4096,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 14336,
|
13 |
+
"max_position_embeddings": 8192,
|
14 |
+
"model_type": "mistral",
|
15 |
+
"num_attention_heads": 32,
|
16 |
+
"num_hidden_layers": 32,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"rms_norm_eps": 1e-05,
|
19 |
+
"rope_theta": 10000.0,
|
20 |
+
"sliding_window": 4096,
|
21 |
+
"tie_word_embeddings": false,
|
22 |
+
"torch_dtype": "bfloat16",
|
23 |
+
"transformers_version": "4.38.2",
|
24 |
+
"use_cache": true,
|
25 |
+
"vocab_size": 32002
|
26 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
models:
|
2 |
+
- model: openchat/openchat_3.5
|
3 |
+
- model: FuseAI/OpenChat-3.5-7B-Mixtral
|
4 |
+
- model: FuseAI/OpenChat-3.5-7B-Solar
|
5 |
+
merge_method: model_stock
|
6 |
+
base_model: openchat/openchat_3.5
|
7 |
+
dtype: bfloat16
|
model-00001-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce93532eb1d560a2e65e639f7b3aa50267fb419a9785d8375b310d56daa9ca78
|
3 |
+
size 117440664
|
model-00002-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ab13d889b27b3e3791e0b8d199951ced886771e8f93d9c53ed545669e5fda3d
|
3 |
+
size 117440656
|
model-00003-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae825884bd94a02efa04d99e942a3c08a1bf0d2e2685f5b89339b66146cac996
|
3 |
+
size 50332024
|
model-00004-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97fc5ddff77b2451c8122010d17f97daed28e68439b565e1a429f207a98eeede
|
3 |
+
size 33554584
|
model-00005-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5cc1cb1c683a0a1ee6fc7b4402f36e05bfeb30b4f2801720fbcdd1dba0a4a9b
|
3 |
+
size 117440664
|
model-00006-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df34bc6fed299bb3d4e275c738c599fc7da3dd7ad9975ae66ebfe719a7d40f72
|
3 |
+
size 117440664
|
model-00007-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03eeb608b0f1ce4c046e51915e0fdf64b55d01eb831b4d80aaa1fa99cb01f26e
|
3 |
+
size 117440656
|
model-00008-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01b4770b33493a4af9e5358e5c24f146b040eb0f98d07a7e205671a2dcb67837
|
3 |
+
size 50340320
|
model-00009-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bfc0e7e05faa58f40ef1dab7d6d2fbda721ac98405936057a74ad264c3c58c6
|
3 |
+
size 33562872
|
model-00010-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c92742f20959349e316ee175bd82887bdd4e6da63b73fdfc16009e79b8ebd843
|
3 |
+
size 117440664
|
model-00011-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16551728ad65bc9067d5ff16525f349cc5826069286bf52c8fab6f8665615283
|
3 |
+
size 117440664
|
model-00012-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0c72eba5c1727e5a7ec35c15628cd5022c66a04349633270627f0721f52719f
|
3 |
+
size 117440656
|
model-00013-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aef14a63b73926e6a8ad59683d136eecc8d76e72700cdbdbce680df27d65bff1
|
3 |
+
size 50340320
|
model-00014-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b16c5fe4d9b9007bce6ff019018563c03968fb2b3d8d1cf8d4ec920d789e8233
|
3 |
+
size 33562872
|
model-00015-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb7670ae7cec3322253f19870b57814a91241d42f4be330ce52e7b53b20479eb
|
3 |
+
size 117440664
|
model-00016-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6643039826ee39ea0b7b091defc090bdad98c5d5f4f07ff4452a1cbbf87c2087
|
3 |
+
size 117440664
|
model-00017-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24bcb4f02d9d97102f1cfd7ad267fdcf4bef831257cc8a622274980689186c4d
|
3 |
+
size 117440656
|
model-00018-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cd04fafbaaa6e44bbef79e8a317fad9e60cc9c63944867174ab0ee8e3b74156
|
3 |
+
size 50340320
|
model-00019-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7689c07b7986f93387f45696f74f6548101dba0fb0de61f1fe83d7987729bdc2
|
3 |
+
size 33562872
|
model-00020-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c6a82b32e991ca4894e38863382daf48cd12769e4de0416f4be3f429004fbb
|
3 |
+
size 117440664
|
model-00021-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff3758a1620ffc60e5116cd82a432f23082c2880b11cbe0a1a94cc9ea58681ed
|
3 |
+
size 117440664
|
model-00022-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc97b41ad393ec7d144796c861907fedbe961be14407094ee7248e9b952a5d24
|
3 |
+
size 117440656
|
model-00023-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:346a26e531d31bacfacd8401e0b2d5ae01d521ec7e0ada58dc15d74469d1a12f
|
3 |
+
size 50340320
|
model-00024-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac45125c80b6d866647d2c1be918f32c728377fa273f079ed94b26e2f6371061
|
3 |
+
size 33562872
|
model-00025-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cbab63590a2a0670fc597c587a8f9d6c82c0a1b540324ca1cfbfadf43ff903d
|
3 |
+
size 117440664
|
model-00026-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21cf36398d18cc1c3ea8f44bc93231becbe007fb7825d94ab26f9b011f8f1d4e
|
3 |
+
size 117440664
|
model-00027-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:141a0c5f3f50aa41f07a8f0628f72d9c828dec9c57d09c7a3a1c6e93cff7375f
|
3 |
+
size 117440656
|
model-00028-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2300d3acd6bdc23b9c40248a1d34afa17c4987dd695e33d9f77127cc9ab14cb1
|
3 |
+
size 50340320
|
model-00029-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeb189be1bb63400da15b80258cef9d376dfaf609d4e01e7bc92eb259d436889
|
3 |
+
size 33562872
|
model-00030-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4491060437ca170b8f775f918eb70d04b7ca0c37c63ffcc803c1b04ccbb7fbe4
|
3 |
+
size 117440664
|
model-00031-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:061b5a5aee57fabad93d232295dc78cdd2585610f3a5d7459be593989da9dc2f
|
3 |
+
size 117440664
|
model-00032-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f81ae5879b01a5fbcd2e099127ef909a0e98c18bfcc1fda66f62c823836cb2e3
|
3 |
+
size 117440656
|
model-00033-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eacdeceaae2adbe975e2be481d0d8bf1b52a461522ec8b5816c4a5907c18e912
|
3 |
+
size 50340320
|
model-00034-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4564bf8937512653ddf5f36bfd8f5ac24a66f503effa2120ff9434ba7f1c96b2
|
3 |
+
size 33562872
|
model-00035-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:326fd974e1e7f45d4136d0bf4d2827f426dd695b8fc4cb46056f5563172e5096
|
3 |
+
size 117440664
|
model-00036-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ffccac9a80b65b451c3a16cbe1c384448fe27ed3abb9fa6df35fee4110d6d90
|
3 |
+
size 117440664
|
model-00037-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:548d545bea0111e33ddf5f55ac1a4226d179518f93131484014a10162c0ee137
|
3 |
+
size 117440656
|
model-00038-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01bd4c6a943b4073ac3015bb70d4d421934489cc662774dd509f888af5260a52
|
3 |
+
size 50340320
|
model-00039-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77af5c9ecc93f712092f5b107f5d5511dd643e5d1e7c20e6fd303a59125aea05
|
3 |
+
size 33562872
|
model-00040-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d5d8e1aeb8c226b82aaff389558f76537d21ca17c427593929de4fc6bc8cf77
|
3 |
+
size 117440664
|
model-00041-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f530436252ee6d76352954f38db20657cd84ab1c5ba777fa5b14a0eedcc8e70
|
3 |
+
size 117440664
|
model-00042-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea54e7fdb5120fbe1fa2d0055e6d683e988fc8174cdd2f2d73752a85caefb55f
|
3 |
+
size 117440656
|
model-00043-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41f201103d208edff2b9f98034016d6420913fbcc8bf61c3025fb611111c8a3a
|
3 |
+
size 50340320
|
model-00044-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:425bdbc71f894f2310d1e0b3cd4b0d68d7bfc0864a82424f1ebf41e0d2367967
|
3 |
+
size 33562872
|
model-00045-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f63246176962ddaee486856c969c088706753d4a0f9e4e4336e280cc30917453
|
3 |
+
size 117440664
|
model-00046-of-00165.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42f1a068b8c41edbc0ab9e5720916d6a5afe21fbffea569ccc75b8fc1f2df51a
|
3 |
+
size 117440664
|