97c0044e975e80035b19b5d1ba727fa3e57f39154e5df6f5556ec0719e48c285
Browse files- ._README.md +0 -0
- ._config.json +0 -0
- ._model-00001-of-00002.safetensors +3 -0
- ._model-00001-of-00003.safetensors +3 -0
- ._model-00001-of-00004.safetensors +3 -0
- ._model-00001-of-00007.safetensors +3 -0
- ._model-00001-of-00015.safetensors +3 -0
- ._model-00002-of-00002.safetensors +3 -0
- ._model-00002-of-00003.safetensors +3 -0
- ._model-00002-of-00004.safetensors +3 -0
- ._model-00002-of-00007.safetensors +3 -0
- ._model-00002-of-00015.safetensors +3 -0
- ._model-00003-of-00003.safetensors +3 -0
- ._model-00003-of-00004.safetensors +3 -0
- ._model-00003-of-00007.safetensors +3 -0
- ._model-00003-of-00015.safetensors +3 -0
- ._model-00004-of-00004.safetensors +3 -0
- ._model-00004-of-00007.safetensors +3 -0
- ._model-00004-of-00015.safetensors +3 -0
- ._model-00005-of-00007.safetensors +3 -0
- ._model-00005-of-00015.safetensors +3 -0
- ._model-00006-of-00007.safetensors +3 -0
- ._model-00006-of-00015.safetensors +3 -0
- ._model-00007-of-00007.safetensors +3 -0
- ._model-00007-of-00015.safetensors +3 -0
- ._model-00008-of-00015.safetensors +3 -0
- ._model-00009-of-00015.safetensors +3 -0
- ._model-00010-of-00015.safetensors +3 -0
- ._model-00011-of-00015.safetensors +3 -0
- ._model-00012-of-00015.safetensors +3 -0
- ._model-00013-of-00015.safetensors +3 -0
- ._model-00014-of-00015.safetensors +3 -0
- ._model-00015-of-00015.safetensors +3 -0
- ._model.safetensors.index.json +0 -0
- ._special_tokens_map.json +0 -0
- ._tokenizer.json +0 -0
- ._tokenizer.model +3 -0
- ._tokenizer_config.json +0 -0
- ._zero_to_fp32.py +0 -0
- README.md +22 -0
- config.json +31 -0
- model-00004-of-00004.safetensors +3 -0
._README.md
ADDED
Binary file (4.1 kB). View file
|
|
._config.json
ADDED
Binary file (4.1 kB). View file
|
|
._model-00001-of-00002.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e0132362e3f14586558ea35f7deac27a808e1403b9718472218b91f2d24ff00
|
3 |
+
size 4096
|
._model-00001-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e29ea358685c1e26094bf7b0e3fd0fa2e369f17410ca5aca9c7be466d1ca526e
|
3 |
+
size 4096
|
._model-00001-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b02c2dcdc4c6aabfcd0cabb910f86695b914e882561f6c8ac355dccfc018882
|
3 |
+
size 4096
|
._model-00001-of-00007.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61b559ade639a1958997d9a951b8ef095bb8168e0672d7adc9c1b239573917cf
|
3 |
+
size 4096
|
._model-00001-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea6b8fd0dc56c93433a2f5b71438a51624703f796a5f863d55ffd011d664d0ec
|
3 |
+
size 4096
|
._model-00002-of-00002.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5764471db54bb615689a5e6570ae22453a86097500d8e635ca0b949c985c0c4d
|
3 |
+
size 4096
|
._model-00002-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb2733b7419dca4130b294a823f527390ed2187259392156ba438497fd40154e
|
3 |
+
size 4096
|
._model-00002-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76a1271127d523215ac3375f0115c45473b5fb7fe284f83faa36583fcfdf225a
|
3 |
+
size 4096
|
._model-00002-of-00007.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:117e6d093b9a15651bd48c1369b48ca95555a248b09c3fdfc49afd04b87e4f76
|
3 |
+
size 4096
|
._model-00002-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c235354f33e244fa3e4cd372bfe93ae374f23bf78ef9cb856a43dfb9d22c1d77
|
3 |
+
size 4096
|
._model-00003-of-00003.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a182c95d420ca2016bc51b581afc5c1113ebd2543b9bf6fee6932e1965115372
|
3 |
+
size 4096
|
._model-00003-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:132052a34c70aa92fcff8de9e5bde8534a4883567d5be80530abd033a3e8cb30
|
3 |
+
size 4096
|
._model-00003-of-00007.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf7feb93dc15a4ab7d646ad9c03ee0380827572d5c8f48eced51ac1cd82937e6
|
3 |
+
size 4096
|
._model-00003-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31faaeba3773c44774e0b666e8e20329e21e8567d9dce5580771afd4ffc8d7bc
|
3 |
+
size 4096
|
._model-00004-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a59f30e662b209d0b505295434ef486ad235b705912018efbc7cfcf13997457d
|
3 |
+
size 4096
|
._model-00004-of-00007.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fa3de64d5d7a2b8a9ca8f7ef98a7a07ba50830ee173df2c2988c95af1ad4a0e
|
3 |
+
size 4096
|
._model-00004-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bd0236ca79347555fd2be86dbf15e264cacef369c99b0aebac5c79c94223784
|
3 |
+
size 4096
|
._model-00005-of-00007.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6b9a722169c45e79bef535cd5c8b0a25120d108b2bd1fdfb7c14ad114382e76
|
3 |
+
size 4096
|
._model-00005-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cef1fde03ecd52167a067bdfcda5a27e18ccc2131736111f0fb3caa75e7511a6
|
3 |
+
size 4096
|
._model-00006-of-00007.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5f575ba91a89567194ec551cb0db167eff57af2d2d3b253c87e990e8130706
|
3 |
+
size 4096
|
._model-00006-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d10fa729290791235ce627a26a9f7312031b5556ad01a28f01462ff308536ea7
|
3 |
+
size 4096
|
._model-00007-of-00007.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:baa0a2728098c72d270232ad499110b3d01ea93fbce11d9886b55a8ae46c3aca
|
3 |
+
size 4096
|
._model-00007-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b902b41efa179243f2035166ae65ccd0d7b2285e7a9aaaee4f552cf4ddcdeede
|
3 |
+
size 4096
|
._model-00008-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e492b53cdaa9faa78bf088b161aa7a6084a97d54a8d5b74e5f45f997a368a7df
|
3 |
+
size 4096
|
._model-00009-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f60e901fd1c1d3d566e4723856bb65c048b02e434bc0bdb0c2e4fb066071df45
|
3 |
+
size 4096
|
._model-00010-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:030d3e1a58d932c3f46e4a1808c9dac73702beba6be5d0e349a893290a71053f
|
3 |
+
size 4096
|
._model-00011-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09b44f0faedb0da5a3e51cabe7d1d9ab28da6e5bc717cf95f23f7f30c1a6816b
|
3 |
+
size 4096
|
._model-00012-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21781b2466729f1af747641516a3d0ce816f86f4462a3578d96732980e504fb9
|
3 |
+
size 4096
|
._model-00013-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e49126766a6b8280d546b02cb0fa0505d72a2c97579fb9099a8c0edebb52317
|
3 |
+
size 4096
|
._model-00014-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:416246206c87c9eb220f273166793541da0622fdaf1f33196bd3ec72bcad0476
|
3 |
+
size 4096
|
._model-00015-of-00015.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a4e76134e10c6b31d4dbfd9326b2d2e3b70d583a06fb95d486a29213888ffc5
|
3 |
+
size 4096
|
._model.safetensors.index.json
ADDED
Binary file (4.1 kB). View file
|
|
._special_tokens_map.json
ADDED
Binary file (4.1 kB). View file
|
|
._tokenizer.json
ADDED
Binary file (4.1 kB). View file
|
|
._tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95f56195e40a17bfe3fc486caa87cfaa8829255ea10768cabdd7331d1df5aecd
|
3 |
+
size 4096
|
._tokenizer_config.json
ADDED
Binary file (4.1 kB). View file
|
|
._zero_to_fp32.py
ADDED
Binary file (4.1 kB). View file
|
|
README.md
ADDED
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
tags:
|
4 |
+
- mlx
|
5 |
+
---
|
6 |
+
|
7 |
+
# voxmenthe/Yi-1.5-34B-Chat-16K-8bit
|
8 |
+
|
9 |
+
The Model [voxmenthe/Yi-1.5-34B-Chat-16K-8bit](https://huggingface.co/voxmenthe/Yi-1.5-34B-Chat-16K-8bit) was converted to MLX format from [01-ai/Yi-1.5-34B-Chat-16K](https://huggingface.co/01-ai/Yi-1.5-34B-Chat-16K) using mlx-lm version **0.13.1**.
|
10 |
+
|
11 |
+
## Use with mlx
|
12 |
+
|
13 |
+
```bash
|
14 |
+
pip install mlx-lm
|
15 |
+
```
|
16 |
+
|
17 |
+
```python
|
18 |
+
from mlx_lm import load, generate
|
19 |
+
|
20 |
+
model, tokenizer = load("voxmenthe/Yi-1.5-34B-Chat-16K-8bit")
|
21 |
+
response = generate(model, tokenizer, prompt="hello", verbose=True)
|
22 |
+
```
|
config.json
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"LlamaForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_bias": false,
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 7168,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 20480,
|
13 |
+
"max_position_embeddings": 16384,
|
14 |
+
"model_type": "llama",
|
15 |
+
"num_attention_heads": 56,
|
16 |
+
"num_hidden_layers": 60,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"pretraining_tp": 1,
|
19 |
+
"quantization": {
|
20 |
+
"group_size": 64,
|
21 |
+
"bits": 8
|
22 |
+
},
|
23 |
+
"rms_norm_eps": 1e-06,
|
24 |
+
"rope_scaling": null,
|
25 |
+
"rope_theta": 5000000,
|
26 |
+
"tie_word_embeddings": false,
|
27 |
+
"torch_dtype": "bfloat16",
|
28 |
+
"transformers_version": "4.40.0",
|
29 |
+
"use_cache": false,
|
30 |
+
"vocab_size": 64000
|
31 |
+
}
|
model-00004-of-00004.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41d8c9e29df3e3f8cd42217b486de53311741477a5e51de3b264ba4d64a9f4c3
|
3 |
+
size 1050673278
|