Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +46 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mistral",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"architectures": [
|
7 |
+
"MistralForCausalLM"
|
8 |
+
],
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"eos_token_id": 2,
|
11 |
+
"hidden_act": "silu",
|
12 |
+
"hidden_size": 4096,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 14336,
|
15 |
+
"max_position_embeddings": 32768,
|
16 |
+
"model_type": "mistral",
|
17 |
+
"num_attention_heads": 32,
|
18 |
+
"num_hidden_layers": 32,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_theta": 10000.0,
|
22 |
+
"sliding_window": 4096,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"torch_dtype": "bfloat16",
|
25 |
+
"transformers_version": "4.34.0.dev0",
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 32000
|
28 |
+
},
|
29 |
+
"vocab_size": 32000,
|
30 |
+
"max_window_size": 4096,
|
31 |
+
"temperature": 0.7,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 0.95,
|
34 |
+
"mean_gen_len": 128,
|
35 |
+
"max_gen_len": 512,
|
36 |
+
"shift_fill_factor": 0.3,
|
37 |
+
"conv_template": "mistral_default",
|
38 |
+
"pad_token_id": 0,
|
39 |
+
"bos_token_id": 1,
|
40 |
+
"eos_token_id": 2,
|
41 |
+
"tokenizer_files": [
|
42 |
+
"tokenizer.model",
|
43 |
+
"tokenizer.json",
|
44 |
+
"tokenizer_config.json"
|
45 |
+
]
|
46 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd80d68df5bcb1471284c8f6d6c3d87404034ead3286e4f5de656344f3707240
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d842cc2529abd21f7991ba71bf8cef3d71adde4b15da2f8f058b178fae0577b4
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffb95c1553583f1de173f31bbfeff2f94b7320a38290450566230ee0bb9b7def
|
3 |
+
size 32538624
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c5fc7fb74ebcf3f3779965e642a4beeae71c1d6d0d8b49d7a915af63f1e8510
|
3 |
+
size 26214400
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46bce3ae9fba391bef682b90fc184e446da53e21e9ab9d3464d60556c609d361
|
3 |
+
size 29360128
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cca1d342ce87c88e7b335bb3c47abac417e4f4d6c3ca4b761b3ee97aa00e498
|
3 |
+
size 26230784
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a482698789e23f56981b89463deafd69006b69f7dede7927635c2b7e168f5943
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bac6526382f2bd8f4da19e1bad3fa98a74282f55eaf24915613dfdf75c47b9f
|
3 |
+
size 22036480
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b725b5c98973e2bfccb28298181d0ab4cfac01c0339988979ce0e120dd37a6b6
|
3 |
+
size 29360128
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:484f55be96d3e31d83c628c7f493be88829c663a48ea7183033a7da8ab712490
|
3 |
+
size 26230784
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b834380cafb8eab0e47041dcf144fad4f64af851097865348a82428adc393a3
|
3 |
+
size 58720256
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbb64c2afc97eaeb9e4d59e9064fd01a532843649edf00eba8ad23ef08181db5
|
3 |
+
size 22036480
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82d2b573239468a8a4d7f710f4d006065d738f19d4db76a01586a2f4b207ef06
|
3 |
+
size 29360128
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9414ef7fc6f9aafacbea6a059cbb87300e79e3e4d08d335372eb353509b86e2d
|
3 |
+
size 29360128
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c324ef7e1415dcebe4223844d2886ea58323e74c53d268aafed67be5fdeecab4
|
3 |
+
size 26230784
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfd41b4dddf4d0254c7763720a1c5741d85e5cb41ac96ea15cbe7b45256ce253
|
3 |
+
size 58720256
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bff364d5994e70300f12267411744f686417a9f125d0d2101e0b1c8d4e7a679a
|
3 |
+
size 22036480
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce7dbaa94487b7c5c4982b314f4eb1a4563541dd6c394c9ba0b7448a262e6791
|
3 |
+
size 29360128
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:387bab144593dbf780e1a99870d06ba2e35639f24474dab4b94e1d51649a56c0
|
3 |
+
size 26230784
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb5bb29638df066d6b46be5faa181926067c370d1cc6a8fc6e397b407c5dc11c
|
3 |
+
size 58720256
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e373e2f70295eeb5793499a30d016c470dd0ae6bf98b0b0d8710ac8ed8750f53
|
3 |
+
size 22036480
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:738f5c1d90dc3b5c0a4ae23f30366c9fb7867af2d79be8c05879b0d0b461fd29
|
3 |
+
size 29360128
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a53b41bbf06d0dbdfc418c036de4654b40bf97b71f19bad8228ab346f6b737d9
|
3 |
+
size 26230784
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35d9e8ccd248afda0fb09912d5d4b293df9195e702fcb2d4e0bacca28a3d235f
|
3 |
+
size 58720256
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1814c474a67f07de6b8abd17a25177dae7c185c23b25d7152976b5a7f457db55
|
3 |
+
size 26230784
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c1e0d083f0a28946fcf4cdd67f122643a6e2c2a8beb7d969fe1c2da34b8c78d
|
3 |
+
size 22036480
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c84e15eee10cd0faea1db73ddd1dba15a8416b9a224e3c9b29a1ca702b8d8371
|
3 |
+
size 29360128
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91d8ca418f855ec9d33af35a0ce374b850eed041821b05685f7d42800c985d21
|
3 |
+
size 26230784
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d960194a2b8f9bad171c70f35837cf27c451b5a484748e410426f6a9704fd8a
|
3 |
+
size 58720256
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25566162a2d72d54f28876c61d151488f60ef7f69b10864da6d04422b43b8740
|
3 |
+
size 22036480
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e234fb9d48226fbffa3a553388c296ea9cba5681cb11464a57fb43e23854f24b
|
3 |
+
size 29360128
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f4d742bf6c00d4ac5fd3a8eb7b145c681ab146f5030c5bf340bc5a8dc109e02
|
3 |
+
size 26230784
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ecef9c4a3c04e7c14ed96f8a4496d1f718c117b25754bdfc5b78a8cab30fcf5
|
3 |
+
size 58720256
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:266ae7c9abb5d3d09e7daa865f46db173aae90d76054f09a751ef9e0a2f331a8
|
3 |
+
size 22036480
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0573b6284c0adb803873be405ea86cd294e60b4e187d89740408a722cd4dc337
|
3 |
+
size 26214400
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:213692f8abc2c0213a8a599ef42ebeee5b603eef56816f6b98dd258d2a69b081
|
3 |
+
size 58720256
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23c5056bcfb346822140a6530955489ce4a419816ac398333b8ef55164edfcbb
|
3 |
+
size 22036480
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6368e5bd5d8a7983ebf1b1c6aed2ca5a3fb417d6a6b77fc7d90087b984a03726
|
3 |
+
size 29360128
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1745f0b311f1d2f0f2689cb52cca829d2986a0a3cc50afe5863c007086fa162
|
3 |
+
size 26230784
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75163b0b77e9dc33ed87df01d8d5de127c4a7e956ec370eba6c3797f5cb96497
|
3 |
+
size 58720256
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb6aaeae570dd08c43a628c0f04951dca2091c60e4c646f3ecd75e470a2e745a
|
3 |
+
size 22036480
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a145cbfb52aa620fa5418465e9e019eb6e1d85b4a80ccc60b69e39ba27df5bc
|
3 |
+
size 29360128
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d62fb1665e280a64d3a823d47618603771a8441fe4a5db6ca2fe51702e414a2
|
3 |
+
size 58720256
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:817f9514955fd32a9db401701de82d203c1c7da9f0de252721e1ed556c2eb9c5
|
3 |
+
size 26230784
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8c9c02cf67856b07ba108f7bb1dc47802c07a55153ed28ed78d2a7d41e0adb4
|
3 |
+
size 58720256
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f9c0a1233a0047455b250828d27e05bdba3ce33564148e5213de768ccd8bfa6
|
3 |
+
size 22036480
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa617f3e6e611b58a9c12144a4769a71d6a33810369f423d40d190f07d76c473
|
3 |
+
size 29360128
|