ruihanglai
committed on
Commit
•
b35f31d
1
Parent(s):
4b80df6
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +75 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_51.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q3f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 14336,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 128256,
|
11 |
+
"position_embedding_base": 500000.0,
|
12 |
+
"context_window_size": 8192,
|
13 |
+
"prefill_chunk_size": 8192,
|
14 |
+
"num_key_value_heads": 8,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 128256,
|
20 |
+
"context_window_size": 8192,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 8192,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "llama-3",
|
35 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}",
|
36 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
37 |
+
"system_prefix_token_ids": [
|
38 |
+
128000
|
39 |
+
],
|
40 |
+
"add_role_after_system_message": true,
|
41 |
+
"roles": {
|
42 |
+
"user": "user",
|
43 |
+
"assistant": "assistant"
|
44 |
+
},
|
45 |
+
"role_templates": {
|
46 |
+
"user": "{user_message}",
|
47 |
+
"assistant": "{assistant_message}",
|
48 |
+
"tool": "{tool_message}"
|
49 |
+
},
|
50 |
+
"messages": [],
|
51 |
+
"seps": [
|
52 |
+
"<|eot_id|><|start_header_id|>"
|
53 |
+
],
|
54 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
55 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
56 |
+
"stop_str": [
|
57 |
+
"<|end_of_text|>",
|
58 |
+
"<|eot_id|>"
|
59 |
+
],
|
60 |
+
"stop_token_ids": [
|
61 |
+
128001,
|
62 |
+
128009
|
63 |
+
],
|
64 |
+
"function_string": "",
|
65 |
+
"use_function_calling": false
|
66 |
+
},
|
67 |
+
"pad_token_id": 0,
|
68 |
+
"bos_token_id": 128000,
|
69 |
+
"eos_token_id": 128001,
|
70 |
+
"tokenizer_files": [
|
71 |
+
"tokenizer.json",
|
72 |
+
"tokenizer_config.json"
|
73 |
+
],
|
74 |
+
"version": "0.1.0"
|
75 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d440efd5790be523cb06e7b836da3d36a446d24f72015a002986c111a8fc8746
|
3 |
+
size 213417984
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:291e6743a2e3d545c1316f8006098b41092ad76fde5aee9d4e33a3b200b19033
|
3 |
+
size 23592960
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4736f711a96642f7ab204cb23f5cbe38acf9f18935cd61eaea5f5135b434c96d
|
3 |
+
size 32317440
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00e0c21068fe59ca5f504cd0ec0cc9bf60d90fc2492684a97100d5809fef110c
|
3 |
+
size 23592960
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b7139e203d3ba63bfa246dd9cd6d018055906f8976cfa3cf582074810645390
|
3 |
+
size 47710208
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71ab073b57865edc9e9915e8050124fa2c5577ff3293b104019b0962c2f1baaf
|
3 |
+
size 25567232
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a96c1875aa19703276834319b35478441f768de049e66891ed2beaa63c0f90df
|
3 |
+
size 23592960
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd40c2ec1f1888579388e6da842f99dfa8b14d837d23004897e5ff40ae187d72
|
3 |
+
size 47710208
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3aab939ef8372237cb3f071d8018bbcb212721749ac6ab091f1bd2eda68e3578
|
3 |
+
size 33439744
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c3e954343854a5a700822074d4cc1d4296aa7c0bd30ac09ad907f0e8b3597a8
|
3 |
+
size 47710208
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca1eca0b6b770439fe89d9f166cb2673b48c0189d6b8cd0e41eec1985c92f525
|
3 |
+
size 32317440
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca79ebdcee4a40a150f4b672fba775f89d169cfcb8a3895226e130ec5cef74e5
|
3 |
+
size 23592960
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:795a22e5d86953688b538b19fa285f0be32571cf35e749087e09531d5f089ddb
|
3 |
+
size 213417984
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e82fd8dbde0ac64bf1bf5fd5e68029a5ed8fda3a5b8cb04485899d6c8db1d9d6
|
3 |
+
size 47710208
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4c472a377c593c963fee410725b38b120eb0c49e666aa14d283ed65013c720a
|
3 |
+
size 25567232
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3c0c61e7cc9d264a4d42a785df0aa38bfa5f421d20d2bac7cdf30480c519b7e
|
3 |
+
size 23592960
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73a06e26a1aaa2f5ec776d24c18bfe1b98a4518b386847f5b0d9a67bc28d4f59
|
3 |
+
size 47710208
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3f431b8d4fdf0435b52b6c5af65487d98e36b85a8f8e45e8e798d1c260790a9
|
3 |
+
size 33439744
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5dd12b9a9f0e87b06137801968a01089827c28057219484c3fdb9ec08b2bb3d
|
3 |
+
size 47710208
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a3410e769683f1be6166080e458b6c6b9e002e572eb269329d94adcc731d9c1
|
3 |
+
size 32317440
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce170492f13c016a41a3ff689c3fe229526d55dc36d0250bb16a6cb093168988
|
3 |
+
size 23592960
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dce3c6b27a4a610fe7ff6f794031016370f85fd8ef39a8c5eef2360deacfb158
|
3 |
+
size 47710208
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3518e91a309ac86a60d686fffe9691cef1866a910f3fb9978b79136474a76e5e
|
3 |
+
size 25567232
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a978e7eb1fb0b6be6e99c86060776d19378f3dfaf00cb3e2bc74e8079c253cc
|
3 |
+
size 23592960
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f7bb74888f23423e2c5cb5c3780ac5dd2ad76498371ccaebd29db7f54200703
|
3 |
+
size 23592960
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6ff74a0cdfb331197c88caace2b39d452e65028b0d1bac384cf03e515304602
|
3 |
+
size 47710208
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1d41ab1d3ba169be64ddd86644db947d3e77711d129b9ff3f2fea13f72ff3db
|
3 |
+
size 33439744
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd751fb37b4205607cce85fbd1893952cfd939dd2d7b5c5f0fc11750d2b446ca
|
3 |
+
size 47710208
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2eec3323970a7ea03b3466859cf6880f52b94ef7b2e15c1a78975474923e36d4
|
3 |
+
size 32317440
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56214dae78059e711bac6f5f43f2cd99706b62359ee51a469263f4083c0b7ca2
|
3 |
+
size 23592960
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9dd20fc4a72a5c9ae1a4b2d56e216c1f5901faeb8ccd6919c6ed20df6e7224c2
|
3 |
+
size 47710208
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e86d4262fb37c023ab1ca2e7ae1a2987cdca133f2ab66736321d2be785227dc
|
3 |
+
size 25567232
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab59308ec212257760ccc4e41f28baedb6cd0bef11fe7b744acc0ea659842492
|
3 |
+
size 23592960
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7860fa33979c770959909d4599890eb840a654995263f7c53783988449d91ee
|
3 |
+
size 47710208
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ae5bff229bf846ce48f7e572295cc5f931379412effed5d0af9fba8aa3ec9fb
|
3 |
+
size 47710208
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a8f1507def28616f602a916b52dcc80bb6737e9fbe81547ae5e3569ad739f56
|
3 |
+
size 33439744
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74755475922ebaa3b63012cb311192f35495b982d66168dc93b942849b992efe
|
3 |
+
size 47710208
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b74103e7060f01c113cde4dc3280f923466b4da6252fce2f76fc4bd8738f86c5
|
3 |
+
size 32317440
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59b17c2405849f6ef55ccc459e305e307626686ecb1ca18da0ecf7035fcdcc60
|
3 |
+
size 23592960
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fef9e6f47a7f929497663d75dec9f6ebbbdf48c0b4025782b100f397441bb14
|
3 |
+
size 47710208
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e9b55301656293839fbbb0f1f83e42e8c0d1251ea1c42c95f629a811a616021
|
3 |
+
size 25567232
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7339d978460334d8646ce5782ba4a19f7e6904c95ea651eea9fe63aec4db4f2d
|
3 |
+
size 23592960
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c905cde0ca0a460f61ca91634df921bf8e84f6651313b7338c12d6b57632eb0c
|
3 |
+
size 47710208
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c84a27b7a9c653dd04f3696557017a4d794fd8ab30fb6cb0dd573d85088daa44
|
3 |
+
size 33439744
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e9a974cf89699f439fc2befa0e5e143c5dc109947ffd991658951deaef13294
|
3 |
+
size 47710208
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f48571a496534c3ead3d501e633bfacf853754305056ffcd2b0ad01c3102d58f
|
3 |
+
size 32649216
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc88da79b0b40a53a42d6f159d45891f881df697f4e05b6ef2a8b215fedf7349
|
3 |
+
size 32317440
|
params_shard_51.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18e6f31bdc611f8790a53ea43180e08650d1b828fe02fc9e65bf7d7a5a114a81
|
3 |
+
size 23592960
|