ruihanglai
committed on
Commit
•
3446c74
1
Parent(s):
63b6e65
init
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +78 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_51.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q3f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-06,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"position_embedding_base": 10000,
|
13 |
+
"context_window_size": 4096,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 32,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 32000,
|
21 |
+
"context_window_size": 4096,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"temperature": 0.6,
|
27 |
+
"presence_penalty": 0.0,
|
28 |
+
"frequency_penalty": 0.0,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 0.9,
|
31 |
+
"tokenizer_files": [
|
32 |
+
"tokenizer.model",
|
33 |
+
"tokenizer.json",
|
34 |
+
"tokenizer_config.json"
|
35 |
+
],
|
36 |
+
"tokenizer_info": {
|
37 |
+
"token_postproc_method": "byte_fallback",
|
38 |
+
"prepend_space_in_encode": true,
|
39 |
+
"strip_space_in_decode": true
|
40 |
+
},
|
41 |
+
"conv_template": {
|
42 |
+
"name": "llama-2",
|
43 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
|
44 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
45 |
+
"system_prefix_token_ids": [
|
46 |
+
1
|
47 |
+
],
|
48 |
+
"add_role_after_system_message": false,
|
49 |
+
"roles": {
|
50 |
+
"user": "<s>[INST]",
|
51 |
+
"assistant": "[/INST]",
|
52 |
+
"tool": "[INST]"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
" ",
|
62 |
+
" </s>"
|
63 |
+
],
|
64 |
+
"role_content_sep": " ",
|
65 |
+
"role_empty_sep": " ",
|
66 |
+
"stop_str": [
|
67 |
+
"[INST]"
|
68 |
+
],
|
69 |
+
"stop_token_ids": [
|
70 |
+
2
|
71 |
+
],
|
72 |
+
"function_string": "",
|
73 |
+
"use_function_calling": false
|
74 |
+
},
|
75 |
+
"pad_token_id": 0,
|
76 |
+
"bos_token_id": 1,
|
77 |
+
"eos_token_id": 2
|
78 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eb91ecba3825638f6aaf3bec122a92ab7041d1e87185437b74c8ccb533bd7d8
|
3 |
+
size 52736000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b2637b1e5bcbf1b548b88380731623568c1962e3679fcab98e6dcce99fc176f
|
3 |
+
size 36282368
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac36dbda27d15f04f8b6ebea8061bd628ddafdbcc3d8c1eb12cc224ec6114afe
|
3 |
+
size 36282368
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1167ab4f5e20d51342768bca53a6f7a879b691bfd1830d3ec22d9777ba888418
|
3 |
+
size 30482432
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1280125d1b0817b12fc239530b939d2d4e47a7e4a75d04770e6a72d99bdfc97
|
3 |
+
size 27325440
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d7639c037c50af4320325116a6b9f4df58cd6e79546416ecb17f5e3dac4e358
|
3 |
+
size 36282368
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67308e559021443f0b20ffc9dfa0ad16faddf5e39167b150031092ca74773f6b
|
3 |
+
size 20250624
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d914ca47a339e62d3a7ee6ec766a5df0d58e3fee8213920946eb14b0df80bdb1
|
3 |
+
size 32494592
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38de89d0866d31d9362664cf4b2dbb570e3f1e274cf1cc6b7624224e0984c7dc
|
3 |
+
size 36282368
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de394c16dcc457a984a84b9e6b3f713bb05044309a1ac1e8c77ae516c60d9e76
|
3 |
+
size 30482432
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe055848d31bc82f637ebd44a2b1a681424cb0137d18c3c709958379e6e45fa1
|
3 |
+
size 27325440
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ab0bb2e789bde0bc44c205286ee6eeb4ccc6104e548029557893bd5646ae1fa
|
3 |
+
size 36282368
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:347249cde4a6042b1de709bbacd765c060b23196407c8bb76df382010cf2f7e4
|
3 |
+
size 20250624
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88d4b13ec5f459f14572b60e3cfc3a6672a63a6e4199dc71387859aca74c229e
|
3 |
+
size 20250624
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb86545023e27c5939d4511a9d35fdb5a5576de7ba74b9deb21334f3e463a670
|
3 |
+
size 32494592
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:630e725d84afa5e625e80c80e4f7e7518ca1985f3bf9b5efa7ec0a5f040c6c31
|
3 |
+
size 36282368
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03f6dc4f9d0e01bd7c58b3f1ede56b89c64503a98fda8937627c969746987bb6
|
3 |
+
size 30482432
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8c05f0e1c9e32822bbb369bba01e52c3e681327268653223d6b7f02cc7439ce
|
3 |
+
size 27325440
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38b775547675408b2217f9418eb1acd66e002e496907a44174028b14677b02ad
|
3 |
+
size 52736000
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35143dfe68cb17f78e4281d474a9371f96fe26d0c097de4f800c215b83bb1e55
|
3 |
+
size 32290304
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f4d518cc018e956418182317d4116b7c6c2d4563b491db8be5e64341ba41542
|
3 |
+
size 36282368
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:612b06d36b9912a7bcb7a002fdf66654eb90b9b2161c4c00053fb47c0cb7b579
|
3 |
+
size 29586432
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2c5dba3cf66b104450248842a9f8d65ae9e858985d2d11b0a638db201ea2cdb
|
3 |
+
size 36282368
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abc97d149958a661410312c89f50b50e5a76eec36351711d70b483ba76253fa2
|
3 |
+
size 31492608
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:960c28c1e36a93081af5660c5f69563eb06c83a42f2348309d4a81c67092da7d
|
3 |
+
size 20250624
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:995a6cbaf79bb18cef57e91854d575268b5d3889a309394dd07eb18c3a29f0ce
|
3 |
+
size 32494592
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6ec48fcd2c7d609057298bbc9a139f5347cb1ab774a9ec15537b0ca4fabcfc1
|
3 |
+
size 36282368
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16b3b640cc50c1ce8f08b927b2d254df6f435d4e4adc7233fd454f7ea6f324b6
|
3 |
+
size 30482432
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:418570949a43d6e88fab9957de88b76855e4d19b53e78fa3856ad04355d74210
|
3 |
+
size 27325440
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eed990ef90fa2eb9c3ff756670504f191475060f950505238e30d88021e0ab37
|
3 |
+
size 36282368
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3b19ae04c0c18e30d9f5a407713e6c22154eeafd0a9a9c2094b4b667fdfcdce
|
3 |
+
size 20250624
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3789734beb97df7e995862ce7a72032c45ef5236feb2f4f9701871aec657c43
|
3 |
+
size 32494592
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65d37a8fea8c0343bd54735f33452bc12acb9513a7af441d52a1fca39222ee5e
|
3 |
+
size 36282368
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4cea86a9c84d753a8502cf7ecfeaf5115d998767b6004842d78a37a7aa94530
|
3 |
+
size 30482432
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5c69f8657516fe90da7b1e0e9f9239560f18b43ce76aaf56da74f24f0e196ec
|
3 |
+
size 36282368
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26c4b5b5504e4cee3c62b1cdac87af0da54216f5d8a1497480322b2aa003ac27
|
3 |
+
size 27325440
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0a0aa996ebea5a839ad7834c43acefd049d65a71882d6f7e645d5cb86bce973
|
3 |
+
size 36282368
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9997fd7d2c17dea900519488c1d0a5409f351d463cd0bca45c1e8f26c1d4a72f
|
3 |
+
size 20250624
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:781db267bfea9ec330cd501e94da41f38ae5038d6bad848e70c964d83535d0ac
|
3 |
+
size 32494592
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31cf7be757e18d5d23c50f73b3960ffca5b95a5115522fde69f56d4a86f96e21
|
3 |
+
size 36282368
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f42d3e6d9045ed0311e972e47465a81b8119b6adc1a8225a8e4d007a631b136e
|
3 |
+
size 30482432
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8865ef637e125f51c0d9325f2e8042c7b37e188f59e1c00a787a8dc9a16577ce
|
3 |
+
size 27325440
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b3430105837bd490ba5f8234a0731580ff19db2197515d79d30b9be94473192
|
3 |
+
size 36282368
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf906c61c6b0b473563edc1b128e058cfb84d3dcc61e2efe40d4f64037c80880
|
3 |
+
size 20250624
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef7f376dd98b0fb07b84d0baa6e883f4c0635a09d45d0414f702ee88abe2575b
|
3 |
+
size 32494592
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ae1def83a5d3fc7856040147b5e74ef0cc8dfe01222a401b5a12a63ac8153b9
|
3 |
+
size 30482432
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0b80161e9b0fb54a487043e2b1a982e333d5509f22886f20395b076200d34bf
|
3 |
+
size 36282368
|
params_shard_51.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afb7eb01f9f689b35fa32052ce302b6853d8f95c3de2e314ebaa96c201dd9bea
|
3 |
+
size 30482432
|