Upload 188 files
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +82 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_140.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,82 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "svdllama",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-06,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"rope_scaling": null,
|
14 |
+
"pipeline_parallel_stages": 1,
|
15 |
+
"position_embedding_base": 10000.0,
|
16 |
+
"context_window_size": 2048,
|
17 |
+
"prefill_chunk_size": 2048,
|
18 |
+
"num_key_value_heads": 32,
|
19 |
+
"head_dim": 128,
|
20 |
+
"tensor_parallel_shards": 1,
|
21 |
+
"max_batch_size": 128,
|
22 |
+
"ratio": 0.4
|
23 |
+
},
|
24 |
+
"vocab_size": 32000,
|
25 |
+
"context_window_size": 2048,
|
26 |
+
"sliding_window_size": -1,
|
27 |
+
"prefill_chunk_size": 2048,
|
28 |
+
"attention_sink_size": -1,
|
29 |
+
"tensor_parallel_shards": 1,
|
30 |
+
"pipeline_parallel_stages": 1,
|
31 |
+
"temperature": 1.0,
|
32 |
+
"presence_penalty": 0.0,
|
33 |
+
"frequency_penalty": 0.0,
|
34 |
+
"repetition_penalty": 1.0,
|
35 |
+
"top_p": 1.0,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.model",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"tokenizer_info": {
|
41 |
+
"token_postproc_method": "byte_fallback",
|
42 |
+
"prepend_space_in_encode": true,
|
43 |
+
"strip_space_in_decode": true
|
44 |
+
},
|
45 |
+
"conv_template": {
|
46 |
+
"name": "llama-2",
|
47 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
|
48 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
49 |
+
"system_prefix_token_ids": [
|
50 |
+
1
|
51 |
+
],
|
52 |
+
"add_role_after_system_message": false,
|
53 |
+
"roles": {
|
54 |
+
"user": "<s>[INST]",
|
55 |
+
"assistant": "[/INST]",
|
56 |
+
"tool": "[INST]"
|
57 |
+
},
|
58 |
+
"role_templates": {
|
59 |
+
"user": "{user_message}",
|
60 |
+
"assistant": "{assistant_message}",
|
61 |
+
"tool": "{tool_message}"
|
62 |
+
},
|
63 |
+
"messages": [],
|
64 |
+
"seps": [
|
65 |
+
" ",
|
66 |
+
" </s>"
|
67 |
+
],
|
68 |
+
"role_content_sep": " ",
|
69 |
+
"role_empty_sep": " ",
|
70 |
+
"stop_str": [
|
71 |
+
"[INST]"
|
72 |
+
],
|
73 |
+
"stop_token_ids": [
|
74 |
+
2
|
75 |
+
],
|
76 |
+
"function_string": "",
|
77 |
+
"use_function_calling": false
|
78 |
+
},
|
79 |
+
"pad_token_id": 0,
|
80 |
+
"bos_token_id": 1,
|
81 |
+
"eos_token_id": 2
|
82 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29815774f62ac838ba8e8efdfca108bc1de046f4424492dc7dc64d87fa34e6f6
|
3 |
+
size 262144000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa20d5b36df5903ff396dbb98d0c63887b75e340ea5992f74b403f1fe2fda1f8
|
3 |
+
size 26287104
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96537c0390fdfa6a994455ec417da8788810849b333d6317488739c4271f0aee
|
3 |
+
size 33546240
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca0d6a1706796ca61782f0ef470a55face9336d600c6eb77a26358bc9aa67998
|
3 |
+
size 29360128
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb294554f5d8373c4c30582632fba4106d5ce2a7e643681822d2d45ea6f5fbce
|
3 |
+
size 33546240
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd1393cf013251226cd7e3a6283cea50edfaaefdb20f478d60b938f5f5d8bcf5
|
3 |
+
size 26287104
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4d35766298ff9a55421965b075fa60a2a456101f4a6322481184d70cca7760b
|
3 |
+
size 26287104
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87953b9e9121d8ba1b6f20acf882f47643d1a4a25554786e3ecd54d4795e2187
|
3 |
+
size 29917184
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01d4ce7fe470d141c59b00176c48ef0af24621ef0aab1bb94361383aa86b341b
|
3 |
+
size 26287104
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56f2cbe3bba44e6b52a1c6000ab5ddf3d011ea6fd666a12480f18f6fa9a1f6ef
|
3 |
+
size 32989184
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f6d5da6e8475042c3f17aeee71525344386ea1ce241d6ec20052a9f9ba77b48
|
3 |
+
size 33546240
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:256612e854cfdec27465dbb41c17eccf5d0b0014aafa7f8d6ecb941aec82a570
|
3 |
+
size 26287104
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:951c8c9c1eff0e179690366d86d19a7e1a1fd306d3a35b09977341320f2944b4
|
3 |
+
size 26287104
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4a8b9a5de084ccc459898cd75c3b6f1dc35829623078ee1a36566321bff58fa
|
3 |
+
size 26287104
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f69848b16a241266252af8c57b32f046a98e256489c8e8054471672c190ed366
|
3 |
+
size 26287104
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ade2bd5c9d141c90062619bf37ba7d918126f6a9531da9f0e9f7cf017c865a2d
|
3 |
+
size 26279936
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5630d3a91ca0b2dda2f97699094527f8252e15992c43b6fc3a3edf5f2f518886
|
3 |
+
size 29917184
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4314b2443e7b24a9ac6addbb8eddac2b6e2a345625d788403d8d4e9a869b111
|
3 |
+
size 33546240
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c13808ec2a9132aabb5b50fd6ed2582c0f28bb5a96dc942f147b97be57bd548
|
3 |
+
size 26287104
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc4a3bf3972447e1b25adeb3ecfed23fe0b7ac008d17e7c435fa77286ddb1964
|
3 |
+
size 26287104
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c35092e6901079cb978377a578300db40779667bc010e1d5ff6107cfbd8744bf
|
3 |
+
size 26287104
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85a4164c076545d2cb0093ff82b97793c9851df60cf344c4ee99f127ea9a02b2
|
3 |
+
size 29360128
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b134df67ca5a0a92ca563ff417bdf67c6535bd3b4d50019b6f8e73690d1c387
|
3 |
+
size 33546240
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ab052641cf2077d790c5b6e7de807de3f125c04509c41ccbfba62d5c1113a45
|
3 |
+
size 26287104
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cc071471ff0af6ceb34d901ba709ee0131c6a96040702cafbbe261c4b0a2fd8
|
3 |
+
size 26287104
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d83892b2304e6f46535d9b59ff8dbbacc52dfbeb9ebbb6ebfc85e02135fbe287
|
3 |
+
size 26287104
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2bfb7d76add6f584e671324db40b23091c7058a766a7ec6f48ca3076ff030504
|
3 |
+
size 29917184
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:900c8da9574e982266563491481b51bd44e66fcfe14fde17ad76c37475f6d2b8
|
3 |
+
size 26287104
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:584fc2389912ba808846b8877a4c2f5cce8814f7f2f93887a2948af7ed8c60e4
|
3 |
+
size 32989184
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e8745af279101920356dea73d97ee32762d26a10fd2504bca99809c1b78a244
|
3 |
+
size 33546240
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b9f70a90870a306de573397f3c428fefe82667de50dea66eb0bd590d10df966
|
3 |
+
size 26287104
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d118ee4e6f38bad62792b7478ad000a33289967ee2c741753451e98d05a6bb63
|
3 |
+
size 26287104
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3dfd8b6e23427e7ca9a9767f7bf81ffc6cc2cead614b7d5490d599cd5a3e099
|
3 |
+
size 26287104
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87f7cc6b74e9201b36c9f52c585dafa86eebb124450f942c3806361a44c9976f
|
3 |
+
size 26279936
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30099cf851f5bbe44d151db9a7d7c35a95dfb09a7aad25dfb12464bb8fc49d53
|
3 |
+
size 29917184
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c7be34f99c912cd907dc1bd88e1998dce7b38925dd4629aef642dd57296e55f
|
3 |
+
size 26287104
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f92bf46a4f1ad06d95873be02f44f975a16bec741fecf0ee5b2e241f61ec593e
|
3 |
+
size 33546240
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c93a42e4dd0b86ac68da15c51e8ab07a5e1257dd31ace2578910509d1154a17b
|
3 |
+
size 26287104
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4b6d192a59cf854b6062e982323a23911042cff82247fed18a5113490a0821d
|
3 |
+
size 26287104
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0007edd9e8f823b9fe8f64b9785fb48abfabba5c01152864a34ee02965edb2e4
|
3 |
+
size 26287104
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:430f0c58bd7079a749e2d9fa406b5907f28345fca6f084af403aabbdd5143f4b
|
3 |
+
size 29360128
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b1cf1ee0a3fec332524df3e31488baa4d0b1a147b1e1f48a281158dee9cd74e
|
3 |
+
size 33546240
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cf89394b4630b46b3c6d3585a8efafd801bcb2f50cf873360aef565d1743b6f
|
3 |
+
size 26287104
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87f89e0e6d70ef1b334b08a55b0a7083fb1d4ffe7418341c65e5ca50fd933a82
|
3 |
+
size 26287104
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82a0ecc0be218b4de1b7cd80ef393d49ac40ece9da0b9f1db37ca8ffaa20f097
|
3 |
+
size 29917184
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfc28ee8885e93fa1742690c8e172ac06869beac01ac1d47300547c1116cd318
|
3 |
+
size 26287104
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99df31bec60f3f0f01012cce7b012e9d74469b53339d07f85dea60a1f1951440
|
3 |
+
size 29360128
|
params_shard_140.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:504ea976450f97e5f83ef191799982b7b53d8594e6a6b17ba76f24708766d602
|
3 |
+
size 32989184
|