Upload 73 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +80 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mistral",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"position_embedding_base": 10000.0,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"context_window_size": -1,
|
16 |
+
"sliding_window_size": 4096,
|
17 |
+
"prefill_chunk_size": 1024,
|
18 |
+
"attention_sink_size": 4,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 128
|
21 |
+
},
|
22 |
+
"vocab_size": 32000,
|
23 |
+
"context_window_size": -1,
|
24 |
+
"sliding_window_size": 4096,
|
25 |
+
"prefill_chunk_size": 1024,
|
26 |
+
"attention_sink_size": 4,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"pipeline_parallel_stages": 1,
|
29 |
+
"temperature": 1.0,
|
30 |
+
"presence_penalty": 0.0,
|
31 |
+
"frequency_penalty": 0.0,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 1.0,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"tokenizer.model",
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_fallback",
|
41 |
+
"prepend_space_in_encode": true,
|
42 |
+
"strip_space_in_decode": true
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "mistral_default",
|
46 |
+
"system_template": "[INST] {system_message}",
|
47 |
+
"system_message": "Always assist with care, respect, and truth. Respond with utmost utility yet securely. Avoid harmful, unethical, prejudiced, or negative content. Ensure replies promote fairness and positivity.",
|
48 |
+
"system_prefix_token_ids": [
|
49 |
+
1
|
50 |
+
],
|
51 |
+
"add_role_after_system_message": false,
|
52 |
+
"roles": {
|
53 |
+
"user": "[INST]",
|
54 |
+
"assistant": "[/INST]",
|
55 |
+
"tool": "[INST]"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
" "
|
65 |
+
],
|
66 |
+
"role_content_sep": " ",
|
67 |
+
"role_empty_sep": "",
|
68 |
+
"stop_str": [
|
69 |
+
"</s>"
|
70 |
+
],
|
71 |
+
"stop_token_ids": [
|
72 |
+
2
|
73 |
+
],
|
74 |
+
"function_string": "",
|
75 |
+
"use_function_calling": false
|
76 |
+
},
|
77 |
+
"pad_token_id": 0,
|
78 |
+
"bos_token_id": 1,
|
79 |
+
"eos_token_id": 2
|
80 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfaa7381abe835156a9fc2a92b7c86edb282f4b781b48891b578bd3e8fc1b0ef
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99f5954815be399512e0c0e73300adffdad7849960421d2ce2e80daa5f9f3f11
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d095cb76bd43d0357e6f5bdcad84b100d2a61951a54ee8a35fe49acb6637497e
|
3 |
+
size 30949376
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:863d768513f056960656d4815930cf7166a36ac237022787840435099e79793d
|
3 |
+
size 58720256
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6f9e8b605eceb6c05b703c1e48e55785522c1e1ea12d2baf27ac2de531bceca
|
3 |
+
size 25174016
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65a1fec7efa92f3c37ff0c7bfd0392d1b5471da32777292d674caaadfd879979
|
3 |
+
size 29360128
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8b769ef8543b8d409f7372bc0540c1b9a5bb1c2999988aeda22feb5754e37a6
|
3 |
+
size 58720256
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88c3cf848d21bda2199cb39c5ba9cc4c0ce0de66ab720e12c330cc02f9c04424
|
3 |
+
size 33046528
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3e13e87614f98bf5bd89f3d2ea8858f91628e0f11a2d26bfadda8016be655f3
|
3 |
+
size 29360128
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8da359630caf8f3682739296e6b806616366d28277a054221b0538113cc41ee2
|
3 |
+
size 58720256
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f863b399b1e4147f38576050b5a82ce52ba2901f8a835739049aa124b6ca930
|
3 |
+
size 22036480
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fc392c500cae9b973f97d3995fd2215690027f72e23a45152c8175903a46309
|
3 |
+
size 29360128
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4cf49a767cd6ba7d97be14fb6730e0012fc90a78bcb7a5fe3085b4777d448b4
|
3 |
+
size 58720256
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8390f525a9427d6482541b1f15a144ef84f632cd637990aa529e169d02e71b24
|
3 |
+
size 58720256
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af1331b4a04ffad23247b04e279d903cf6acdf3fd41f1fc37fffdcdb7dd529f6
|
3 |
+
size 27271168
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a13d214bb294dfe7ebdc776ff07fb8dc886d6f9cd60a3c8902a97f239e43a16c
|
3 |
+
size 29360128
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bffd419d5f5d2bfe1f2566bf69d0bd97c977be6b7675f912a6cd06696c32807
|
3 |
+
size 30949376
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ef2a7735f17119abe0e65db1edeb85bd63e70c76f86d5996521c9d644b0af8b
|
3 |
+
size 58720256
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d2159fb59eb1ee64d16ced8a62077aa584c755ddf09a5041c0ca097ec9467b5
|
3 |
+
size 25174016
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:730dd04a669f6ff7f1e517d2b7175efc336ebe04475fb10e504bda004b037444
|
3 |
+
size 29360128
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44d04df8952c03d4e1e5b70a308e97d3c5c057637c7b9a44fe0a5a31b1a6a850
|
3 |
+
size 58720256
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8695813a0762f49bd1cd6744a0408fda98c62806a377b26cc9e401cfe6763a9e
|
3 |
+
size 33046528
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef0b642239b8d3e96b45b1fcdbeaea52b3381bd97fb46bac77821aad593537a3
|
3 |
+
size 29360128
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:657360e5b54fa1fb932fe08c023c3f2e62848661a1f6a417c743f03e20dfe57b
|
3 |
+
size 29360128
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1df1464a9d91082fe7ae0a92e76741f19bfaa81443a811023e2a3dc17472724a
|
3 |
+
size 58720256
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fa54a57f01a5ff4e76ea5ff05ac029af29df66c3e9b525aa4829f1915541653
|
3 |
+
size 22036480
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9d4525fa0a018a2a5f3030bde0241632e8733a779a6a5bbe0008237798a5169
|
3 |
+
size 65536000
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bebf15356213a1cca07e8de0d54e589e41d48d0b806d3b4459574e69808b06d4
|
3 |
+
size 29360128
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dd170f12941b2edaa1dd3a12d255e2dd53c57664932b3b186eace2eb5358c51
|
3 |
+
size 31801344
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb49e9e544ee8c32887e9baaca0cfbff71dc2147a9046d09aa0bc0c47371390d
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c4796047e23beb75cf99289bb098bc2fcf1855f767663bddd637c229edd3e32
|
3 |
+
size 25174016
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba614bfb2d8dcebdbe19826c0291a3a4f51d7900971be05f885edf38e216813c
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49c8ef8973790fb2fab56c58cab3729880bb54c3ab530767011b811b4cf9ecef
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f99e61a0c6938fbe3d8658021570aed59f5d576e2524f857f545de068ded799c
|
3 |
+
size 33046528
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8db21c0dc5e904f9f1c1256884d13502354206ec6824891da791f155eade1faf
|
3 |
+
size 58720256
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:365856574720e9a042dcdd79ef8f79e8c4ce73373e8ae338f576ad79e1596ecb
|
3 |
+
size 58720256
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8be99590d595bf5cda7ced743d2fd26f8d654d4bf0e99202ab4aa19e49517094
|
3 |
+
size 32505856
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a45d7b16f7ee499f4b70becfc013588be841d1de984ec92734fcae8e38dcf798
|
3 |
+
size 29360128
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6998b23819d6d75a55ef86c56a8abf6807da30761ca2aa5848088291b672ddf
|
3 |
+
size 58720256
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00e293151d73c452ee60640a5cd26ed15aa865f254db75804fd968a19d5fa7a5
|
3 |
+
size 33046528
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d930f3fd385df82dcad32764fca88a01aa8cb570f64f4a8e033aa65e8b6585e5
|
3 |
+
size 29360128
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06912c8b1337b67699618e9da0898408a6a3debfe4a872a2210d472e89af9ada
|
3 |
+
size 58720256
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c05b2421a37a1673e1ac38bef360cf2ede7d5b990cbb2df9b27fd9e2ed551857
|
3 |
+
size 22036480
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35e2353f7cfe664b971ec7384417137db95fd6a170e17e3291872720024d5e0d
|
3 |
+
size 29360128
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a994ea433b38548120800dd8f227365b76b1f07abec163013aa59e035849d4b
|
3 |
+
size 58720256
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a98c1e47e22d83e5b0ebc9612c307416e462c4a2d3cb6235ed4f8e40f8c313dd
|
3 |
+
size 30244864
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:273ab674a5e510ff4396a8814d1a291990d5a4d421017125540ace2c33aae511
|
3 |
+
size 27271168
|