Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- merges.txt +0 -0
- mlc-chat-config.json +72 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "qwen2",
|
3 |
+
"quantization": "q8f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_act": "silu",
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 6912,
|
8 |
+
"num_attention_heads": 20,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"num_key_value_heads": 20,
|
11 |
+
"rms_norm_eps": 1e-06,
|
12 |
+
"rope_theta": 5000000.0,
|
13 |
+
"vocab_size": 151936,
|
14 |
+
"context_window_size": 32768,
|
15 |
+
"prefill_chunk_size": 32768,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"dtype": "float32"
|
18 |
+
},
|
19 |
+
"vocab_size": 151936,
|
20 |
+
"context_window_size": 32768,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 32768,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "chatml",
|
35 |
+
"system_template": "<|im_start|>{system_message}<|im_end|> ",
|
36 |
+
"system_message": "system A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
37 |
+
"roles": {
|
38 |
+
"user": "<|im_start|>user",
|
39 |
+
"assistant": "<|im_start|>assistant",
|
40 |
+
"tool": "<|im_start|>user"
|
41 |
+
},
|
42 |
+
"role_templates": {
|
43 |
+
"user": "{user_message}",
|
44 |
+
"assistant": "{assistant_message}",
|
45 |
+
"tool": "{tool_message}"
|
46 |
+
},
|
47 |
+
"messages": [],
|
48 |
+
"seps": [
|
49 |
+
"<|im_end|>\n"
|
50 |
+
],
|
51 |
+
"role_content_sep": "\n",
|
52 |
+
"role_empty_sep": "\n",
|
53 |
+
"stop_str": [
|
54 |
+
"<|im_end|>"
|
55 |
+
],
|
56 |
+
"stop_token_ids": [
|
57 |
+
2
|
58 |
+
],
|
59 |
+
"function_string": "",
|
60 |
+
"use_function_calling": false
|
61 |
+
},
|
62 |
+
"pad_token_id": 0,
|
63 |
+
"bos_token_id": 151643,
|
64 |
+
"eos_token_id": 151643,
|
65 |
+
"tokenizer_files": [
|
66 |
+
"tokenizer.json",
|
67 |
+
"vocab.json",
|
68 |
+
"merges.txt",
|
69 |
+
"tokenizer_config.json"
|
70 |
+
],
|
71 |
+
"version": "0.1.0"
|
72 |
+
}
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64ccb06ab87d84dd755b61265bd8d4b7a03a2d7fed1e2eb9350b7455fb8fbba8
|
3 |
+
size 388956160
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:504c7e301257a8390b7d104dce78863a4608a3c5242581f240d105cf669faac3
|
3 |
+
size 17694720
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3c542743dae7d68cd814c1e3fb3ab9dee61083963cf6d428b555e341ef9c1c2
|
3 |
+
size 35389440
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f61fb7cba6c0b3427590f55d0457d2ff78849b1b257a996d81a8e12e6a1cc0ec
|
3 |
+
size 19660800
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99a0dff5eb38cb94e5e470573e8140938d66cefe283d513b8cd977661c20fe2e
|
3 |
+
size 29230080
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c40c1d493ad2ec98cad4806033039d212eddffac73caf3cfa0d022179e2ae537
|
3 |
+
size 35389440
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d42c136d6af7e92e081585b9d5bc1a2e271c0f3fc189abdc2c803b52a6cd67a4
|
3 |
+
size 19660800
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6c19ce05bf81441ac559f54b693cca422e70a01365e7ac40c9b2fc7e7d2bb26
|
3 |
+
size 29230080
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aca3012f47a411a869efa9077d447ef0e30b625f079cac5664660fb6fba5c228
|
3 |
+
size 35389440
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a39e4f287ce91db804532476ab6e135e9f582c129cd6121271e3d1e4f9d30524
|
3 |
+
size 19660800
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ce5982fb6a9f29eb9e84d9f7eead423de742b51156c1cf69d91c6292e1248f8
|
3 |
+
size 29230080
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f714d774e4b053e6e1c6a312e93ebefd79b3cbb71aa73dbe3bce705d6945ae8
|
3 |
+
size 35389440
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:927a14f1a5062a97c908f4979ca1bcf2ce90b87027944967c44aeb84a98bdbe7
|
3 |
+
size 35389440
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6827885159b98d207b1ce585e6dad521d24c23300d1eeabc685aa23a00cc00b8
|
3 |
+
size 19660800
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f733f83426d09901c0cdf4b2e7510ddcb3699e1ccf50450d2853ad1d1f51915f
|
3 |
+
size 29230080
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2999b2eca6ff062c4504065a4006922f42c3bd8b87d470cdc0a3db5d6c8cc418
|
3 |
+
size 35389440
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:716646dfcccadee483c7644b30a69a329c2949314b546eb8b4b223adc98f3030
|
3 |
+
size 19660800
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e79a5e5d48e60418d88d2ed4374812fdff558e0ab10a5db07643ecbe0f3071c
|
3 |
+
size 29230080
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4800de296234f4d0bbc30d5d8df6656325f2ed8e49f856a3f9b65acf5d6da162
|
3 |
+
size 35389440
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:675eff2d4ff19dcb9dd39436645edb4583de848f5bbcb3a308dfc4c5fa30038a
|
3 |
+
size 19660800
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ccef7e002df6301b5b3577f4486bf82ac20bca21e6492df784dfc3bba016b4e
|
3 |
+
size 29230080
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5444c609db0c5e32b7f4f1135a687ab4286668db213a3e99f2393d5473daf44a
|
3 |
+
size 35389440
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b05b45648ba380c5305365ca51a24dd67ad5831a7e18f18200cb908738835d5
|
3 |
+
size 19660800
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8366f010acd893168abaa78aa4d44f760a00dc93aed60d53fde437981eeddd5a
|
3 |
+
size 27637760
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3afcdba35d48b209b3178b46909550a0cf04da911ae1f0e34da8354e7b0dcfc9
|
3 |
+
size 29230080
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6aa3dbb17d442da375ac1c277efe531e69b35f9a4c2f035312e07019d3df79e8
|
3 |
+
size 35389440
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b31add17a679040d233d8ec769cf2f947b5cb01645af52b89caff6029d4218f7
|
3 |
+
size 19660800
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b9f2750d662c22f67e8da6d4c530826c1139dac4c465980f2fcfa4841a3d517
|
3 |
+
size 29230080
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48279920150a85e3a72f2f5022c7c64e86aa12328b468622443df7a71dd7c605
|
3 |
+
size 35389440
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:923754d108ba7d54aea6ebaf7a7fa2d91314ba9a48f2a73f4d80569f8d2faf8e
|
3 |
+
size 19660800
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82d025aa8f60087ef259b65d6d349503635d76e03cc8a5a853b2ce9adf3674bf
|
3 |
+
size 29230080
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0f5289e7f45766354b4be23aa083d4757bb78f6658edebe57c000be82fc7df4
|
3 |
+
size 35389440
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eac4bf24bd3225661f9bb85308b7f4816724bc05221ab6a8457cb49d7fcede04
|
3 |
+
size 19660800
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87f2be3aea8d5b85b820cf68a6bb5dd5d3cf05f8e56f77a1ffd931680f01cf8a
|
3 |
+
size 29230080
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30db99544324083d38325cd671fdb6d7fd93072234c7d629573e3f290a1fad46
|
3 |
+
size 35389440
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7308162e120f049cab2349f471067c695510fe9640be1aff9274b2dc8fb4a26
|
3 |
+
size 35389440
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b52ed9f917fe1e479f83698ffaa875820e4219b7c58318e10c4be36de49b9b8
|
3 |
+
size 19660800
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfef9fcba36b7579a8c7867de357ce3488947f352dfac9008741fa6f943b6573
|
3 |
+
size 29230080
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdc54f9697f91969a515c36a1495d6e468147396ed615846cbc211a2e41f4455
|
3 |
+
size 35389440
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcb776c858821037e252ba76762cb32792ab61ec67d230592c6562f4d46e062f
|
3 |
+
size 19660800
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:417f07146428f44bac01b5f699f7995948118a6d0dcdb7b5e81c28ccbf4c290a
|
3 |
+
size 29230080
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fe78a4884677810acd46584b86b59c7b794757c004865d50917494c107f36d8
|
3 |
+
size 35389440
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64059975d3452702186b56e7bb32f8c9eb92697f8389af45ef6ec674462c1359
|
3 |
+
size 19660800
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af810da92bf9d833884ae60fa709cfaa2e42d6c0f78a60c18590c398e8127083
|
3 |
+
size 29230080
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63ea34897a522e94d32512df9c4109d955048e0cadb36d4a3cb1dfdffaa7e376
|
3 |
+
size 35389440
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d43beea01e48deecbcb2d68b4d203913cebaf39613f60ed55c15ca641b8dd27
|
3 |
+
size 19660800
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:480f078f86996ce7df525f2c486fb6a239cbb509891369a7f61ff29e097c308a
|
3 |
+
size 19660800
|