Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +82 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
- params_shard_51.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,82 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f16_ft",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"rope_scaling": null,
|
15 |
+
"context_window_size": 4096,
|
16 |
+
"prefill_chunk_size": 4096,
|
17 |
+
"num_key_value_heads": 32,
|
18 |
+
"head_dim": 128,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"pipeline_parallel_stages": 1,
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 32000,
|
24 |
+
"context_window_size": 4096,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 4096,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 0.6,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 0.9,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.model",
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"tokenizer_info": {
|
41 |
+
"token_postproc_method": "byte_fallback",
|
42 |
+
"prepend_space_in_encode": true,
|
43 |
+
"strip_space_in_decode": true
|
44 |
+
},
|
45 |
+
"conv_template": {
|
46 |
+
"name": "llama-2",
|
47 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
|
48 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
49 |
+
"system_prefix_token_ids": [
|
50 |
+
1
|
51 |
+
],
|
52 |
+
"add_role_after_system_message": false,
|
53 |
+
"roles": {
|
54 |
+
"user": "<s>[INST]",
|
55 |
+
"assistant": "[/INST]",
|
56 |
+
"tool": "[INST]"
|
57 |
+
},
|
58 |
+
"role_templates": {
|
59 |
+
"user": "{user_message}",
|
60 |
+
"assistant": "{assistant_message}",
|
61 |
+
"tool": "{tool_message}"
|
62 |
+
},
|
63 |
+
"messages": [],
|
64 |
+
"seps": [
|
65 |
+
" ",
|
66 |
+
" </s>"
|
67 |
+
],
|
68 |
+
"role_content_sep": " ",
|
69 |
+
"role_empty_sep": " ",
|
70 |
+
"stop_str": [
|
71 |
+
"[INST]"
|
72 |
+
],
|
73 |
+
"stop_token_ids": [
|
74 |
+
2
|
75 |
+
],
|
76 |
+
"function_string": "",
|
77 |
+
"use_function_calling": false
|
78 |
+
},
|
79 |
+
"pad_token_id": 0,
|
80 |
+
"bos_token_id": 1,
|
81 |
+
"eos_token_id": 2
|
82 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99c5948294f5f4ef55b27e744b90c4b34f96915ef9014f528a5499eedbe45562
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dfe83ab22cc1256532555f346de9775440670a824ac254686ef1903fca04d8c
|
3 |
+
size 45088768
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8c9f1d3f6b0ee21dc6a4e3ae0dda0a99625f26446355c80026921270a19a094
|
3 |
+
size 45088768
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:463d307aafda1f54fd817110cedfb65f85f0124f98014372ddbcccb1c6be7984
|
3 |
+
size 25165824
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2193b1873c9766c46372810e611697e4cfd2bcd93bcd920b25d031dc8b636cd7
|
3 |
+
size 31034368
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:109932fea666ce78f45759fecd76b9a224b4f71991fdd88b00e18f6609659af7
|
3 |
+
size 45088768
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:973bb0f68fee479ca56f527145ade212fc35658e948915247eda707681e88b8d
|
3 |
+
size 25165824
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cb60031a59946aa6c600aa18418b0be6d7c69384539b5b0053dc954eb798318
|
3 |
+
size 31034368
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e69818aa63dd47fc8f9420b69e33dd8a7f4870dd7f750ac461747cc8bc3e260
|
3 |
+
size 45088768
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8b440ba4bfab86a8a96d43f18b485b83c864d99271351f8ae3fc23e516a8cb2
|
3 |
+
size 25165824
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8a70b098aa3b4dc10a78dd66220c47185a78ea04356e84fd275c34de7acc5cf
|
3 |
+
size 31034368
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcc803bd50e5acc8218b8295b583b5dffdd38ec4a570dc37b8e04827a63712c2
|
3 |
+
size 45088768
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b20cd01574f294801ca3f064cba4cf4c2683bb3209f496cd044b052c6bbb14c8
|
3 |
+
size 25165824
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:601be62d5e13d5d1bd19b6220a1f54b4aa508b026256128a918304b22fb09bdd
|
3 |
+
size 25165824
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39690b28ba7015033d6e00667d1104ca7b599567ffece5df504c6cee7b33438d
|
3 |
+
size 31034368
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed59ce16412df999d145af851e9d910b8b887a8f6ca8e1817bffe12f8c113d6f
|
3 |
+
size 45088768
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3392fa32503a4f2622cf10251bac5678a4ac81f323bde1b08bbdc1b02629a03
|
3 |
+
size 25165824
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1c194dbef63ed17e63c40e0479c64b0010351d4782e205a3e2cbaebeef2e063
|
3 |
+
size 31034368
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58b654596fdc4059658d1b43c1f089524b4b6ba6543543b2950497760f2eaa46
|
3 |
+
size 65536000
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d905e4d77e98eab9ba45868eaca7fa488b28ac9ed18203788387bda7b0d97ccf
|
3 |
+
size 22544384
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7806f9f223cf3e59ab9ecd8310e6bd450b6ff64785301e0aee870dbebae787a9
|
3 |
+
size 45088768
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:432c55ad0cec6b8633651f3978e3adec5aceba1caa50f745d8a09349c7d1138c
|
3 |
+
size 25165824
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ac1ebe4b155d771d4e9fa78613f62558c4b201e0738291cdc8afb1eaf0302c
|
3 |
+
size 22544384
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a542bae3b8f6a0a2f08de726573cd5b98fdbfc531d197f2412f40309fed26dc
|
3 |
+
size 30829568
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd75b0817f752618538f01f5841198f0f650816711029f48238015e1c6b476d6
|
3 |
+
size 45088768
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29c233e3c75895f73c2d55f9500384222133867f799dbd051dda496ddcf99f5f
|
3 |
+
size 25165824
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0f9c999136e6182cb5fa3e3ee0ab582aa536492e0ad2bf54d405d484d986a8e
|
3 |
+
size 25180160
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ff71141f0a336cc2ed354e0b70eab0892288c8375c0061bf7c403b95bd93298
|
3 |
+
size 45088768
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b98ec14d59abfe66a5be6bc6189a8cf06acb0ccca5b59eaa0aeb70cb7c3b680
|
3 |
+
size 25165824
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e561abffe6b1467919762ca14bbfa02fd4546103c39629b93c9f99a830ee8a53
|
3 |
+
size 31034368
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:539a759f3bc5985c0ea26eb6d81585f1e7b0404828cbcc53b844f07a588e47be
|
3 |
+
size 45088768
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cae2fca4d26be303a5754b5cf50bde7ea35c2ea1dc97662862e7c8c78b9a9ebf
|
3 |
+
size 25165824
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58f0096a53f3d1f469d537a10e3fb62d3bd15f0e1a79f0e779e617b74aee0b2c
|
3 |
+
size 31034368
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9937fe3bab84979b0ff53d186f0f2a68cc54ddc62d0446f7787da4abc4a1fdbf
|
3 |
+
size 45088768
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:529e44b446ba64ee889d0e1d687e2bc45424303a37328f0d2a39e55bf0759195
|
3 |
+
size 45088768
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eacc91c01dfbd8b7d671b9b674bcc205242bd735d3163ad79c67a55edb5a6344
|
3 |
+
size 25165824
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f7908c75b3f145a38202ec036b6011e6b22f364f1d3e708ad5822f4dcf5e826
|
3 |
+
size 31034368
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e61ab8f97d001f748526d17bb81b900b6d7029748a4d7a9f77e217f7f2ef7a78
|
3 |
+
size 45088768
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00427dac47d4e03ad465bbcd9455b7f37be384fe0a4320cc0a07695763fb7112
|
3 |
+
size 25165824
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f17fd31e78adad510886db988a01986e769e7cc2a9f85c627ea8bfeca01669e2
|
3 |
+
size 31034368
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2529db9c4b35e688b98a359e6e9f82cfced52e9c9973c59af34c2fa46da71890
|
3 |
+
size 45088768
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcf90bf62bca5533568a0f0b365cd18d87678e810c81a0c34b0c38ac970dff07
|
3 |
+
size 25165824
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0573604f925374618787d8d6f3075e076ea565e2b36d9e454dfc0c3a902f794a
|
3 |
+
size 31034368
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f9da1954b5aa8618f3ddacebedfdf8c2079f9f7506563e4cb6ea74fe52258c0
|
3 |
+
size 45088768
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9313738f9d22714bc87b5e1ef53915a7e79889b86419fc7524639280432218f1
|
3 |
+
size 25165824
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b2e190e554e41f523fa40c346c01bc07be7e706d11aeca1b9f07ecf6079507e
|
3 |
+
size 25165824
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2145d8740164f04fe60d20b02d512928bcd36cf27fc701928ac540eb93c2e29b
|
3 |
+
size 31034368
|
params_shard_51.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e392c6927c8ad4789e9e226a1e593f654f3209b660adbaa75cf2173a33072cda
|
3 |
+
size 45088768
|