gavinzzhao committed on
Commit
28ea432
1 Parent(s): 529cf79
This view is limited to 50 files because it contains too many changes.   See raw diff
mlc-chat-config.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "llama",
3
+ "quantization": "q4f16_1",
4
+ "model_config": {
5
+ "hidden_size": 4096,
6
+ "intermediate_size": 14336,
7
+ "num_attention_heads": 32,
8
+ "num_hidden_layers": 32,
9
+ "rms_norm_eps": 1e-05,
10
+ "vocab_size": 128256,
11
+ "position_embedding_base": 500000.0,
12
+ "context_window_size": 8192,
13
+ "prefill_chunk_size": 2048,
14
+ "num_key_value_heads": 8,
15
+ "head_dim": 128,
16
+ "tensor_parallel_shards": 1,
17
+ "max_batch_size": 80
18
+ },
19
+ "vocab_size": 128256,
20
+ "context_window_size": 8192,
21
+ "sliding_window_size": -1,
22
+ "prefill_chunk_size": 2048,
23
+ "attention_sink_size": -1,
24
+ "tensor_parallel_shards": 1,
25
+ "mean_gen_len": 128,
26
+ "max_gen_len": 512,
27
+ "shift_fill_factor": 0.3,
28
+ "temperature": 0.7,
29
+ "presence_penalty": 0.0,
30
+ "frequency_penalty": 0.0,
31
+ "repetition_penalty": 1.0,
32
+ "top_p": 0.95,
33
+ "conv_template": {
34
+ "name": "llama-3",
35
+ "system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}",
36
+ "system_message": "You are a helpful, respectful and honest assistant.",
37
+ "system_prefix_token_ids": [
38
+ 128000
39
+ ],
40
+ "add_role_after_system_message": true,
41
+ "roles": {
42
+ "user": "user",
43
+ "assistant": "assistant"
44
+ },
45
+ "role_templates": {
46
+ "user": "{user_message}",
47
+ "assistant": "{assistant_message}",
48
+ "tool": "{tool_message}"
49
+ },
50
+ "messages": [],
51
+ "seps": [
52
+ "<|eot_id|><|start_header_id|>"
53
+ ],
54
+ "role_content_sep": "<|end_header_id|>\n\n",
55
+ "role_empty_sep": "<|end_header_id|>\n\n",
56
+ "stop_str": [
57
+ "<|end_of_text|>",
58
+ "<|eot_id|>"
59
+ ],
60
+ "stop_token_ids": [
61
+ 128001,
62
+ 128009
63
+ ],
64
+ "function_string": "",
65
+ "use_function_calling": false
66
+ },
67
+ "pad_token_id": 128009,
68
+ "bos_token_id": 128000,
69
+ "eos_token_id": 128009,
70
+ "tokenizer_files": [
71
+ "tokenizer.json",
72
+ "tokenizer_config.json"
73
+ ],
74
+ "token_table_postproc_method": "byte_level",
75
+ "version": "0.1.0"
76
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66cf234fbae0f57ecd01d9fbbeed633e0d302153225896e528db36ebe4db5122
3
+ size 262668288
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e485e3fde43c7d1307cbf50ad6826d3f97a501aa72e6487e52f87524a0e88125
3
+ size 29360128
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30f1686163d1789bf1839ecd5495f5cebd4a1bb0307d54f05ba9d647f475a7cf
3
+ size 33046528
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5af93afc21295fe84f9317b73b90c9880f6093758c52918940421ec595f86fa4
3
+ size 58720256
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f51a0f7e3fdd9e682cb58d95239c5baae53fff0ada9b9d5dbd2e216a1aae27a8
3
+ size 25174016
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e84cebd6c1e568c0e572616ecf9c8ee4ad3a9f283ca861e7321cb1fcae8bfa4
3
+ size 29360128
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:679ce78370d38ddee975d9be6d6a4b92149da87aaab6efe00657a4512013bcd1
3
+ size 58720256
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:904fc26ba19b621db8e41bb5940246fe8f880912ee98c5576019347f147332f8
3
+ size 33046528
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:795014b84afbfda18b4325d389e4d914e712e18c2e8609e9096a55790ec01f42
3
+ size 58720256
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9013fcc86639f35b9b5623ad100ccbe710813d1345a5012ad49af3f2c6a3dd56
3
+ size 32505856
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f7b838ba07689220492e894a3af0aecbef07108e8f710f0e4845a293a08e5a5
3
+ size 9437184
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:309b8e0ffb601b4ce105c166119a234b75dbf409c5a48f07f62757cf89f9170c
3
+ size 29360128
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9042b6d24e233bbea8cc6e4554877675990fc89fa8be32bfbe4858b1ddaabcc7
3
+ size 58720256
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ff34ced0d4fdc4dbe93801f7fde97e7da7de16920c48b8e104d8b882c4032e5
3
+ size 22036480
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8f26fef1dd1bf72f022059c995aa38b77f950e6fe6a48c60d15acbc0dd4ee76
3
+ size 29360128
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43b05a806e7d721001f80cfde52b6896fcebae36f882a0281795bbb1ac77c512
3
+ size 58720256
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7731a1fa6a6b051f70155cda4f50e6c411c39705a134849eae2d4075141dbe7
3
+ size 27271168
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c8ff4d730b1cc9f71d5d3fdd7c258e596a6e72f89e77f48a479d472ae1b5fa6
3
+ size 29360128
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3ad346c6cea92f821fa001739196b2993fc6f18c27d5aa440522b9ec6dbdcdc
3
+ size 30949376
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6633ff370c53fe97ccb8de61a966043b9dfd7e577f57785e6660afc275a255d8
3
+ size 58720256
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38c94f900373ebc06db0651c9cc77e55d78fa889f30e6ec40e9d31aadd237d1b
3
+ size 32841728
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f360b01d8eec1890bc21da0c941b787f39974985cd8ed84efc32ef7e0463865
3
+ size 25174016
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce20da3231690da76194794d6902c4a8a51d8348611a585df8e0836c54b2ec6b
3
+ size 29360128
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73ca07dfdcbaa459f10766e825e5f561470d84acf402d082eb80c9cde618f52a
3
+ size 58720256
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5ce09919b4da6c36c027b9612b3b6019eb7d34386fc0c8c00115d3e10752c3e
3
+ size 33046528
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94761ef8e7102bf3e57d35f7c6a0e216268b3cee67be8117aee8e534651f36a9
3
+ size 29360128
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87d1ec0d2649218fd7dbb8c83cfcabaacf5b96f25038cff14c357a1c7b747b39
3
+ size 58720256
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88eb08a666ddb5a12fd3e90c6a24384a8887401a80fab846da9cee57cb7ee1d4
3
+ size 22036480
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:517db97e75e57432c64a5c816fae024e714c6572050aa14b062fc51cae42c86c
3
+ size 29360128
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6b09bf316bc597793dd9a61015a47079ca458a7ec937cf104d245ef49664637
3
+ size 58720256
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7c177087091b85ec4a96ba20c5c6c1e51dc17bfa1c3629ee9919c45f6812b37
3
+ size 27271168
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ae85e2a78886cc352afe5bd9fdd57eb6d21e98ec87b505b18e4c7567ad5cb20
3
+ size 262668288
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65db8ef4202f45019d0c577cb4ed9c47736899296c6ece09369ee191f5ddcca4
3
+ size 29360128
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3263e94bf2bdbbb804d7eb466f41054a5a4ad65e236c3d59bbec42238bf29f0
3
+ size 30949376
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08b4004210599576b6905df996d7ed0c3e9c61351e99bf7e82cc7aefc324f040
3
+ size 58720256
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfdf4533f21fdbaf7cd30a7389f0a87d3c38f353470fd3813863814f39c2871a
3
+ size 25174016
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d23a2aca478d9446b3411b1793f670aa6890a51e091f9fbddc17daaae9375def
3
+ size 29360128
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3402121e72aa542b99139836955b61a186b42a00f087d25342a51c71247d85d7
3
+ size 58720256
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e33e2736306aab9fa716f32170bed791fb6b41047f8e7434e2f325435e1a03e7
3
+ size 33046528
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ffea25ce85d9e3c13f3cd1fa61c8717c133de5015d88a2109625e36e6ff3476
3
+ size 29360128
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3b2b3ac21fdeb23252c234afed81e39cf7878d753e8bc23c8881daad64bcdca
3
+ size 58720256
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76916e0d543ff8de587ec2e7d8e0871f5afb5f5bd69dd6ad8bc0d33ab9b8d394
3
+ size 22036480
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ff89bce064cb336431dd1d3ee186b985f408afb78795371d9d2847156bcb98a
3
+ size 32833536
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bb0e3e32810201adcc32187531e0e1276ab59e7c0ade8087f4b168fad1d271a
3
+ size 29360128
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13ee86a481d0d294649e1a42eb335206bc6636903c0d9aed6f3e2d13628e20d7
3
+ size 58720256
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd9fa550ee63874c61e539ef23fc729ca1314bbd1bdad2e7f8481cf527b52add
3
+ size 27271168
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c13b3e3d318e48f0546463c7ea139b4583bdbf64165c081ded0152421800ff3
3
+ size 29360128
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9532e2542be7b2f7d0c76aa902cb0c421c4b76fee600d3c6f87e649949906cdd
3
+ size 30949376