CharlieFRuan
committed on
Commit
•
c4a1ea1
1
Parent(s):
a54e3af
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +75 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q0f32",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 14336,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 128256,
|
11 |
+
"position_embedding_base": 500000.0,
|
12 |
+
"context_window_size": 8192,
|
13 |
+
"prefill_chunk_size": 1024,
|
14 |
+
"num_key_value_heads": 8,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 128256,
|
20 |
+
"context_window_size": 8192,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 1024,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "llama-3",
|
35 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}",
|
36 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
37 |
+
"system_prefix_token_ids": [
|
38 |
+
128000
|
39 |
+
],
|
40 |
+
"add_role_after_system_message": true,
|
41 |
+
"roles": {
|
42 |
+
"user": "user",
|
43 |
+
"assistant": "assistant"
|
44 |
+
},
|
45 |
+
"role_templates": {
|
46 |
+
"user": "{user_message}",
|
47 |
+
"assistant": "{assistant_message}",
|
48 |
+
"tool": "{tool_message}"
|
49 |
+
},
|
50 |
+
"messages": [],
|
51 |
+
"seps": [
|
52 |
+
"<|eot_id|><|start_header_id|>"
|
53 |
+
],
|
54 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
55 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
56 |
+
"stop_str": [
|
57 |
+
"<|end_of_text|>",
|
58 |
+
"<|eot_id|>"
|
59 |
+
],
|
60 |
+
"stop_token_ids": [
|
61 |
+
128001,
|
62 |
+
128009
|
63 |
+
],
|
64 |
+
"function_string": "",
|
65 |
+
"use_function_calling": false
|
66 |
+
},
|
67 |
+
"pad_token_id": 0,
|
68 |
+
"bos_token_id": 128000,
|
69 |
+
"eos_token_id": 128001,
|
70 |
+
"tokenizer_files": [
|
71 |
+
"tokenizer.json",
|
72 |
+
"tokenizer_config.json"
|
73 |
+
],
|
74 |
+
"version": "0.1.0"
|
75 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f14b339532db00e9bc7c7e59c8ec852f30a451e416014c2641b4bf10abcb157
|
3 |
+
size 1050673152
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91f6f93a88bed034ea0619146bf6b59ff41b89559234c34c957d0ffd46c824d1
|
3 |
+
size 117440512
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3cc252aad9004be03c7115cafa3f257699a2582b9a63dd6401b29a6d6fb2f4c
|
3 |
+
size 33554432
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04a5b032544ffd9f0ba84cf6d8a1a9624e5e255654f361dcb1e984095d863724
|
3 |
+
size 234881024
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b8fa3db884fefdf89f2fb97b34871e1e5142b4d406d5193f36c6390950d8689
|
3 |
+
size 50331648
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccc1183fb276fbaa19b6b605ef431cb8cc7c121983b3cb7ec813c9a135cc3d85
|
3 |
+
size 33554432
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:721adc4f5e4800c9610aef452319b1355b54c75e180ae833b4e4f0dc608519b9
|
3 |
+
size 117440512
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e2364eec38a8d615aaedd456ed6c03905d3cea931124e91b6cdfe879442ab6a
|
3 |
+
size 234881024
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e1be61e05798139f354f06a0afd3c0df204488e7bca9328382c6efc545ce7c5
|
3 |
+
size 50331648
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c70fffb364c73a6a62983852d91139eb8bbd6243c5dd0bf2ae0e324b88900cd2
|
3 |
+
size 33554432
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5883417a703a7dc8f6845f2cdc687d5b2bb0e7d1bced7a335336f9f632a3dcc2
|
3 |
+
size 117440512
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28efded368aa1896ab3587a08a621cc2b16b49944093b98244ab9227982b6ef7
|
3 |
+
size 234881024
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db332d605e56e376a844106dc0bcccf747774a6e57de5b9211fa49dde8fdb3bb
|
3 |
+
size 50331648
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d08df32045b31b3882e0e12c8e9660c6eeb4e32a6a5849b62b71b7b202146d47
|
3 |
+
size 117440512
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:622538ab9a924524681426852256fb332de852ca6ab36942ff087afaa258442e
|
3 |
+
size 33554432
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7025368bb28ccc15c6e7ea5ea0d14aafcf80ce2966cc46f03ee8d8c868710c7a
|
3 |
+
size 117440512
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c71d3506a88afad2de0d1c48c26e14d3746f80354bab7ef9f596ce8253f791af
|
3 |
+
size 234881024
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bed94198a4f8d3875b7770a6e86824bd062cf56f975127492893d76142e7817
|
3 |
+
size 50331648
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e664e6a4a1497f99afcc3afc5a27841f951fd2761dfd3d55ac04d50ed820fc67
|
3 |
+
size 33554432
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e49b7507902aa5408aae10880fd80f24bffffac9088c9f37304155cadb9f579
|
3 |
+
size 117440512
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e20595108ef3b11bd279fe7b8e955f2879bc112db0c1acc947e75b62e91c002
|
3 |
+
size 234881024
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15f74cfe2abc81e194abb568ee31388e0538e3b971155d1c358d18ce3bd72bec
|
3 |
+
size 50331648
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3374009b4ffa9d1c6611977322c38b3c6c9fc4fae713e58adde3921d7bdad6d1
|
3 |
+
size 33554432
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c02b1da9f14899c96b30dc81f499dd403a0ca7fad5b4d828f7e4628b908199cc
|
3 |
+
size 117440512
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4eddec28a35476ed521ad174c16f84f9256627afdffafada9a349549e71b9d14
|
3 |
+
size 234881024
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d158c7266a896aae5de3d15c498dc54a64c8f0cfb0e47c34354801ae1c202ac
|
3 |
+
size 234881024
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1180f7018c4678639973de0d633c75fdfff235f23b9b8b536d4a76c2e21425d5
|
3 |
+
size 50331648
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1e29e5052214ed24a6532c59425018f664417fca40b692eccb20b1cbccbdf37
|
3 |
+
size 33554432
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86ab4cca730f9d389f190793066cd7034d5ca6f40ed7a178736f7b6b18ea4bd9
|
3 |
+
size 117440512
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:265a48c9894f19a8b229d41c0d13221e4c5ef5a12f6016437e8f0e8bcd57a588
|
3 |
+
size 234881024
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb8c3d510eda6ba108cbacf281f1064e42db716dab5747e5c7f265aa4e337d6c
|
3 |
+
size 50331648
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d89938053a56197876b8814fa2ccb0239dcbf5089abd721122e04aed29ddc86
|
3 |
+
size 33554432
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cb192d38c861ae08a42a759ca50ba77006c8df1d9b1f4690cccdf538731c502
|
3 |
+
size 234881024
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3cf6c5d2b150d24040d029a66065c6808ba54ebc08b09c9829adb021e299bc5
|
3 |
+
size 50331648
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d88c96ecd30f3f330d76611265fa525daea07401efe34a0159f0135d917f296
|
3 |
+
size 33554432
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d0a434b1f68442d9b3060746179f9bdd964f6ab39c9ed5c8be574ae97c146c9
|
3 |
+
size 50331648
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:035523d91800cf542459860daf7b566108c16d07dee04ea53ace6559685b1896
|
3 |
+
size 532480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd93a97ffdb8439b6a03d99849f0b9cd214066992f383a71aa96c8c28710ea8f
|
3 |
+
size 33554432
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abca8a9dba25976720ba1c39f8fc762c71089bd98d56bc79f44ef34bfeaab095
|
3 |
+
size 117440512
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c09bd7c04d7574d10a7b91803117d61f12782b19ccb895c213d67b0eddb03ec7
|
3 |
+
size 234881024
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a85856ad6701cec95afb8233ec8759c5766dc7f42173b9e0e6e63d11cb4a44f
|
3 |
+
size 50331648
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddc408892cd14fef65802fecd1d3a6c3ea0d11d5dedd183a45a83c17642bd854
|
3 |
+
size 33554432
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10c24f6f22c779b39409622ace0e8ba4e5e4587a95f9c3879e4f72876839308e
|
3 |
+
size 117440512
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de91d6d84a671e2fba5b6083b6afaa1f0610459fdebf6c265e2ef1e6c420da18
|
3 |
+
size 1050673152
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d5a2d8ddcc035360c4f4803fb765c9c22a8e6c2143919704b57fe7d6992e617
|
3 |
+
size 234881024
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69abf6985ce1e66f2baddfb6749eb3aa458ec7ae1250b6e41b5fb2a521eb1373
|
3 |
+
size 50331648
|