Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +42 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_6.bin +3 -0
- params_shard_7.bin +3 -0
- params_shard_8.bin +3 -0
- params_shard_9.bin +3 -0
- tokenizer.json +0 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_neox",
|
3 |
+
"quantization": "q3f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"use_parallel_residual": true,
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 10240,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"layer_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 49152,
|
12 |
+
"rotary_pct": 0.25,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"context_window_size": 4096,
|
15 |
+
"head_dim": 80,
|
16 |
+
"prefill_chunk_size": 4096,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"ffn_out_dtype": "float32"
|
19 |
+
},
|
20 |
+
"vocab_size": 49152,
|
21 |
+
"context_window_size": 4096,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 4096,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"max_batch_size": 80,
|
27 |
+
"mean_gen_len": 128,
|
28 |
+
"max_gen_len": 512,
|
29 |
+
"shift_fill_factor": 0.3,
|
30 |
+
"temperature": 0.7,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": "stablecode_instruct",
|
34 |
+
"pad_token_id": 0,
|
35 |
+
"bos_token_id": 0,
|
36 |
+
"eos_token_id": 0,
|
37 |
+
"tokenizer_files": [
|
38 |
+
"tokenizer.json",
|
39 |
+
"tokenizer_config.json"
|
40 |
+
],
|
41 |
+
"version": "0.1.0"
|
42 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ec53756cbc3d1756e9f8dfe69a27d235b4241b0ae9882ca7bdee99930c8cc4a
|
3 |
+
size 50331648
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b73dee6d8b1d61b41cce8b1a982ba73220899449834f5b62bbb5c08b5db6c46c
|
3 |
+
size 29945856
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8e1984b979ce1aa3f571ffd551b39df7010a64688a4cb808d47cd260d0416d1
|
3 |
+
size 23639040
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c9b6fc3798194dead7d1d43aac3e443d91f7213cf5f3d824deb6739a6945b7b
|
3 |
+
size 32501760
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b81c2606ff1bc2614401dce063badc413f5d29e7feea94c59903a2b83bdff5e
|
3 |
+
size 26593280
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc6189b48aa278cbaf8ea05998a8e844552c23cc3cda8af458432348c3a1f393
|
3 |
+
size 23633920
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ef24c5643ca366cbe65533a551ad1859f45ac858a85199424769cf0f20d88b7
|
3 |
+
size 23639040
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cacc74451d2263be100a0d02813127c1f588088d461ca89b8d81c5a88f8d215a
|
3 |
+
size 32501760
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ed8a0282169172822a3a1c21f88164510c058c505ebfb3c0cbb9837068d59d2
|
3 |
+
size 26593280
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5acc47ec19fcd12c950f298cfd84e74aade62f68a6fd0c294318294fdce4abcc
|
3 |
+
size 23633920
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d609b70f38c67794ea06a6f28503a5c9a0cef9bc879b302501ac97d723b52f1a
|
3 |
+
size 23639040
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f860980482b8b895a6e7f9975ab6a69b6cedc9463d7f3529ba1ecdc2efc238d1
|
3 |
+
size 32501760
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9e2ee69437ec91c7d965ef54c46ccf99360bc743ea7dbccdcf9855c337a1bad
|
3 |
+
size 23639040
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93df2f9b64553628a8be7c9453ca885c65dc3ca8708ff4d40ae85666a51928cc
|
3 |
+
size 26593280
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b8d9e8f2b4ebcb1c5d083f24f0d877bd19f227dc5fcdc6c220cf158e12173f6
|
3 |
+
size 23633920
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4637dc900d5726fe57cfa758c858828ee09775648b2bee74f6102887d3deeb05
|
3 |
+
size 23639040
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b88c82f043b160dafd2ee5e43603f5afa5f918c980a7f1eaf20a0874107646b
|
3 |
+
size 32501760
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d0e120d8ca12be03dec4cf5db3769f10c3ee48439fb3d634a893813c664c1dd
|
3 |
+
size 26593280
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc1edce35eca09c2040a6369fc4ee1fac449c55bb229637864b41729c7881df5
|
3 |
+
size 23633920
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14c4f6885cf8b98eef5a2ac018aa0b77888df59917f0c9deb629a39617eb2a8f
|
3 |
+
size 23639040
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:564fe8dba2b9be48c717777aad08f03efab147f979a63e80277a681cbc1fdfab
|
3 |
+
size 32501760
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b01895567921f8a37784a35531bebc805cb540c3787b4e57ff53fb24917494e8
|
3 |
+
size 26593280
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e58ed2b866a6350fe931570f3d94ba0cbf8ce435f6661fb47ca483d42954dda6
|
3 |
+
size 23633920
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53aed6e9db33089f934554d30b21039ac5bc92ff8803f610461a2e8634a9f96f
|
3 |
+
size 32501760
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:786eb78183b1632935eb288f934f4cd334cc55f008be34f87d4b4848cd17cf0c
|
3 |
+
size 23639040
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07ad1190633b8e6e8a20dade93d7b2d87b2b18df71be4a2d68431b2c2771af15
|
3 |
+
size 32501760
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:943db8c8c7febbe0024afcaeb22f4eb451436a35dc81e8c2237a0447f3292172
|
3 |
+
size 26593280
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ccb5db867200c4254c01bc5c937c8137b827f1f55829bd365086eb94e5df620
|
3 |
+
size 23633920
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:828087099033c0f62f9b46c95708be9d5a16f9d2c8a7ed64a9ea96a91f76b3a2
|
3 |
+
size 23639040
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9504492dd784d755429ffe69e4bd7de34b3df41f900ae7fc6d3d07a0fd06046c
|
3 |
+
size 32501760
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2024deba522e64339d3bd8bf4fa0ce2d346feb618c84c080b9f835890bb29d9
|
3 |
+
size 26593280
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abe586757269b265b5d4c05aa2febd5a35d95cd6667581f8f21f04b52d7b1b8a
|
3 |
+
size 23633920
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d732ac45f682752ee1f22e1204dc77f098ba8733ab3cf367149c49d35a0a637
|
3 |
+
size 23639040
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ec3585019d53f10ee561806ddda54a8fc0e93348500e8efde14d687381935fd
|
3 |
+
size 32501760
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc71e0baf82f52e059bfa1dc400ceeacdc5515f253a8a7e59518f02422d4c786
|
3 |
+
size 26593280
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2f273c02c16ac6d18f791f31f7ac944969c4e41f570d30fe20979cfa796571d
|
3 |
+
size 26593280
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbddbb2794d381554b9e0c6e1c5350f772ceb10abcb36fbeed574017a03856b8
|
3 |
+
size 23633920
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7329baf7e52306fd1cd8ac168eac58708807b380e9c2cd369b16315404ce836d
|
3 |
+
size 23639040
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b48f0b2fbb001eeaea7d1527d7998ed5d88da2ea6fa0bc1b5ece24fb1f65c320
|
3 |
+
size 50331648
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e66c3dcb4c1431d9b0151b3d7336604476f66e0c065cbfdbe523fe0b8542463f
|
3 |
+
size 29920256
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab7e0fd68c6567d412cfe3969065260df13d8bb052c96d8916a61c38dbf6bcf3
|
3 |
+
size 23633920
|
params_shard_6.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56ae245a7a96cc96c5ad086a628e635743867b3076933176ffeb20305d33d91c
|
3 |
+
size 23639040
|
params_shard_7.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1042315cbfb4f527829a390b27f39677dd6eb6910e358698eef20a5cc198e4c7
|
3 |
+
size 32501760
|
params_shard_8.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87e7f928aafee48b022f16e482b5ec7d395e6013b2bd1e68b31a1853d7426723
|
3 |
+
size 26593280
|
params_shard_9.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4c38b30b3bf0ea799ab047752568361334e81c992004d78758b5d12d47ef4fa
|
3 |
+
size 23633920
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|