Upload 107 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- mlc-chat-config.json +45 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gemma",
|
3 |
+
"quantization": "q4f16_0",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 3072,
|
6 |
+
"hidden_act": "gelu",
|
7 |
+
"intermediate_size": 24576,
|
8 |
+
"attention_bias": false,
|
9 |
+
"num_attention_heads": 16,
|
10 |
+
"num_key_value_heads": 16,
|
11 |
+
"head_dim": 256,
|
12 |
+
"num_hidden_layers": 28,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"vocab_size": 256000,
|
15 |
+
"position_embedding_base": 10000.0,
|
16 |
+
"context_window_size": 8192,
|
17 |
+
"prefill_chunk_size": 8192,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"max_batch_size": 80
|
20 |
+
},
|
21 |
+
"vocab_size": 256000,
|
22 |
+
"context_window_size": 8192,
|
23 |
+
"sliding_window_size": -1,
|
24 |
+
"prefill_chunk_size": 8192,
|
25 |
+
"attention_sink_size": -1,
|
26 |
+
"tensor_parallel_shards": 1,
|
27 |
+
"mean_gen_len": 128,
|
28 |
+
"max_gen_len": 512,
|
29 |
+
"shift_fill_factor": 0.3,
|
30 |
+
"temperature": 0.7,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 0.95,
|
35 |
+
"conv_template": "gemma_instruction",
|
36 |
+
"pad_token_id": 0,
|
37 |
+
"bos_token_id": 2,
|
38 |
+
"eos_token_id": 1,
|
39 |
+
"tokenizer_files": [
|
40 |
+
"tokenizer.model",
|
41 |
+
"tokenizer.json",
|
42 |
+
"tokenizer_config.json"
|
43 |
+
],
|
44 |
+
"version": "0.1.0"
|
45 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb07c314a0bc54bb896a328e543ba0b50dd49ee4e7d518a00daa14a550a76ba3
|
3 |
+
size 393216000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63fa7708104b0af3b9c6b126dee669516ac878feddd8a8dcb0e2509df9e7ccbc
|
3 |
+
size 49152000
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65961d7b8025fc7f14d8b6c580687f648f12a656b28a789ebb18e9356442160b
|
3 |
+
size 75497472
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f76c3df72da9b7379488f5c6bdef11085d4a809036b1353f1bf61eb48cb2eb8
|
3 |
+
size 33036288
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a45af99bf69b84e195a3df0851043a164d9e684becbd9121d164954c53c71b58
|
3 |
+
size 9443328
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f4913f62d105a34cbce074ba5c264edaec67632fea802ed66f92e3653c6bc78
|
3 |
+
size 33036288
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb01f30569e854a6187ffc06f2ce19cb7aecbc51dc481b08265a9dbdd33c2da3
|
3 |
+
size 37748736
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b0d82858ec376e555a47e98fe1dc8a8d6a2fee712134f32205d05f680fefc96
|
3 |
+
size 75497472
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26f9be9512520dbc8b715c629f63c92a45175a04f10cf822eddf7ef084feaeb0
|
3 |
+
size 18874368
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0333c009a47710d8873b3920d99bbe37357f80b34dfa2f53190d49d62e502024
|
3 |
+
size 37748736
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb6fba705ada839bad5656a5451ce4de219c19a465e533d4fea5852afa77ddd0
|
3 |
+
size 33048576
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2cc8dcae1634c4427ab4df0b7144ab1976e8444352c0d754fb2a10615547e9d
|
3 |
+
size 75497472
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:470ecabfeeba502b9def35bd8781e1cbd4016f9e6c9b9f022b851bd25bbe70ae
|
3 |
+
size 33036288
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:968ba69d9606f111cc3b940f2c617ba02602c53dfc042539aef11eb5216fdc21
|
3 |
+
size 37748736
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3838dfc032d4e33d76e2d3685be1b2812378e8b8fe93d6cac5021278eb0cc8f
|
3 |
+
size 37748736
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cde06b4b48869021bce3649f0c4807d4f3eaa457bee16f9dd114a3f2c1390e2
|
3 |
+
size 75497472
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1816489510674bd335922204de404baa03034bc7a9313b42cc7711a11e21ac3
|
3 |
+
size 18874368
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ac6e28bbf2e1e7f1377f55fc260d1ca845933e4b7e0f2e3256f43cc36f6a65f
|
3 |
+
size 18874368
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93a445724eaed413f1e0f1c1d45e0fb377f32291028c8bccae03dfe190b3d0d8
|
3 |
+
size 33042432
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cd940330458e65d040eb511d1118f5ea32ef67df22cf6bc9b287e1bbbcffe47
|
3 |
+
size 37748736
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:110bde984fd473c04a88eeab749131fc8b8e6069ad272e291dc42cce3b0f020e
|
3 |
+
size 75497472
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66a31c4c1d94fa4163e6ff3048395ca3abd4d8c2ff3355c7ac1ad484629d65b9
|
3 |
+
size 18874368
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b091f498769fba2da0a0d050125015f09a0e97f6d2f2192348268ad284b876ac
|
3 |
+
size 37748736
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb75a91c1e30ab59d53aa09854e951193b88aa3b39fc25c011e5fd327aced7b1
|
3 |
+
size 33048576
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01e8902e5a99de97fa944f881beb82096e571289d4d607fa3a4285f4f86ed332
|
3 |
+
size 75497472
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4ef6f434167e77347331a631c335e667d927683ac90c419cc4fc02ebccc7af7
|
3 |
+
size 75497472
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ec3a26bb17c69dc2007f34ad678c06974289a45172c1a6b9086b0c0ea924b55
|
3 |
+
size 33036288
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc0b53780a6a026c810a77dc6af809d463075ac75ffed57059cfc59f5b797abc
|
3 |
+
size 37748736
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b8c0ed3b7e024f916e66bdd828122520b3baf680805f8872cfdee446ff61ebe
|
3 |
+
size 75497472
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee36f174bf6b9aa4b988ffdcd575229a2e7bbd2b0aa9dee46ee33e6f6d909d1e
|
3 |
+
size 18874368
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f52633ac0c6f9c0a6bfef93bd006bb22b9bdb376026b7dc0e1c015cf8b14099d
|
3 |
+
size 37748736
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e63616ab7b04d2d2fb07680677e986becad34ec272f19be98ce387a21fcc9a43
|
3 |
+
size 33048576
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:479ce0fd5b1a66b9bc57a6f51532fb00c6c0dfbf0905d37bb543f01099a18ff7
|
3 |
+
size 75497472
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:039128ba09120f1c4fae1d310b75b57978b8b8d8446b39ef5a77fbf886d751be
|
3 |
+
size 33036288
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7119f7daa99f269f8cebafd5b96711e11749c6d35d22f01093b00fb773c5ee1
|
3 |
+
size 37748736
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13b52dec000f552de9724cd54eb2324b6c34ceef7086cf62efb98b256cfe2337
|
3 |
+
size 75497472
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b27320b23591ca86026f1bc6d7ec6bc040b970ffb2be0a6117c644f68ed7447d
|
3 |
+
size 33042432
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:613ffc0f63fedf7ff871fc5164aa3be3b344e4025b002372ea219cd9af06e66a
|
3 |
+
size 18874368
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9f5d2bba620638ad1a8033ab318a78e0c5676bccb830fc92dcad05c72dfd3e2
|
3 |
+
size 18874368
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e7b09e3033aafe32e3b3ee9f8124492b8e3f4db0c9a63aad5b0bf340118b41c
|
3 |
+
size 33042432
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04c7929c277aadc6cef83fb949f50dfdad9a7b01de7ee56672f0bc702b4990b0
|
3 |
+
size 37748736
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b79ae0ad5893cacdff1778b766d55e6ba6e6635ad8818b63d7eec2f833fc2c6c
|
3 |
+
size 75497472
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b73ada6489689750fa1da5218f63737042a317841e5448aa338c3b335001b3ba
|
3 |
+
size 37748736
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf241480f96c85b20c931c3dddb6ff889a782362ee099e9329529a14c2c0813d
|
3 |
+
size 75497472
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:503c03712dec997620bc70958557df654cc0c38936e4b09e898317fa55feaa1a
|
3 |
+
size 28329984
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3672ef6d074d87594884f8419cb3f2b10abb9f931a5b9ee02bb478a9690958cf
|
3 |
+
size 30676992
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:924508c0d5338ac455fcca38b8f4f5d135ec420d7c78ea4a2a81b3c86eca9297
|
3 |
+
size 37748736
|