NSTiwari committed on
Commit
b4ac27b
1 Parent(s): eb3e54f

Quantized Llama-3-8B-Instruct model.

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Llama-3-8B-Instruct-q4f16_1-android.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9f804c58d4750908cb091bb00a6fe0e030dd7a3f96c9ba8aa87a8d0c3c48636
3
+ size 515778
logs.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "llama",
3
+ "quantization": "q4f16_1",
4
+ "model_config": {
5
+ "hidden_size": 4096,
6
+ "intermediate_size": 14336,
7
+ "num_attention_heads": 32,
8
+ "num_hidden_layers": 32,
9
+ "rms_norm_eps": 1e-05,
10
+ "vocab_size": 128256,
11
+ "position_embedding_base": 500000.0,
12
+ "context_window_size": 768,
13
+ "prefill_chunk_size": 768,
14
+ "num_key_value_heads": 8,
15
+ "head_dim": 128,
16
+ "tensor_parallel_shards": 1,
17
+ "max_batch_size": 80
18
+ },
19
+ "vocab_size": 128256,
20
+ "context_window_size": 768,
21
+ "sliding_window_size": -1,
22
+ "prefill_chunk_size": 768,
23
+ "attention_sink_size": -1,
24
+ "tensor_parallel_shards": 1,
25
+ "mean_gen_len": 128,
26
+ "max_gen_len": 512,
27
+ "shift_fill_factor": 0.3,
28
+ "temperature": 0.6,
29
+ "presence_penalty": 0.0,
30
+ "frequency_penalty": 0.0,
31
+ "repetition_penalty": 1.0,
32
+ "top_p": 0.9,
33
+ "conv_template": {
34
+ "name": "llama-3",
35
+ "system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}",
36
+ "system_message": "You are a helpful, respectful and honest assistant.",
37
+ "system_prefix_token_ids": [
38
+ 128000
39
+ ],
40
+ "add_role_after_system_message": true,
41
+ "roles": {
42
+ "user": "user",
43
+ "assistant": "assistant"
44
+ },
45
+ "role_templates": {
46
+ "user": "{user_message}",
47
+ "assistant": "{assistant_message}",
48
+ "tool": "{tool_message}"
49
+ },
50
+ "messages": [],
51
+ "seps": [
52
+ "<|eot_id|><|start_header_id|>"
53
+ ],
54
+ "role_content_sep": "<|end_header_id|>\n\n",
55
+ "role_empty_sep": "<|end_header_id|>\n\n",
56
+ "stop_str": [
57
+ "<|end_of_text|>",
58
+ "<|eot_id|>"
59
+ ],
60
+ "stop_token_ids": [
61
+ 128001,
62
+ 128009
63
+ ],
64
+ "function_string": "",
65
+ "use_function_calling": false
66
+ },
67
+ "pad_token_id": 0,
68
+ "bos_token_id": 128000,
69
+ "eos_token_id": [
70
+ 128001,
71
+ 128009
72
+ ],
73
+ "tokenizer_files": [
74
+ "tokenizer.json",
75
+ "tokenizer_config.json"
76
+ ],
77
+ "token_table_postproc_method": "byte_level",
78
+ "version": "0.1.0"
79
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2ed37d77cd108bf6f4ae44b752deb6d9ff230cab0d1dd6e498a7afc24733099
3
+ size 262668288
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c45006b20e9cbbf1941a106dbddd5b043a24a4484cc15f7dca444031d5e59ada
3
+ size 29360128
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92423d1e470526664d2cdd09bcf9111d813fea4cf22223636b05c2d9229a1618
3
+ size 33046528
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7b1f5a47bef6b9c1087ae3865ecedede9e19f9bf6b1ea3e94a76a81a1e68843
3
+ size 58720256
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:068171b489cc7cbd43dcca11b5520127ad201c59802530681dada0940060d72f
3
+ size 25174016
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc6f005ac098bd8aef30fb032aba815bb08a66c35f9a1353516d964df44278e3
3
+ size 29360128
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eea3b928e9e76e9b7a4f1dd98e98a12f5e34df364c28867f6b27d52ae2675a11
3
+ size 58720256
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef049ca8e8ae1623db544b23546248657a232e29dd6fcc4951e6b998eaca9044
3
+ size 33046528
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bec5e57d1eae4044ce2ed6b5de14220d6ab4aa81d367abd1df1f5e391c4209bd
3
+ size 58720256
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:148236900677871920dd45b0c0ef57928d3098f304662700e5b2d1778c672d1a
3
+ size 32505856
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44f5ce12208ff6abd5779a75ba0bda156318f3766256659431dd446f4992b154
3
+ size 9437184
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c745443ff322319bd8120fb43169e40167159e9dc96047b544015e601114522d
3
+ size 29360128
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddcb0155d652d7dcbdf83af1c8da095c66a2e94f30a755c7889cfc7456e30485
3
+ size 58720256
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee8a779df967099cc3684157d4c68badd7a4df554ee7ae57f7249cde1180c77e
3
+ size 22036480
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:028dcb0f5706b25a6173bf9cb2ebd4aa833f04a3bb6c0756415f63afdad91833
3
+ size 29360128
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6434d2b1cedfb96b5105758c697fafcc2380e41c29350ca1d5942f64ec7a005e
3
+ size 58720256
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:687c80c5494efe7efa0288ef9d3ffb44c1eedc8558c151da9b84d0a6f4eff583
3
+ size 27271168
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54126705bc9a09bb3310855a4ecd3d5e57c5d94b3facf877a1a400c21e871ef6
3
+ size 29360128
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e05bfa4a2c5d0bc93573a75ecd287a4938b83ee4af669fe5e9e0d3c43146bc2
3
+ size 30949376
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30130ce7c89c60aa54c00c167ca8962411178a59c24207f0ad00bfb863404fab
3
+ size 58720256
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63962a1a538ff2ecc296c6d07ff461247cfe1fa28950a97a7779dd80c4bb4d1e
3
+ size 32841728
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f655c2bf134b5b9a85f6247651ef076f624d8165b8f531e6aaa52cde8395c603
3
+ size 25174016
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bc9128b9f3c5abca94c4e13619347a1f36f539e7795552cbdbf437055e0cd9f
3
+ size 29360128
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fa3a2a4c7742eb08bc6b8b8e17d78dfeb2ec1d6490e1a16add6925ca4e79009
3
+ size 58720256
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d90de65f027fb1fc916f02ff73b55ae84e036fcf2f35fc5407ef25da61c20931
3
+ size 33046528
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36605734cb52b92aa8635262f13b15d82610da79722877194557d69b37e6463a
3
+ size 29360128
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc13fb93d3054955f68a3840818dd74ee39941c682d45e4ddcaceeca46d9b9f3
3
+ size 58720256
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab76e5856b186751326e893e227802986deaa8151329a3d2a5ba35a9e2d84b1b
3
+ size 22036480
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6597b2a99b385cb36d77a387f3a035eec1e0a2c53de017c8db246c2774d0471f
3
+ size 29360128
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f9787abf533597067187590595ca737771f089ecabe53ef76770b37e8f58f18
3
+ size 58720256
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa3a9e9df3c533bdcafa8819381d0bb3efc67d277177349cf6cafbfa84af8fca
3
+ size 27271168
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d34f1fcb18350c4f89329f1db8ae657b37ae48926dfaf8a9aa25d98c26f9a03
3
+ size 262668288
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b59ffd98eb25881c21bbc6b0843cccf12d3f98a08fe26f1030c93812131cf4f
3
+ size 29360128
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c50b2f9ff6744c1cadedb37ee0ad1c7f800ad3f607fb76003b127377b75d72d
3
+ size 30949376
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7d78304a26c4164b72a5d71450c21979e711fb88ea963e142d34165f33deb9b
3
+ size 58720256
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3223acb25be3c6f301ea8f88e2c4d0f07c6f49c65faae047984e9805cb9486fc
3
+ size 25174016
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3051a8f94165689c4cfc0c05563c9b02e351f7667d0da97f123a2ee405d38dc6
3
+ size 29360128
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de466d5e972ee871cea39086fff82049da244b471a136af264af64c4279cceb4
3
+ size 58720256
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a192ac9f10be719ca8780c989693583b894c84817205189d3b0d69f4db96f27
3
+ size 33046528
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f23031f20e901678c3188e63e5e09ced63d4395c8c34ae87b22cbb349fa3a72d
3
+ size 29360128
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b9dc05e957ab2f7df4b5699231ad6b8a0cf5e8919ee749ee11debbbd9ae18e
3
+ size 58720256
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef42d957681f632ec441cf7ddf8374c7394d6d29685a1c683624a457a4caced7
3
+ size 22036480
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2328a9e043f74b15f0843a8b02637a4b1b6e5925809c2dc53dd131aeefdc2958
3
+ size 32833536
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c1a32e5f9d72ec6a3a6e03bd929c5a0d8d3c5cca4dbc33e2234476532477e7f
3
+ size 29360128
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c925ab081cb0f0e5171b6a4111eb469e3268b5b62352e461f5f00af2093c00ed
3
+ size 58720256
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bc9760e7e0b84d91c4a674d29cf59a3f96f12a4f010190381f4e8ed08e86bca
3
+ size 27271168