at676 committed on
Commit
53a8d38
·
verified ·
1 Parent(s): 487c673

Upload folder using huggingface_hub (#1)

Browse files

- 7b034bef1925b15fbd72ea5cee4188803002c0c44db5f60c328f38bc17c7d5e3 (61a9db1c490171d77b734383bdacdf4b3781231d)
- a2d53511790456111625d21cd14185ecb037ec0ca65b9acee65e8b883631397a (34689f7615f7b1634815af4a86896e13d97101c5)
- 76fd91607eb76ad3cc644e0028aa8ac976d82c6412a8acfccbee96b7074c3e57 (dcbcdb9c011a15dc22479a36ef49ec6d438c2df0)
- 620297bba12bbd61d2dad8c7bf53a7b34adff1c4c080710dd394d07f2099d63c (6e1dc600a12c191c17bde48ff171c323f2fc192a)
- 5333c045a8c7da6d8ea8f9004cc5a75ecd1d7c55fc0883fe385257053bfbe342 (45a362a9ccece49157fcde580855a3fddba2e206)
- 6a43a1230ae0008005dd4584fecd26e35e9ae90454f21ce39094f451ca792ebd (736c5044cb7586f18bc98dd1048b48601a6c0a42)
- fc08feb3ed410693ebf753cbd8e9d2506e8dba131bc8c3ec54e260bf6648f5c5 (fd22347ba7101fd5aac616c0ff60845f05dc1a68)
- 58d5831d083ce7d44d15364d11567090b89081aa818e51054917c037e60285ce (fe6e2e060dc698743a6685fcd7f4b4e633f502bb)
- 0825781306f43230b18885be7bc7c73cb60ce094d1a0b6406452edde69819d63 (8c248f28f7b7b8818334edf2d141e68f00502247)
- 7289b6b000da9b3cb3f73e0b0a7ec1b66520f721b8edcae7c19917f61a5c37fd (d9eaba162a8eaff7550b43ca2215a2ad0fca503e)
- b8b28126f7e0033a281f878e17fef3f13660baa6b0b30df0eb959421a0e9b491 (ea446a71bc1790b75ebd4f02a114e542e4aee953)
- 291bfa0e72af023140e4573fe018dc89b3bbe40888b6d4b016026e3e8a4af373 (f3f1cc6758f8c88e323993dae5f6e19ab32bac3c)
- e37d3ada6c07deaf647ed9366f37d8c70eaa5f8cd106665e11d88916cf7f3286 (ad7c9dca35b2b5811bdc9052c9b35f5508924939)
- 3fe025e3c867c5ece4050ea0f7450b9c8a73137d8894c8515c654c6f047eca1a (6d8e87c8d7801ee635737245f7795e55f278c31a)
- db93f8a8a429c2b81e9a5a62d5f744b9563da1a8b45555d9f988795daee948d0 (a3bca618a280a8a3874c2fba7cb82a327a3206d6)
- 84a7d87072078125db33d6105ee5f7edd65824084278b1f8888d588d3b88531f (6480312b7ebc56a3f211545d0b539b45603d8fb9)
- 8b4d0e1ca7d9eef31dfc7ed56c199d559a4dcc92b3ff2b1c08fa9f23add0fd4a (d6e366e30c48917788ced546478dfc3bef00b072)
- d10e0136b9dcc4ceee24b7a5aed26d20bc738dca3b855117f933474a93a413eb (664b1bd28c2b257aba8f7a6da4038519e7091973)
- 34a900240ee735020f0f4b8b6592c2c20f8cf3dbcea4663143aaf8972cf6aa04 (c52ef79e429c5d6868bbfe471db1abe4156dbb72)
- 56121552e4c2f2aacd0e427d10b72801a16b5c4f7c85f8fbc19e2bc4be12283b (b08983495772e19e51cc6eee788088d3d49f0f6c)
- cf627268e587bcc2f1e5d53a402f32665cd817893111fc70b83a0e0fc029e882 (966c4ea8047b530b49829c3cb330c9bbfb429855)
- 48949e4f8ffd4fc24e420adcfa8a65c2268d53b574c8a2b7eb483b5b813b57ab (1fe733b9e545cb1795d77a9695a2776e91d50182)
- ba0a13c72c5cbd12f6c1d8a141235c8ed7594723eabaf541dd75eb146155c076 (28d9dcd63a3fba53c2a256a7694197611b64e3b0)
- c6b263a60c0b7d56e31ccbd1c8ff4d46e9290fd1e5477ceeeac4ad52ec417d58 (c057c14f43cb0241560c713aa3aabc930c93e558)
- f92c55db01865b2a7d2fb7d203311b82cd50c9a4c7c091d683d1433132f6c173 (2568e344d1e96b09a5112bce8c96996b8f6d5a8a)
- a4745ea6f453dec7cec629a74c271e6b21fdf31368c2a6dc1e77506c9851f9f8 (d33c23636e44e8a855b96725afb1413ea2bb3cb1)
- ee49caac6bdf774915f83a7c7755f98cb9283440f7665016feac45d548baf04e (04964fca5b9e6c4d1629ecb02d89267b5dd79c78)
- b64b0b1e1bb38f78221b34a9327946e5a9a9d69398cff6a623324ea1fc8d00eb (c6ff037ff310d274cc99a86e7611bc884d0824ba)
- 2b0e3ec5cdf0c9d94a64a8d40e27bc410ab37a8c96eed87cd9cabfd48f1b8c76 (a58e1c64164f6c4b28e43dafb313fd10fb511b53)
- 9a2258c37c751934ca14a530a19046dc69c7ba50c610e920bce756ed6e041813 (400aaa3a89e95b393d2b1502b2f2c6afdc187b0e)
- 0fa410561275b02275a0afd973738b8e1ce05d002cbf832f61d96744a0252b17 (ae8e863b46d86bfd46afc9e2866307ccf3bef0be)
- f4d00372b42d1708fbf05572451cedce0a5c6381f20fe48bb6aeb36b45af6acf (358689c92a4b2847074b26a219196c8a883c1af6)
- c6b6de80a11cf4403f54326d3971e046628487fc0e336b52bc44799a19522abd (7e814e89ded149bdb29d2136b347970cd6d38722)
- b9b42073371f4f7f3a1510bd870bae2ec214249d30259593d9d47139ff67ff80 (6bc74307b084b1b4448ae0ef54d133cf91846699)

config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "meta-llama/Meta-Llama-3.1-405B-Instruct",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": [
10
+ 128001,
11
+ 128008,
12
+ 128009
13
+ ],
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 16384,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 53248,
19
+ "max_position_embeddings": 131072,
20
+ "mlp_bias": false,
21
+ "model_type": "llama",
22
+ "num_attention_heads": 128,
23
+ "num_hidden_layers": 126,
24
+ "num_key_value_heads": 8,
25
+ "pretraining_tp": 1,
26
+ "quip_params": {
27
+ "K": 3,
28
+ "L": 16,
29
+ "V": 2,
30
+ "codebook": "bitshift",
31
+ "codebook_version": 0,
32
+ "decode_mode": "quantlut_sym",
33
+ "td_x": 16,
34
+ "td_y": 16,
35
+ "tlut_bits": 9
36
+ },
37
+ "rms_norm_eps": 1e-05,
38
+ "rope_scaling": {
39
+ "factor": 8.0,
40
+ "high_freq_factor": 4.0,
41
+ "low_freq_factor": 1.0,
42
+ "original_max_position_embeddings": 8192,
43
+ "rope_type": "llama3"
44
+ },
45
+ "rope_theta": 500000.0,
46
+ "tie_word_embeddings": false,
47
+ "torch_dtype": "bfloat16",
48
+ "transformers_version": "4.45.2",
49
+ "use_cache": true,
50
+ "vocab_size": 128256
51
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
+ "transformers_version": "4.45.2"
12
+ }
model-00001-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a42deca02abcefc58242c25cefbfc71ba235f025e87a6562bf94510d3873e5e2
3
+ size 4744288624
model-00002-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c6c8b2ce881db2a10a332d340ab9083b2da893b9f2c7fa29d9e64d1a37f6521
3
+ size 4785574248
model-00003-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1effc15a8e6bff779bd2d69576a2352e90f5a4242d21aaae190986fb0ae1ee18
3
+ size 4785574248
model-00004-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ad27d0b7627694be8213fa797a12e29eb978ab611a9077c573297a90167a549
3
+ size 4785574328
model-00005-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc4f631cd63569758d212a5b157616c22ee2be348adc6bf3756c9c358f8481a0
3
+ size 4785574368
model-00006-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47f18a027a2f9a3692311c44c40054f60bbe84d818463e4cf0ca1588aaf1ab19
3
+ size 4785574368
model-00007-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0ea2824c2e53ca325219220ccb9759a54710fb4731ac60d19dfdf260f32b091
3
+ size 4785574368
model-00008-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d1fde9f3469f0f14b7c1bd3e7bedb1e4adaf575171240d39857c09d8f1d9978
3
+ size 4785574368
model-00009-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ec887524b05edb1cb8518bfc7e6fa1a4d60122d46796f0181742e3f11384780
3
+ size 4785574368
model-00010-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bc0da1cb9b42972d6649231b66f8d8c2b187d2fe438a03c2f65312f73669aff
3
+ size 4785574368
model-00011-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e64204fe44c6e2a09f38bbd3a317832e5a325b4fa754c55e45d9fdb2d8b9e19e
3
+ size 4785574368
model-00012-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd9dc098ad292e79d26b3006921ae3e6b1f20e21d44fc62709d86bcb04a3b645
3
+ size 4785574368
model-00013-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2ec5f7bea8e751982cd267b0db5ec8f53341cbc3dc211ac25fba8168329556a
3
+ size 4785574368
model-00014-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:342106a19f04746272440840cc7580cec84a660055c9a358268f27aa3185f4da
3
+ size 4785574368
model-00015-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5131fe57c81e29efa187fc77af55a935a045c81f2cb6faba0a722e14647a62b6
3
+ size 4785574368
model-00016-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1842f1505a48bd06d73dff1d4e743b9ad93cf7a57905e1007d394958ddea81df
3
+ size 4785574368
model-00017-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d38612c5bdcde4cb1a6409a8edf89693436250fb51a1769d89f633ea6f4685e8
3
+ size 4785574368
model-00018-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d7489a481bc990a57d631c4bed93ff105655679baea41bbddcdf02b96bb903c
3
+ size 4785574368
model-00019-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:458c27ea0de160cdd1e7418a28a4d140a06454fe81549ca9c161f96ae80be3a6
3
+ size 4785574368
model-00020-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba7fcffddf087d7441d28e4208fdd8d521d2cf9daabbc1899641f60ca1649806
3
+ size 4785574368
model-00021-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82580025a77f93b9718bdf1a19b803befe2578733aff3b822f850e299306f7d0
3
+ size 4785574368
model-00022-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cba94cdc47e0ec3fe9d3654dffd8d1075409fc87102b8d9e60b6108c1e317b4
3
+ size 4785574368
model-00023-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ea243b3e9e8095e7374d7e66b53c87f28185777ef934c1680ddac4582c7f9b4
3
+ size 4785574368
model-00024-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b52474db9dc9b785df0984f9926f69d1738169327039af8e2f0ce41f04a94fc
3
+ size 4785574368
model-00025-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c3a90ae500d679a893f1f6820bfbd2d9d409b7b1ec31b7b56bcef1d12021608
3
+ size 4785574368
model-00026-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd8f6a3681073cc2da50f5a8ebcc7f2531f3a83b5cf3fc528d66a835bc35c70f
3
+ size 4785574384
model-00027-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4056031273560748c122df42bd4fd7a245eb820d08f10a1a0c1a7fbb7e7e2cfd
3
+ size 4785574488
model-00028-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef5bc3315c8e1027532f131897cc09558cf65f9afc0019bc6e98ff5fd7b2a03a
3
+ size 4785574488
model-00029-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17ecba067b4609fa1a97d651ee01a6fcb79e61ef6e4d2d3add73d0806fa81f7e
3
+ size 4785574488
model-00030-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70cd3373b9827f488c4ec09819d1502e6d89a361894b571dc63124ace58bfb56
3
+ size 4785574488
model-00031-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a00d96cfbabae5081fcccec3a54f8dd194185844d2aae639db56b5d62676d021
3
+ size 4785574488
model-00032-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:063d533fe69e11a564b480062686feffa17b1c3ac7d2ad51ff8cb7b3af7384f4
3
+ size 4785574488
model-00033-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c060cd8ee1d4f25e39115324e8f8ab1a0c126dc3610fc24b6536ee7174e1b8e
3
+ size 1851224240
model-00034-of-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
3
+ size 4202692736
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff