apepkuss79
committed on
Commit
•
b223872
1
Parent(s):
7f977f5
Update models
Browse files
- .gitattributes +13 -0
- Llama-3.2-1B-Instruct-Q2_K.gguf +3 -0
- Llama-3.2-1B-Instruct-Q3_K_L.gguf +3 -0
- Llama-3.2-1B-Instruct-Q3_K_M.gguf +3 -0
- Llama-3.2-1B-Instruct-Q3_K_S.gguf +3 -0
- Llama-3.2-1B-Instruct-Q4_0.gguf +3 -0
- Llama-3.2-1B-Instruct-Q4_K_M.gguf +3 -0
- Llama-3.2-1B-Instruct-Q4_K_S.gguf +3 -0
- Llama-3.2-1B-Instruct-Q5_0.gguf +3 -0
- Llama-3.2-1B-Instruct-Q5_K_M.gguf +3 -0
- Llama-3.2-1B-Instruct-Q5_K_S.gguf +3 -0
- Llama-3.2-1B-Instruct-Q6_K.gguf +3 -0
- Llama-3.2-1B-Instruct-Q8_0.gguf +3 -0
- Llama-3.2-1B-Instruct-f16.gguf +3 -0
- config.json +39 -0
.gitattributes
CHANGED
@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
Llama-3.2-1B-Instruct-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
37 |
+
Llama-3.2-1B-Instruct-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
38 |
+
Llama-3.2-1B-Instruct-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
39 |
+
Llama-3.2-1B-Instruct-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
40 |
+
Llama-3.2-1B-Instruct-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
41 |
+
Llama-3.2-1B-Instruct-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
42 |
+
Llama-3.2-1B-Instruct-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
43 |
+
Llama-3.2-1B-Instruct-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
44 |
+
Llama-3.2-1B-Instruct-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
45 |
+
Llama-3.2-1B-Instruct-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
46 |
+
Llama-3.2-1B-Instruct-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
47 |
+
Llama-3.2-1B-Instruct-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
48 |
+
Llama-3.2-1B-Instruct-f16.gguf filter=lfs diff=lfs merge=lfs -text
|
Llama-3.2-1B-Instruct-Q2_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cbccffcba1e679d2fb906a55b5d6d641aa21bff9ee20fe30cef6dd6b9f8e410
|
3 |
+
size 580874080
|
Llama-3.2-1B-Instruct-Q3_K_L.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e89a46e80c150f92bc0d5dfacb069f46770807664340339a22d886031ee06ddc
|
3 |
+
size 732524384
|
Llama-3.2-1B-Instruct-Q3_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bdd2550b78bdee5653da8f9d07d74faaafd7cc50602eac9107d8f2c60677d24
|
3 |
+
size 690843488
|
Llama-3.2-1B-Instruct-Q3_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf5363d4847936b37950b1d048199b616b80edd40e78ed15e7b0f2e36c32433b
|
3 |
+
size 641691488
|
Llama-3.2-1B-Instruct-Q4_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:150e95f201edeaef9b5d37aec70fcee65533ddeca51a4d1092037195f0302f69
|
3 |
+
size 770928480
|
Llama-3.2-1B-Instruct-Q4_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e95df2f5144fd67bf11421ad59812fbde45a79c90eb49cb5d79e3d7bddaa1331
|
3 |
+
size 807694176
|
Llama-3.2-1B-Instruct-Q4_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e256d51eed0799552f91a4fb8f0d05315b3e3dc1cd4499514e7d87a845951c88
|
3 |
+
size 775647072
|
Llama-3.2-1B-Instruct-Q5_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:922306ce6b89b731d20130c2a5e909be530c5703fd24b26f7d050bad3faf3fc5
|
3 |
+
size 892563296
|
Llama-3.2-1B-Instruct-Q5_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cd16584b15af8c268ca60454b63b5021b0b2c7edf66cff2b41210a333b2233d
|
3 |
+
size 911503200
|
Llama-3.2-1B-Instruct-Q5_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66260aca245c04327590457d52debf378e0fc93b881b2effb71f9a00703a1953
|
3 |
+
size 892563296
|
Llama-3.2-1B-Instruct-Q6_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fe00ecc20650188a714bf1766cecbd938e6119e9311c8fe91ca3fb5f3246591
|
3 |
+
size 1021800288
|
Llama-3.2-1B-Instruct-Q8_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c0522ea0da43f9a089b5f2df7699a659cc320a5259c33506c44925fa03232fc
|
3 |
+
size 1321082720
|
Llama-3.2-1B-Instruct-f16.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f33ad43d2b85b908ff06fe7002b69806a57359b9b2617ca27d7bdea428ae146
|
3 |
+
size 2479595360
|
config.json
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"LlamaForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_bias": false,
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 128000,
|
8 |
+
"eos_token_id": [
|
9 |
+
128001,
|
10 |
+
128008,
|
11 |
+
128009
|
12 |
+
],
|
13 |
+
"head_dim": 64,
|
14 |
+
"hidden_act": "silu",
|
15 |
+
"hidden_size": 2048,
|
16 |
+
"initializer_range": 0.02,
|
17 |
+
"intermediate_size": 8192,
|
18 |
+
"max_position_embeddings": 131072,
|
19 |
+
"mlp_bias": false,
|
20 |
+
"model_type": "llama",
|
21 |
+
"num_attention_heads": 32,
|
22 |
+
"num_hidden_layers": 16,
|
23 |
+
"num_key_value_heads": 8,
|
24 |
+
"pretraining_tp": 1,
|
25 |
+
"rms_norm_eps": 1e-05,
|
26 |
+
"rope_scaling": {
|
27 |
+
"factor": 32.0,
|
28 |
+
"high_freq_factor": 4.0,
|
29 |
+
"low_freq_factor": 1.0,
|
30 |
+
"original_max_position_embeddings": 8192,
|
31 |
+
"rope_type": "llama3"
|
32 |
+
},
|
33 |
+
"rope_theta": 500000.0,
|
34 |
+
"tie_word_embeddings": true,
|
35 |
+
"torch_dtype": "bfloat16",
|
36 |
+
"transformers_version": "4.45.0.dev0",
|
37 |
+
"use_cache": true,
|
38 |
+
"vocab_size": 128256
|
39 |
+
}
|