Upload LlamaForCausalLM
Browse files
config.json
CHANGED
@@ -11,17 +11,14 @@
|
|
11 |
"hidden_size": 4096,
|
12 |
"initializer_range": 0.02,
|
13 |
"intermediate_size": 14336,
|
14 |
-
"max_position_embeddings":
|
15 |
"model_type": "llama",
|
16 |
"num_attention_heads": 32,
|
17 |
"num_hidden_layers": 32,
|
18 |
"num_key_value_heads": 8,
|
19 |
"pretraining_tp": 1,
|
20 |
"rms_norm_eps": 1e-05,
|
21 |
-
"rope_scaling":
|
22 |
-
"factor": 4.0,
|
23 |
-
"type": "linear"
|
24 |
-
},
|
25 |
"rope_theta": 500000.0,
|
26 |
"tie_word_embeddings": false,
|
27 |
"torch_dtype": "float32",
|
|
|
11 |
"hidden_size": 4096,
|
12 |
"initializer_range": 0.02,
|
13 |
"intermediate_size": 14336,
|
14 |
+
"max_position_embeddings": 8192,
|
15 |
"model_type": "llama",
|
16 |
"num_attention_heads": 32,
|
17 |
"num_hidden_layers": 32,
|
18 |
"num_key_value_heads": 8,
|
19 |
"pretraining_tp": 1,
|
20 |
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_scaling": null,
|
|
|
|
|
|
|
22 |
"rope_theta": 500000.0,
|
23 |
"tie_word_embeddings": false,
|
24 |
"torch_dtype": "float32",
|
model-00001-of-00007.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4886466168
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c862e8ecd6caf1b057ff90234945de45b7cc7fa3d21cc4c8accca5e78606f1c5
|
3 |
size 4886466168
|
model-00002-of-00007.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4832007448
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60a45e4e069d8bf0dc2f4438de856aa92a5571b0529b1d1efba02bf7a052c6e3
|
3 |
size 4832007448
|
model-00003-of-00007.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999813112
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ca8410b94749519a0fdb4ea586a0b4946708b057f7af094c3892b9de687c2aa
|
3 |
size 4999813112
|
model-00004-of-00007.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999813128
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3168fc1330a35602fe0d7120f10a18eb4c44128c35bf3248ccdfe23db285ad81
|
3 |
size 4999813128
|
model-00005-of-00007.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4832007496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dabf9d3758465c4faef25a9dc23af4569119eb6aabf765cdcb8cf89007be99d
|
3 |
size 4832007496
|
model-00006-of-00007.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999813120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c2b084a978d37965315896b14fb76dd714f4594333ad8f12854e60264d9aa15
|
3 |
size 4999813120
|
model-00007-of-00007.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2571158184
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ff26d5dcce3254e446def094f836a70ef00767efa0ae0d39f26a0b521fd0b44
|
3 |
size 2571158184
|