Upload folder using huggingface_hub
Browse files- config.json +36 -0
- generation_config.json +6 -0
- model-00001-of-00025.safetensors +3 -0
- model-00002-of-00025.safetensors +3 -0
- model-00003-of-00025.safetensors +3 -0
- model-00004-of-00025.safetensors +3 -0
- model-00005-of-00025.safetensors +3 -0
- model-00006-of-00025.safetensors +3 -0
- model-00007-of-00025.safetensors +3 -0
- model-00008-of-00025.safetensors +3 -0
- model-00009-of-00025.safetensors +3 -0
- model-00010-of-00025.safetensors +3 -0
- model-00011-of-00025.safetensors +3 -0
- model-00012-of-00025.safetensors +3 -0
- model-00013-of-00025.safetensors +3 -0
- model-00014-of-00025.safetensors +3 -0
- model-00015-of-00025.safetensors +3 -0
- model-00016-of-00025.safetensors +3 -0
- model-00017-of-00025.safetensors +3 -0
- model-00018-of-00025.safetensors +3 -0
- model-00019-of-00025.safetensors +3 -0
- model-00020-of-00025.safetensors +3 -0
- model-00021-of-00025.safetensors +3 -0
- model-00022-of-00025.safetensors +3 -0
- model-00023-of-00025.safetensors +3 -0
- model-00024-of-00025.safetensors +3 -0
- model-00025-of-00025.safetensors +3 -0
- model.safetensors.index.json +0 -0
- special_tokens_map.json +28 -0
- tokenizer.json +0 -0
- tokenizer_config.json +46 -0
config.json
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "alpindale/goliath-120b",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"mlp_bias": false,
|
16 |
+
"model_type": "llama",
|
17 |
+
"num_attention_heads": 64,
|
18 |
+
"num_hidden_layers": 137,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"quantization_config": {
|
22 |
+
"activation_scheme": "dynamic",
|
23 |
+
"ignored_layers": [
|
24 |
+
"lm_head"
|
25 |
+
],
|
26 |
+
"quant_method": "fp8"
|
27 |
+
},
|
28 |
+
"rms_norm_eps": 1e-05,
|
29 |
+
"rope_scaling": null,
|
30 |
+
"rope_theta": 10000.0,
|
31 |
+
"tie_word_embeddings": false,
|
32 |
+
"torch_dtype": "float16",
|
33 |
+
"transformers_version": "4.44.0",
|
34 |
+
"use_cache": true,
|
35 |
+
"vocab_size": 32000
|
36 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.44.0"
|
6 |
+
}
|
model-00001-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8631953fc813b02dcf2ecd637a69be3bb1c4647dea442810496cc51b7c7f505a
|
3 |
+
size 4953646668
|
model-00002-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4416337b604dad80f3c4bcbbd19ca7fe8327b75096fa8bcf74780ddb96caf908
|
3 |
+
size 4983039368
|
model-00003-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:394c834b787e371b676700aadffa74d46aaaea509a29f3513f95d7709f673817
|
3 |
+
size 4899121060
|
model-00004-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:140f9ce4f2f32d7a42a7e1723dd1d020e20e505de3b13dd3bd2714a3b6dd3cb8
|
3 |
+
size 4899154052
|
model-00005-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3e2220211b833cc096b22103675c5dd6b0161324874c90f8d7ea5685805d936
|
3 |
+
size 4899154052
|
model-00006-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3ed6c29d0266110d157f1cfc6107cfc873b2c7009f72f3cf637080fcf202e0c
|
3 |
+
size 4983039448
|
model-00007-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb1dc985a54782651bde6d93e826d34d00f0acf9cfb0ee831d7c55f37f61b3b6
|
3 |
+
size 4899121060
|
model-00008-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03110c5a00d695be3d31f380661ff834abb0cea8bce31fb2d3c2e9302c1b20ae
|
3 |
+
size 4899154052
|
model-00009-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66c5a374f9f9051b3a50c7d1e41ac8e22ce58a4d4f2c278c531c9962ded0fc2a
|
3 |
+
size 4899154052
|
model-00010-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:659be052d93807570ed479aa248f57b07d7519b857615ddd3ef7a2a5686e46cf
|
3 |
+
size 4983039448
|
model-00011-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85949c6e6803a055172b0873a382c72039f42de7a4a480c03555c88965be6ca0
|
3 |
+
size 4899121060
|
model-00012-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29e3e7667b7c7f8d4151fbed1fdba0a09a4b62553446530da2c4eea1336d3e95
|
3 |
+
size 4899154052
|
model-00013-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6db16e62fa926ad206a4c2099a84d7e13dc2c5f41e83d45e31d37e7841a635c3
|
3 |
+
size 4899154052
|
model-00014-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4ae4fc7e7eaf6cad30b20a56dd53f42a219fc324205a9227cd56fb9f622af65
|
3 |
+
size 4983039448
|
model-00015-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78b494f41f5e88a79f28f7d7c144c48c109f323fbcdf4aac1a24d0aa94b186c0
|
3 |
+
size 4899121060
|
model-00016-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:165fdefb5abd5dc3776c1157939a283b5158958470788c0769ce549c7da58ebe
|
3 |
+
size 4899154052
|
model-00017-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a15eb57ed89f2c3b81b07c0d9bbade2e04ad92a6f7f0b45565c207c922bba062
|
3 |
+
size 4899154052
|
model-00018-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:875740c38b1cddc9b5492dbf6fa7e1bc56cf053d0d48e213cbd318d4c5893ccf
|
3 |
+
size 4983039488
|
model-00019-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bcd1f72141bb9149d155d6101fb5f07f1e51762a46eac70a0860026d2814194
|
3 |
+
size 4899121148
|
model-00020-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6501150573e3fb882a40d7322135f832a64a58ba9fdba0ee107f09dfb4e45467
|
3 |
+
size 4899154148
|
model-00021-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14130c4d528b1dc00540611cffbd2180da7e60c82f06c2b96679d17b01dda23d
|
3 |
+
size 4899154140
|
model-00022-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fe0f7964003b78b0e3b3b916570bbe59a39a3aa362391a829971b689da06cc9
|
3 |
+
size 4983039536
|
model-00023-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a00496abf3560a7c44d7b9eaecfdef576ecb3fe9f29a57dfa317477e37ebc848
|
3 |
+
size 4899121148
|
model-00024-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c8c534a5d83647cc415e17cad598bd53f6959729c818e746c9c8fdb32ac918a
|
3 |
+
size 4513293512
|
model-00025-of-00025.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9fe65daa03c1fd29b72f4c7ae72b3ff9ee57f78e469dbc7002cb81e9c2b8973
|
3 |
+
size 524288128
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": [
|
3 |
+
"<unk>",
|
4 |
+
"<s>",
|
5 |
+
"</s>"
|
6 |
+
],
|
7 |
+
"bos_token": {
|
8 |
+
"content": "<s>",
|
9 |
+
"lstrip": false,
|
10 |
+
"normalized": false,
|
11 |
+
"rstrip": false,
|
12 |
+
"single_word": false
|
13 |
+
},
|
14 |
+
"eos_token": {
|
15 |
+
"content": "</s>",
|
16 |
+
"lstrip": false,
|
17 |
+
"normalized": false,
|
18 |
+
"rstrip": false,
|
19 |
+
"single_word": false
|
20 |
+
},
|
21 |
+
"unk_token": {
|
22 |
+
"content": "<unk>",
|
23 |
+
"lstrip": false,
|
24 |
+
"normalized": false,
|
25 |
+
"rstrip": false,
|
26 |
+
"single_word": false
|
27 |
+
}
|
28 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,46 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"add_prefix_space": null,
|
5 |
+
"added_tokens_decoder": {
|
6 |
+
"0": {
|
7 |
+
"content": "<unk>",
|
8 |
+
"lstrip": false,
|
9 |
+
"normalized": false,
|
10 |
+
"rstrip": false,
|
11 |
+
"single_word": false,
|
12 |
+
"special": true
|
13 |
+
},
|
14 |
+
"1": {
|
15 |
+
"content": "<s>",
|
16 |
+
"lstrip": false,
|
17 |
+
"normalized": false,
|
18 |
+
"rstrip": false,
|
19 |
+
"single_word": false,
|
20 |
+
"special": true
|
21 |
+
},
|
22 |
+
"2": {
|
23 |
+
"content": "</s>",
|
24 |
+
"lstrip": false,
|
25 |
+
"normalized": false,
|
26 |
+
"rstrip": false,
|
27 |
+
"single_word": false,
|
28 |
+
"special": true
|
29 |
+
}
|
30 |
+
},
|
31 |
+
"additional_special_tokens": [
|
32 |
+
"<unk>",
|
33 |
+
"<s>",
|
34 |
+
"</s>"
|
35 |
+
],
|
36 |
+
"bos_token": "<s>",
|
37 |
+
"clean_up_tokenization_spaces": false,
|
38 |
+
"eos_token": "</s>",
|
39 |
+
"legacy": false,
|
40 |
+
"model_max_length": 1000000000000000019884624838656,
|
41 |
+
"pad_token": null,
|
42 |
+
"sp_model_kwargs": {},
|
43 |
+
"tokenizer_class": "LlamaTokenizer",
|
44 |
+
"unk_token": "<unk>",
|
45 |
+
"use_default_system_prompt": true
|
46 |
+
}
|