Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +17 -0
- config.json +30 -0
- mergekit_config.yml +30 -0
- merges.txt +0 -0
- model-00001-of-00082.safetensors +3 -0
- model-00002-of-00082.safetensors +3 -0
- model-00003-of-00082.safetensors +3 -0
- model-00004-of-00082.safetensors +3 -0
- model-00005-of-00082.safetensors +3 -0
- model-00006-of-00082.safetensors +3 -0
- model-00007-of-00082.safetensors +3 -0
- model-00008-of-00082.safetensors +3 -0
- model-00009-of-00082.safetensors +3 -0
- model-00010-of-00082.safetensors +3 -0
- model-00011-of-00082.safetensors +3 -0
- model-00012-of-00082.safetensors +3 -0
- model-00013-of-00082.safetensors +3 -0
- model-00014-of-00082.safetensors +3 -0
- model-00015-of-00082.safetensors +3 -0
- model-00016-of-00082.safetensors +3 -0
- model-00017-of-00082.safetensors +3 -0
- model-00018-of-00082.safetensors +3 -0
- model-00019-of-00082.safetensors +3 -0
- model-00020-of-00082.safetensors +3 -0
- model-00021-of-00082.safetensors +3 -0
- model-00022-of-00082.safetensors +3 -0
- model-00023-of-00082.safetensors +3 -0
- model-00024-of-00082.safetensors +3 -0
- model-00025-of-00082.safetensors +3 -0
- model-00026-of-00082.safetensors +3 -0
- model-00027-of-00082.safetensors +3 -0
- model-00028-of-00082.safetensors +3 -0
- model-00029-of-00082.safetensors +3 -0
- model-00030-of-00082.safetensors +3 -0
- model-00031-of-00082.safetensors +3 -0
- model-00032-of-00082.safetensors +3 -0
- model-00033-of-00082.safetensors +3 -0
- model-00034-of-00082.safetensors +3 -0
- model-00035-of-00082.safetensors +3 -0
- model-00036-of-00082.safetensors +3 -0
- model-00037-of-00082.safetensors +3 -0
- model-00038-of-00082.safetensors +3 -0
- model-00039-of-00082.safetensors +3 -0
- model-00040-of-00082.safetensors +3 -0
- model-00041-of-00082.safetensors +3 -0
- model-00042-of-00082.safetensors +3 -0
- model-00043-of-00082.safetensors +3 -0
- model-00044-of-00082.safetensors +3 -0
- model-00045-of-00082.safetensors +3 -0
- model-00046-of-00082.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
tags:
|
4 |
+
- merge
|
5 |
+
- mergekit
|
6 |
+
- lazymergekit
|
7 |
+
- davidkim205/Rhea-72b-v0.5
|
8 |
+
- abacusai/Smaug-72B-v0.1
|
9 |
+
---
|
10 |
+
|
11 |
+
# TW3-JRGL-v3
|
12 |
+
|
13 |
+
TW3-JRGL-v3 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
|
14 |
+
* [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
|
15 |
+
* [abacusai/Smaug-72B-v0.1](https://huggingface.co/abacusai/Smaug-72B-v0.1)
|
16 |
+
|
17 |
+
## 🧩 Configuration
|
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "davidkim205/Rhea-72b-v0.5",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 151643,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 24576,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 64,
|
19 |
+
"pad_token_id": 151643,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-06,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 1000000,
|
24 |
+
"seq_length": 32768,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "bfloat16",
|
27 |
+
"transformers_version": "4.39.3",
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 152064
|
30 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_model: davidkim205/Rhea-72b-v0.5
|
2 |
+
dtype: bfloat16
|
3 |
+
merge_method: slerp
|
4 |
+
parameters:
|
5 |
+
t:
|
6 |
+
- filter: self_attn
|
7 |
+
value:
|
8 |
+
- 0
|
9 |
+
- 0.5
|
10 |
+
- 0.3
|
11 |
+
- 0.7
|
12 |
+
- 1
|
13 |
+
- filter: mlp
|
14 |
+
value:
|
15 |
+
- 1
|
16 |
+
- 0.5
|
17 |
+
- 0.7
|
18 |
+
- 0.3
|
19 |
+
- 0
|
20 |
+
- value: 0.5
|
21 |
+
slices:
|
22 |
+
- sources:
|
23 |
+
- layer_range:
|
24 |
+
- 0
|
25 |
+
- 80
|
26 |
+
model: davidkim205/Rhea-72b-v0.5
|
27 |
+
- layer_range:
|
28 |
+
- 0
|
29 |
+
- 80
|
30 |
+
model: abacusai/Smaug-72B-v0.1
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1aa619fc57e556b10c1fcfb5c1ef908be156450c312e6bcd6de6baf66ba93aa
|
3 |
+
size 1879164616
|
model-00002-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c34db1e04e4ee00d58c91d63896a8141a1232bec0eb2f2f99ce65b855678962
|
3 |
+
size 402703024
|
model-00003-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fa1a10feeab788c76005956249f06f5be60675a35069fdde009ceea4e5574ae
|
3 |
+
size 2491416720
|
model-00004-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c98d30f323e67d68b81920e502ad6a341eb72a98670cb4dd5bd1f65b07dec87b
|
3 |
+
size 1879164616
|
model-00005-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4565403fda6b1c51ce0f84699e05a1494e0a45e387220471053940040577464
|
3 |
+
size 1879164608
|
model-00006-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c54d21b47d6108c6856a402f32b07e96cdcf39a3f6ce5e3763d545318af45c3e
|
3 |
+
size 1610646216
|
model-00007-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77ae7e645d2365510c7a7463753f852b8ddf80bc2b9851fac8a5210ed432ea89
|
3 |
+
size 1744930280
|
model-00008-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c20636827a86ba04a498fe009b3de1c7194c300548ea46882f8c829c2834be51
|
3 |
+
size 1744930280
|
model-00009-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50fe9dbd9c7a4b040dfbe222b4ae8969720fc2d0c4a3c85f4a1136227fdc0430
|
3 |
+
size 1879131376
|
model-00010-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5a27df72b5d63753c039e3966b1d65fe6babe0da773909206dfc6ff25a8386c
|
3 |
+
size 1879148128
|
model-00011-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b479e8e92466a6b5d226fe5105436c3b43539e70f1c31cf6f44462691df6ecce
|
3 |
+
size 1879164616
|
model-00012-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30ec100626c74d113e7076ae1af96869de83d5bc90147fbcc51d399381d5c790
|
3 |
+
size 1610712664
|
model-00013-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da80bc929bd03725a6fc2a0252f16e52e9ad67c2489366d5bfb588347511e39c
|
3 |
+
size 1744930288
|
model-00014-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:430fff64ab1496ea0a379d7ba12517caa5cd95d7a2e2918a4689d1c5807b42b8
|
3 |
+
size 1879214112
|
model-00015-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40fbfbc183146026b8ceaeb259718c755c55430ad768065aca4d497b89d8ab4d
|
3 |
+
size 1879148136
|
model-00016-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0e6aab4f8429f361c084facea5fff49a2c66a1a66567ed881b575f721d07bf2
|
3 |
+
size 1879164632
|
model-00017-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1371224310cb5320c08cf34f5803717b2cb25d93acb9dbd628d230fa309d5019
|
3 |
+
size 1610695936
|
model-00018-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09d01140eb55ad5f2c11b00d72112003f9e96adafd7b2b4fac53a6386de52aef
|
3 |
+
size 1744930288
|
model-00019-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da0df6d432d1ce6cfa62402dbf838d54cb27e4967654e1e90345c94e4a4f570e
|
3 |
+
size 1744930288
|
model-00020-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f772dd83cef6c1915a67133b4aae75b9bc52e093c7cded9b09a4e2f13b57f90
|
3 |
+
size 1610646216
|
model-00021-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:123838a9ef7ad1e952005cbd7c88c25273c17686a27d71be69341e7d4f96d393
|
3 |
+
size 1744930288
|
model-00022-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba9d9c312d463d47db83ff0857c00fc125599b0477bb2355ec0f248f60a66755
|
3 |
+
size 1744930288
|
model-00023-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eab3c0087e6316c01b57fa7e5a099c1c7624cfd442fc79daa272faa2c6039c38
|
3 |
+
size 1879181112
|
model-00024-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3309ec94e79dac73aaa8a70b0b381ef07ce5457763d900b9fc20623f4ff689ad
|
3 |
+
size 1879148128
|
model-00025-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8e16d577c8ae740535f7c3e4c4c0487081324a244e59d594915ce216b35c71b
|
3 |
+
size 1744930280
|
model-00026-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5ba1399d9553847b497b281443b2be7cd0f69b172781ec52f96edab42c4214a
|
3 |
+
size 1744897296
|
model-00027-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04afa2f75a90c48e3bcc90a23e57f41ab7c2b2f077f173661faf8c7cf08b2f2d
|
3 |
+
size 1744930288
|
model-00028-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1889cfe68fe8c09d6a365643858f21ea8dffb834f457e1be0c33e3b85d7143fd
|
3 |
+
size 1879247336
|
model-00029-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:418e5878b85e1888ba43e8e09aafb2f46a74f0ef9c2658105b3f611bfe8d82fb
|
3 |
+
size 1744930280
|
model-00030-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83ac7fd38cf3dd5916e63d9f918a94250889bb236657d1fcb72fd0029c48501a
|
3 |
+
size 1744930280
|
model-00031-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7f06f40b47ac65566f6c7173ecc889158244c2ca6bcbdcf98a8663921dc8b25
|
3 |
+
size 1879114896
|
model-00032-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb822faccc3dee197f24933c5a6a2678394c5a40d0f31750025e8deb909c7d57
|
3 |
+
size 1744930288
|
model-00033-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f9ac94afeb2444951df56b73e84864e835b6c1a4c9aae5a527159bb0db65dd7
|
3 |
+
size 1744930288
|
model-00034-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ebbac9cd5111bb38fc8e455b7f7dc11e05771a123d54ed4794721c2aad40ee6
|
3 |
+
size 1879147896
|
model-00035-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84e0b1285910f4434c93f5a7f2959ed862dd7c1d97928c02533b3a69352c3245
|
3 |
+
size 1879164632
|
model-00036-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d36213a06e51901c910dd393c67e5429063436c64d3ecd7ee6a5e0c1f6509715
|
3 |
+
size 1610695944
|
model-00037-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9ddfff2b53722124cb91717e23177e264b6f54f808ce2e58d8421d40be54110
|
3 |
+
size 1744897296
|
model-00038-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecd8564c95e5cb681967c040aae5c86ece47a4606fdec33b1c3ad1089818fe6c
|
3 |
+
size 1744930288
|
model-00039-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b07325f5c85f5e3503a8163f3814a35c47090bcce883411e8196ede358696543
|
3 |
+
size 1879181112
|
model-00040-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7b864b230b60d754eb354f06f86cdf8d9b0c334dafabccb4ad7e10b2782f331
|
3 |
+
size 1879148136
|
model-00041-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c11fcc495539e78a529a50b0f5fc9f1e76efb3627e79fe4a4da212f07871ab07
|
3 |
+
size 1879164632
|
model-00042-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09151e7a24ce60c458484a2c7f347ed320fc9d1978a4350ddf22dfcfd2e28960
|
3 |
+
size 1879164624
|
model-00043-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52c30be8105596ba059d13a8f534be0df8e49f3e6b74e5049317c479ebcbf09a
|
3 |
+
size 1744930288
|
model-00044-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c97d71ddcaa9a2d15b620f3a9352f1987dbe2f4633d240a6ef96788bd1dfa16a
|
3 |
+
size 1879214112
|
model-00045-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e136b4de7e848f53e4eff313b28d06524ee6e5e0d5cc49af230dca2da287a10
|
3 |
+
size 1879148128
|
model-00046-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b79db05574e84a511f437a59c3ca1a30c4a98afddeb806eba0debf8199244cc
|
3 |
+
size 1744930280
|