Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +17 -0
- config.json +30 -0
- mergekit_config.yml +30 -0
- merges.txt +0 -0
- model-00001-of-00082.safetensors +3 -0
- model-00002-of-00082.safetensors +3 -0
- model-00003-of-00082.safetensors +3 -0
- model-00004-of-00082.safetensors +3 -0
- model-00005-of-00082.safetensors +3 -0
- model-00006-of-00082.safetensors +3 -0
- model-00007-of-00082.safetensors +3 -0
- model-00008-of-00082.safetensors +3 -0
- model-00009-of-00082.safetensors +3 -0
- model-00010-of-00082.safetensors +3 -0
- model-00011-of-00082.safetensors +3 -0
- model-00012-of-00082.safetensors +3 -0
- model-00013-of-00082.safetensors +3 -0
- model-00014-of-00082.safetensors +3 -0
- model-00015-of-00082.safetensors +3 -0
- model-00016-of-00082.safetensors +3 -0
- model-00017-of-00082.safetensors +3 -0
- model-00018-of-00082.safetensors +3 -0
- model-00019-of-00082.safetensors +3 -0
- model-00020-of-00082.safetensors +3 -0
- model-00021-of-00082.safetensors +3 -0
- model-00022-of-00082.safetensors +3 -0
- model-00023-of-00082.safetensors +3 -0
- model-00024-of-00082.safetensors +3 -0
- model-00025-of-00082.safetensors +3 -0
- model-00026-of-00082.safetensors +3 -0
- model-00027-of-00082.safetensors +3 -0
- model-00028-of-00082.safetensors +3 -0
- model-00029-of-00082.safetensors +3 -0
- model-00030-of-00082.safetensors +3 -0
- model-00031-of-00082.safetensors +3 -0
- model-00032-of-00082.safetensors +3 -0
- model-00033-of-00082.safetensors +3 -0
- model-00034-of-00082.safetensors +3 -0
- model-00035-of-00082.safetensors +3 -0
- model-00036-of-00082.safetensors +3 -0
- model-00037-of-00082.safetensors +3 -0
- model-00038-of-00082.safetensors +3 -0
- model-00039-of-00082.safetensors +3 -0
- model-00040-of-00082.safetensors +3 -0
- model-00041-of-00082.safetensors +3 -0
- model-00042-of-00082.safetensors +3 -0
- model-00043-of-00082.safetensors +3 -0
- model-00044-of-00082.safetensors +3 -0
- model-00045-of-00082.safetensors +3 -0
- model-00046-of-00082.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
tags:
|
4 |
+
- merge
|
5 |
+
- mergekit
|
6 |
+
- lazymergekit
|
7 |
+
- MTSAIR/MultiVerse_70B
|
8 |
+
- davidkim205/Rhea-72b-v0.5
|
9 |
+
---
|
10 |
+
|
11 |
+
# TW3-JRGL-v2
|
12 |
+
|
13 |
+
TW3-JRGL-v2 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
|
14 |
+
* [MTSAIR/MultiVerse_70B](https://huggingface.co/MTSAIR/MultiVerse_70B)
|
15 |
+
* [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
|
16 |
+
|
17 |
+
## 🧩 Configuration
|
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "davidkim205/Rhea-72b-v0.5",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 151643,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 24576,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 64,
|
19 |
+
"pad_token_id": 151643,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-06,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 1000000,
|
24 |
+
"seq_length": 32768,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "bfloat16",
|
27 |
+
"transformers_version": "4.39.2",
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 152064
|
30 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_model: davidkim205/Rhea-72b-v0.5
|
2 |
+
dtype: bfloat16
|
3 |
+
merge_method: slerp
|
4 |
+
parameters:
|
5 |
+
t:
|
6 |
+
- filter: self_attn
|
7 |
+
value:
|
8 |
+
- 0
|
9 |
+
- 0.5
|
10 |
+
- 0.3
|
11 |
+
- 0.7
|
12 |
+
- 1
|
13 |
+
- filter: mlp
|
14 |
+
value:
|
15 |
+
- 1
|
16 |
+
- 0.5
|
17 |
+
- 0.7
|
18 |
+
- 0.3
|
19 |
+
- 0
|
20 |
+
- value: 0.5
|
21 |
+
slices:
|
22 |
+
- sources:
|
23 |
+
- layer_range:
|
24 |
+
- 0
|
25 |
+
- 80
|
26 |
+
model: MTSAIR/MultiVerse_70B
|
27 |
+
- layer_range:
|
28 |
+
- 0
|
29 |
+
- 80
|
30 |
+
model: davidkim205/Rhea-72b-v0.5
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eedc51c6396b392ec6641830b7ed3f3a0a346b9a656e999c20806ceec2825a77
|
3 |
+
size 1879164616
|
model-00002-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c34db1e04e4ee00d58c91d63896a8141a1232bec0eb2f2f99ce65b855678962
|
3 |
+
size 402703024
|
model-00003-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d48975c6f125467e8fe47430e4d51409a2e89e3f6b4ca527bb0f26ef297ea9c9
|
3 |
+
size 2491416720
|
model-00004-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab25f323b498ef4f8dbfdd3b8d7ad0e63b3007fb1468546bcfae7c396582cc68
|
3 |
+
size 1879164616
|
model-00005-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df98503657aeb6ec5dcf1ee96f43cd8e266996aa3d2e61776d059b96841e0635
|
3 |
+
size 1879164608
|
model-00006-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:572cf03812d04a59252a437be65f3802e67be3a9ce7aef56c36a3f87490b622a
|
3 |
+
size 1610646216
|
model-00007-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f6e579aae7b9a22d3aeb0704f3d10191300d92e409b6d7ec1ae49382532a0a
|
3 |
+
size 1744930280
|
model-00008-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d6551d8fcb2097cd53026af5535bf3dca19a528987276bb91f320b74476448
|
3 |
+
size 1744930280
|
model-00009-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d57ed1d7201cdca52314f8afc331e54ebaa0e7b11d0a7f850237435387805c8
|
3 |
+
size 1879131376
|
model-00010-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:946448ec4f71b8089f14cfbec10affdfc454798dce33db34a20d64febbca7066
|
3 |
+
size 1879148128
|
model-00011-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa1a7f64f5075e0beadffa8f0e161b397c6101b2292cb1e6431618d63d824d81
|
3 |
+
size 1879164616
|
model-00012-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a229c5a1b37951b1d0c13063ff145e69d816db7d01e548472a696bddf736165c
|
3 |
+
size 1610712664
|
model-00013-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c89fefcca6df002f41335619f585ad688203d3e933035feae4ec04eb83c22dfb
|
3 |
+
size 1744930288
|
model-00014-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af60c769546207441d550b05eacba983bf949763913e1da933cad77b29ad30da
|
3 |
+
size 1879214112
|
model-00015-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c17a40f6777fe1ad888d80dd5ee06a82f6500cc87051f452ba0e2c271e706db
|
3 |
+
size 1879148136
|
model-00016-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e0b87eed1b36e9c605010f59d24e91774a8beb45ba9fe938eab48994a0b0287
|
3 |
+
size 1879164632
|
model-00017-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e686306551a3d172e19c50ff11662b5a8077ad3e1b9aef5819c4c80fbfdf557
|
3 |
+
size 1610695936
|
model-00018-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67e8a93da77752c2b140838282aaddfe7f74d7ceda635ad637976ec796b6985c
|
3 |
+
size 1744930288
|
model-00019-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36624dd4333682f6d65b9c8591f2a5ae12c5ed7eacba884e26961f8efc149645
|
3 |
+
size 1744930288
|
model-00020-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f1b0c97be489fe7783fbf88634354b1fa73b7be9d72d9ef51a131453e46f93d
|
3 |
+
size 1610646216
|
model-00021-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b19690f1fd29e5c06f550bc25cc9a59a73ddb6de29cb9387872afa74749d4d3e
|
3 |
+
size 1744930288
|
model-00022-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3da763e9cff37326791913cce58263aae7a15e4c3a9e3963aa186518ebf1b124
|
3 |
+
size 1744930288
|
model-00023-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10c0d64f603c2a66d3a01a21c9443c78c1bf1295aa8d3923b33f0ede366c3dec
|
3 |
+
size 1879181112
|
model-00024-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e115a87e07652c0d649fa521a960c52e37c78cfd6d1da6771a8558683366b72
|
3 |
+
size 1879148128
|
model-00025-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e05f10d47da4a6a38fa331727addd8a5ff9b176ad94cbfb1aa2bed70ff761356
|
3 |
+
size 1744930280
|
model-00026-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e18cfc30dd1d600662925cd2d3e3a8f93ce03b07ab5f654ec88e6717c767dc97
|
3 |
+
size 1744897296
|
model-00027-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d852c385419e928d192c9919de1c56de24e8598947c90a0a10d0fddbd04b899
|
3 |
+
size 1744930288
|
model-00028-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cbf2a11a468a4217dc117f6a9114b228d10115b7810a80c6f1b04cd74fd9742
|
3 |
+
size 1879247336
|
model-00029-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a728c2c94c4e47df0c1d9ee42936cea60e8dac11e5b8571ccdbc4812c15e7c99
|
3 |
+
size 1744930280
|
model-00030-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b5afd5a4f97ba61b58c7fcbd75cb81d660f7af0e7ffa1521ca477fb566a976c
|
3 |
+
size 1744930280
|
model-00031-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcbb94368adabaad40fa746901488d590fc0c9c4b6ed67d4ed8e994c5a2c0e82
|
3 |
+
size 1879114896
|
model-00032-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49dee2c2a0c0b77b5a8fec1dd67085e68f66a93a42e095f55d977c41a6a8e9a2
|
3 |
+
size 1744930288
|
model-00033-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbe45bdca934edf458ed22ccacc8a502f68112fd80ac984d2cac4e21cceb4c04
|
3 |
+
size 1744930288
|
model-00034-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c26913aae122b3797b9870b4afe04d6306648a626b4493c30b3510d1c5280b3d
|
3 |
+
size 1879147896
|
model-00035-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37676346cd04369df7153defc664e6f21341d238c4c8c05b75510f2cf55403ba
|
3 |
+
size 1879164632
|
model-00036-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:548cb0362c6b3cd41537dcb25bd835ef73edf7d09c895c8fac8e946ad2ef651a
|
3 |
+
size 1610695944
|
model-00037-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6e70bf1693e6843099f57b79cbbe98c9a3c1f681aaa8715641b5298758cdae3
|
3 |
+
size 1744897296
|
model-00038-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b2b8a8d89d06fe779e20c0c02eb23617d6e6a4a17ecd10f692ebdf60a4ce1ff
|
3 |
+
size 1744930288
|
model-00039-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33f3cb76d394f073e9af5be82efc84e56b63e1745b1e3afdcbe5f89cbceb007c
|
3 |
+
size 1879181112
|
model-00040-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e467891902de88d4794f0baffa6d55dfa49965a0c6600002412cc188cf34c0e
|
3 |
+
size 1879148136
|
model-00041-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e6ae2a58955d7dcb904e90155a64ca8edb97f94e2c99b9b96800438125b531a
|
3 |
+
size 1879164632
|
model-00042-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad687b8c63ffb736b1cf704498366028f42732ecbe178b8a9f14a7143737881f
|
3 |
+
size 1879164624
|
model-00043-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef41c16a937ed68475b4107e7162efcfc202be6191a7808240d5747f995ca647
|
3 |
+
size 1744930288
|
model-00044-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daca48d3ae4e5558b6683c312bc862deb9dcaa9317b3cc6a6759bd1fefcbd662
|
3 |
+
size 1879214112
|
model-00045-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9c7e8d5bc47d3ca2ffb8e6619b9e30c76414f62bac9d00606ec9544aafc1da8
|
3 |
+
size 1879148128
|
model-00046-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb402cda328c560304996d99e0931be029f79b946139e4c216d2ff641cc2db47
|
3 |
+
size 1744930280
|