paloalma committed on
Commit
217a060
1 Parent(s): 5073eea

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +17 -0
  2. config.json +30 -0
  3. mergekit_config.yml +30 -0
  4. merges.txt +0 -0
  5. model-00001-of-00082.safetensors +3 -0
  6. model-00002-of-00082.safetensors +3 -0
  7. model-00003-of-00082.safetensors +3 -0
  8. model-00004-of-00082.safetensors +3 -0
  9. model-00005-of-00082.safetensors +3 -0
  10. model-00006-of-00082.safetensors +3 -0
  11. model-00007-of-00082.safetensors +3 -0
  12. model-00008-of-00082.safetensors +3 -0
  13. model-00009-of-00082.safetensors +3 -0
  14. model-00010-of-00082.safetensors +3 -0
  15. model-00011-of-00082.safetensors +3 -0
  16. model-00012-of-00082.safetensors +3 -0
  17. model-00013-of-00082.safetensors +3 -0
  18. model-00014-of-00082.safetensors +3 -0
  19. model-00015-of-00082.safetensors +3 -0
  20. model-00016-of-00082.safetensors +3 -0
  21. model-00017-of-00082.safetensors +3 -0
  22. model-00018-of-00082.safetensors +3 -0
  23. model-00019-of-00082.safetensors +3 -0
  24. model-00020-of-00082.safetensors +3 -0
  25. model-00021-of-00082.safetensors +3 -0
  26. model-00022-of-00082.safetensors +3 -0
  27. model-00023-of-00082.safetensors +3 -0
  28. model-00024-of-00082.safetensors +3 -0
  29. model-00025-of-00082.safetensors +3 -0
  30. model-00026-of-00082.safetensors +3 -0
  31. model-00027-of-00082.safetensors +3 -0
  32. model-00028-of-00082.safetensors +3 -0
  33. model-00029-of-00082.safetensors +3 -0
  34. model-00030-of-00082.safetensors +3 -0
  35. model-00031-of-00082.safetensors +3 -0
  36. model-00032-of-00082.safetensors +3 -0
  37. model-00033-of-00082.safetensors +3 -0
  38. model-00034-of-00082.safetensors +3 -0
  39. model-00035-of-00082.safetensors +3 -0
  40. model-00036-of-00082.safetensors +3 -0
  41. model-00037-of-00082.safetensors +3 -0
  42. model-00038-of-00082.safetensors +3 -0
  43. model-00039-of-00082.safetensors +3 -0
  44. model-00040-of-00082.safetensors +3 -0
  45. model-00041-of-00082.safetensors +3 -0
  46. model-00042-of-00082.safetensors +3 -0
  47. model-00043-of-00082.safetensors +3 -0
  48. model-00044-of-00082.safetensors +3 -0
  49. model-00045-of-00082.safetensors +3 -0
  50. model-00046-of-00082.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - MTSAIR/MultiVerse_70B
8
+ - davidkim205/Rhea-72b-v0.5
9
+ ---
10
+
11
+ # TW3-JRGL-v2
12
+
13
+ TW3-JRGL-v2 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [MTSAIR/MultiVerse_70B](https://huggingface.co/MTSAIR/MultiVerse_70B)
15
+ * [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
16
+
17
+ ## 🧩 Configuration
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "davidkim205/Rhea-72b-v0.5",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": true,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 151643,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 64,
19
+ "pad_token_id": 151643,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": null,
23
+ "rope_theta": 1000000,
24
+ "seq_length": 32768,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.39.2",
28
+ "use_cache": true,
29
+ "vocab_size": 152064
30
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: davidkim205/Rhea-72b-v0.5
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+ t:
6
+ - filter: self_attn
7
+ value:
8
+ - 0
9
+ - 0.5
10
+ - 0.3
11
+ - 0.7
12
+ - 1
13
+ - filter: mlp
14
+ value:
15
+ - 1
16
+ - 0.5
17
+ - 0.7
18
+ - 0.3
19
+ - 0
20
+ - value: 0.5
21
+ slices:
22
+ - sources:
23
+ - layer_range:
24
+ - 0
25
+ - 80
26
+ model: MTSAIR/MultiVerse_70B
27
+ - layer_range:
28
+ - 0
29
+ - 80
30
+ model: davidkim205/Rhea-72b-v0.5
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eedc51c6396b392ec6641830b7ed3f3a0a346b9a656e999c20806ceec2825a77
3
+ size 1879164616
model-00002-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c34db1e04e4ee00d58c91d63896a8141a1232bec0eb2f2f99ce65b855678962
3
+ size 402703024
model-00003-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d48975c6f125467e8fe47430e4d51409a2e89e3f6b4ca527bb0f26ef297ea9c9
3
+ size 2491416720
model-00004-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab25f323b498ef4f8dbfdd3b8d7ad0e63b3007fb1468546bcfae7c396582cc68
3
+ size 1879164616
model-00005-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df98503657aeb6ec5dcf1ee96f43cd8e266996aa3d2e61776d059b96841e0635
3
+ size 1879164608
model-00006-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:572cf03812d04a59252a437be65f3802e67be3a9ce7aef56c36a3f87490b622a
3
+ size 1610646216
model-00007-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0f6e579aae7b9a22d3aeb0704f3d10191300d92e409b6d7ec1ae49382532a0a
3
+ size 1744930280
model-00008-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37d6551d8fcb2097cd53026af5535bf3dca19a528987276bb91f320b74476448
3
+ size 1744930280
model-00009-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d57ed1d7201cdca52314f8afc331e54ebaa0e7b11d0a7f850237435387805c8
3
+ size 1879131376
model-00010-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:946448ec4f71b8089f14cfbec10affdfc454798dce33db34a20d64febbca7066
3
+ size 1879148128
model-00011-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa1a7f64f5075e0beadffa8f0e161b397c6101b2292cb1e6431618d63d824d81
3
+ size 1879164616
model-00012-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a229c5a1b37951b1d0c13063ff145e69d816db7d01e548472a696bddf736165c
3
+ size 1610712664
model-00013-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c89fefcca6df002f41335619f585ad688203d3e933035feae4ec04eb83c22dfb
3
+ size 1744930288
model-00014-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af60c769546207441d550b05eacba983bf949763913e1da933cad77b29ad30da
3
+ size 1879214112
model-00015-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c17a40f6777fe1ad888d80dd5ee06a82f6500cc87051f452ba0e2c271e706db
3
+ size 1879148136
model-00016-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e0b87eed1b36e9c605010f59d24e91774a8beb45ba9fe938eab48994a0b0287
3
+ size 1879164632
model-00017-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e686306551a3d172e19c50ff11662b5a8077ad3e1b9aef5819c4c80fbfdf557
3
+ size 1610695936
model-00018-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67e8a93da77752c2b140838282aaddfe7f74d7ceda635ad637976ec796b6985c
3
+ size 1744930288
model-00019-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36624dd4333682f6d65b9c8591f2a5ae12c5ed7eacba884e26961f8efc149645
3
+ size 1744930288
model-00020-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f1b0c97be489fe7783fbf88634354b1fa73b7be9d72d9ef51a131453e46f93d
3
+ size 1610646216
model-00021-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b19690f1fd29e5c06f550bc25cc9a59a73ddb6de29cb9387872afa74749d4d3e
3
+ size 1744930288
model-00022-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3da763e9cff37326791913cce58263aae7a15e4c3a9e3963aa186518ebf1b124
3
+ size 1744930288
model-00023-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10c0d64f603c2a66d3a01a21c9443c78c1bf1295aa8d3923b33f0ede366c3dec
3
+ size 1879181112
model-00024-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e115a87e07652c0d649fa521a960c52e37c78cfd6d1da6771a8558683366b72
3
+ size 1879148128
model-00025-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e05f10d47da4a6a38fa331727addd8a5ff9b176ad94cbfb1aa2bed70ff761356
3
+ size 1744930280
model-00026-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e18cfc30dd1d600662925cd2d3e3a8f93ce03b07ab5f654ec88e6717c767dc97
3
+ size 1744897296
model-00027-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d852c385419e928d192c9919de1c56de24e8598947c90a0a10d0fddbd04b899
3
+ size 1744930288
model-00028-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cbf2a11a468a4217dc117f6a9114b228d10115b7810a80c6f1b04cd74fd9742
3
+ size 1879247336
model-00029-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a728c2c94c4e47df0c1d9ee42936cea60e8dac11e5b8571ccdbc4812c15e7c99
3
+ size 1744930280
model-00030-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b5afd5a4f97ba61b58c7fcbd75cb81d660f7af0e7ffa1521ca477fb566a976c
3
+ size 1744930280
model-00031-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcbb94368adabaad40fa746901488d590fc0c9c4b6ed67d4ed8e994c5a2c0e82
3
+ size 1879114896
model-00032-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49dee2c2a0c0b77b5a8fec1dd67085e68f66a93a42e095f55d977c41a6a8e9a2
3
+ size 1744930288
model-00033-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbe45bdca934edf458ed22ccacc8a502f68112fd80ac984d2cac4e21cceb4c04
3
+ size 1744930288
model-00034-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c26913aae122b3797b9870b4afe04d6306648a626b4493c30b3510d1c5280b3d
3
+ size 1879147896
model-00035-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37676346cd04369df7153defc664e6f21341d238c4c8c05b75510f2cf55403ba
3
+ size 1879164632
model-00036-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:548cb0362c6b3cd41537dcb25bd835ef73edf7d09c895c8fac8e946ad2ef651a
3
+ size 1610695944
model-00037-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6e70bf1693e6843099f57b79cbbe98c9a3c1f681aaa8715641b5298758cdae3
3
+ size 1744897296
model-00038-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b2b8a8d89d06fe779e20c0c02eb23617d6e6a4a17ecd10f692ebdf60a4ce1ff
3
+ size 1744930288
model-00039-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33f3cb76d394f073e9af5be82efc84e56b63e1745b1e3afdcbe5f89cbceb007c
3
+ size 1879181112
model-00040-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e467891902de88d4794f0baffa6d55dfa49965a0c6600002412cc188cf34c0e
3
+ size 1879148136
model-00041-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e6ae2a58955d7dcb904e90155a64ca8edb97f94e2c99b9b96800438125b531a
3
+ size 1879164632
model-00042-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad687b8c63ffb736b1cf704498366028f42732ecbe178b8a9f14a7143737881f
3
+ size 1879164624
model-00043-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef41c16a937ed68475b4107e7162efcfc202be6191a7808240d5747f995ca647
3
+ size 1744930288
model-00044-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daca48d3ae4e5558b6683c312bc862deb9dcaa9317b3cc6a6759bd1fefcbd662
3
+ size 1879214112
model-00045-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9c7e8d5bc47d3ca2ffb8e6619b9e30c76414f62bac9d00606ec9544aafc1da8
3
+ size 1879148128
model-00046-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb402cda328c560304996d99e0931be029f79b946139e4c216d2ff641cc2db47
3
+ size 1744930280