paloalma committed on
Commit
68bd1f7
1 Parent(s): 9cfd24d

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +17 -0
  2. added_tokens.json +3 -0
  3. config.json +30 -0
  4. mergekit_config.yml +30 -0
  5. merges.txt +0 -0
  6. model-00001-of-00082.safetensors +3 -0
  7. model-00002-of-00082.safetensors +3 -0
  8. model-00003-of-00082.safetensors +3 -0
  9. model-00004-of-00082.safetensors +3 -0
  10. model-00005-of-00082.safetensors +3 -0
  11. model-00006-of-00082.safetensors +3 -0
  12. model-00007-of-00082.safetensors +3 -0
  13. model-00008-of-00082.safetensors +3 -0
  14. model-00009-of-00082.safetensors +3 -0
  15. model-00010-of-00082.safetensors +3 -0
  16. model-00011-of-00082.safetensors +3 -0
  17. model-00012-of-00082.safetensors +3 -0
  18. model-00013-of-00082.safetensors +3 -0
  19. model-00014-of-00082.safetensors +3 -0
  20. model-00015-of-00082.safetensors +3 -0
  21. model-00016-of-00082.safetensors +3 -0
  22. model-00017-of-00082.safetensors +3 -0
  23. model-00018-of-00082.safetensors +3 -0
  24. model-00019-of-00082.safetensors +3 -0
  25. model-00020-of-00082.safetensors +3 -0
  26. model-00021-of-00082.safetensors +3 -0
  27. model-00022-of-00082.safetensors +3 -0
  28. model-00023-of-00082.safetensors +3 -0
  29. model-00024-of-00082.safetensors +3 -0
  30. model-00025-of-00082.safetensors +3 -0
  31. model-00026-of-00082.safetensors +3 -0
  32. model-00027-of-00082.safetensors +3 -0
  33. model-00028-of-00082.safetensors +3 -0
  34. model-00029-of-00082.safetensors +3 -0
  35. model-00030-of-00082.safetensors +3 -0
  36. model-00031-of-00082.safetensors +3 -0
  37. model-00032-of-00082.safetensors +3 -0
  38. model-00033-of-00082.safetensors +3 -0
  39. model-00034-of-00082.safetensors +3 -0
  40. model-00035-of-00082.safetensors +3 -0
  41. model-00036-of-00082.safetensors +3 -0
  42. model-00037-of-00082.safetensors +3 -0
  43. model-00038-of-00082.safetensors +3 -0
  44. model-00039-of-00082.safetensors +3 -0
  45. model-00040-of-00082.safetensors +3 -0
  46. model-00041-of-00082.safetensors +3 -0
  47. model-00042-of-00082.safetensors +3 -0
  48. model-00043-of-00082.safetensors +3 -0
  49. model-00044-of-00082.safetensors +3 -0
  50. model-00045-of-00082.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - migtissera/Tess-72B-v1.5b
8
+ - davidkim205/Rhea-72b-v0.5
9
+ ---
10
+
11
+ # TW3-JRGL-v4
12
+
13
+ TW3-JRGL-v4 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [migtissera/Tess-72B-v1.5b](https://huggingface.co/migtissera/Tess-72B-v1.5b)
15
+ * [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
16
+
17
+ ## 🧩 Configuration
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[PAD]": 151851
3
+ }
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "migtissera/Tess-72B-v1.5b",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": true,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128245,
9
+ "eos_token_id": 128247,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 64,
19
+ "pad_token_id": 151643,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": null,
23
+ "rope_theta": 1000000,
24
+ "seq_length": 32768,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.39.3",
28
+ "use_cache": false,
29
+ "vocab_size": 152064
30
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: migtissera/Tess-72B-v1.5b
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+ t:
6
+ - filter: self_attn
7
+ value:
8
+ - 0
9
+ - 0.5
10
+ - 0.3
11
+ - 0.7
12
+ - 1
13
+ - filter: mlp
14
+ value:
15
+ - 1
16
+ - 0.5
17
+ - 0.7
18
+ - 0.3
19
+ - 0
20
+ - value: 0.5
21
+ slices:
22
+ - sources:
23
+ - layer_range:
24
+ - 0
25
+ - 80
26
+ model: migtissera/Tess-72B-v1.5b
27
+ - layer_range:
28
+ - 0
29
+ - 80
30
+ model: davidkim205/Rhea-72b-v0.5
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b076fba39171b1f315254c357286e41f81c082572bc4aaf947e96cd92b5f58fb
3
+ size 1879164616
model-00002-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf66cecfbbf417ba05714ad6aaa6297be5626f111344f1ea02afe616bf0919d8
3
+ size 402703024
model-00003-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a43130851c7ad8e89a98e9efe296ded2bde233d177d5ae3ccd92e44e3a5a9df
3
+ size 2491416720
model-00004-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cffdb823c4185c67998755c21e53ac79aa37062e828f14279cac897be85d142
3
+ size 1879164616
model-00005-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f972250550d8270ce1505d3dc57484bdb9b8ecf439c64a628ff0b9eba9b38cc3
3
+ size 1879164608
model-00006-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7652acaaf081e4f05a1035426f9d5c7b886edffd15c4eca346c65ed3bdbd3cfd
3
+ size 1610646216
model-00007-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa26f86c541b957a56815b8c1dc0036831574876af51b3ede7885bdaa6884ac6
3
+ size 1744930280
model-00008-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28c1c7aaf672a137595dc53a3978d34f341ad80ff51930b72c1a7402cd3c39f0
3
+ size 1744930280
model-00009-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4142891839942a500e1eb509aca4d14510c37f22742dbc78e5b1ab831759bac0
3
+ size 1879131376
model-00010-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f66787cf9bfd4405016ded7cf99e7a6c19e8c7572a8277df2b3bad291be988ee
3
+ size 1879148128
model-00011-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a47ec7685d2b05e11071901d6744e5a23b6eeb24966437e7168910336f202c3
3
+ size 1879164616
model-00012-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a81d18b0e16ac4576045099d5e447e835f365b3f9cbd52b3edef9037b0c5911b
3
+ size 1610712664
model-00013-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f8bd9531bb00829755c5adf289694c5c2c75f801dd3c254f78e1371c3eee51d
3
+ size 1744930288
model-00014-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a18bcadedbf0f6da21672c623d5e84228ea43f56074845f1f6048cd3b19fd280
3
+ size 1879214112
model-00015-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e64783f011149fc6889ac4da2258ac7b0da9bd6fa72f8e07a60c033f46f08fa0
3
+ size 1879148136
model-00016-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cb2937f6beb04956dc805e2c4b4d13a70501418c499644d9022df7b67d8211f
3
+ size 1879164632
model-00017-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebd65edb71bf5ea57b27ff626e96f1856441a16936779f1882a91dda06e3691a
3
+ size 1610695936
model-00018-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28df20056453843e2a20fef4722a71581c1d5c1ce97ce212195248709de6ffb2
3
+ size 1744930288
model-00019-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a12d96df5f8b9f996df4e49b04efe1ba4c79f96aab28971ae78ffe71c9a50c6
3
+ size 1744930288
model-00020-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e68482fadbb7ddafb7cc48d7c87b1ba04ef57a13b1d6d7f10a7620364cac7f4d
3
+ size 1610646216
model-00021-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f55fd252981c4b4496994a35e69c308dd81709f4240428166e83c82ee0a05192
3
+ size 1744930288
model-00022-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea2ee36362167c098f85dca3f951242aaf16ca364aabb3b1a5cea6e22441aca8
3
+ size 1744930288
model-00023-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7ddc843e86e21322a91e45c46c436ddba7e9a1bd291792a02d6184fb96990ae
3
+ size 1879181112
model-00024-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34c925f1746b58160b1b33030054d50c55460f94c13286fcc667cf47d942ac96
3
+ size 1879148128
model-00025-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9974d20698c08ce4e59f40d83048020aec42069754f1127ba4bb045a7f96d95b
3
+ size 1744930280
model-00026-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bdab875af7115c5b444675c77f6639b789c34ee708b65e429fe8a4b41dae4b3
3
+ size 1744897296
model-00027-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7453aa485829f08c09f2215d5dcb2dacfdc82742f42e7d9ccbae462bf5da5407
3
+ size 1744930288
model-00028-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5a5e4e1b4f60a00b83ea65fd4df51f62afe6db0e45849b4750b43244e29b175
3
+ size 1879247336
model-00029-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0462f41dfea71d13337091296f71ef885a284aca61a975dac368701522018131
3
+ size 1744930280
model-00030-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63db7e907803c4a9841bce9b73219dcf8e9e493943b94daaf398b8bc01f222f2
3
+ size 1744930280
model-00031-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d606c8c96ae446716cdbba966778947fc8afd16f764ebe6c9c378e8ec1c45ef1
3
+ size 1879114896
model-00032-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aa7f0d92104f3d7fa7effa45e9d5eabb129ab8b651b5128d0d4575b93764e5d
3
+ size 1744930288
model-00033-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:883ecfd3bc0118fc3fa2686ed604193d1a0b489596512cf115721a0a74bf3382
3
+ size 1744930288
model-00034-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ec762ed683af045c83f1b183965046c2dda2254280f64b6d2ed2dda23feeac1
3
+ size 1879147896
model-00035-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abfa943d8ace0a21f18214bb37afe4cb3ab69933e678983a0082ed417c331c7d
3
+ size 1879164632
model-00036-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffccaa5bca70ffcfa339fdc80a779f8369e0d6075ed037732a12d8411cd050be
3
+ size 1610695944
model-00037-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7611617dee33c0d85a5f8d8104ffeb0108297d492cf3de36997fbfa7cc00c6e
3
+ size 1744897296
model-00038-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a11eafc0f96c785a2bc8ac952c7d81ec9b2251cbe32d98fc04a90aee3879dfc7
3
+ size 1744930288
model-00039-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4351ec87134658eda01e4799ea8108a40a5dd2c49cf38d3dc699f16f1e78537
3
+ size 1879181112
model-00040-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9c5cfa84f58955bd5029f0f416656f22f4b1bd264e62ea5eabc0c96859d0a8c
3
+ size 1879148136
model-00041-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43a56ae6bdf87b5d23a58a76650f8a7d93515e77099d739f698747e8dd01f070
3
+ size 1879164632
model-00042-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d221cf041935f6cfbc8210d5f0bcd6ea156106944f521adc08491e31e37c093f
3
+ size 1879164624
model-00043-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a55dda9830fc1b8f66a77905f88a39f33a244b30b53fb8be48c963ad58e15ef2
3
+ size 1744930288
model-00044-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f6dc79cf95ac4569b8c983ee85b1a3b488db6b8e7e8419e1256081cc27e05dc
3
+ size 1879214112
model-00045-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:909734628ea75aae199d55c6bfab6e5cb5b9eb4d7e4c9d289a4c8b469caf1b5c
3
+ size 1879148128