paloalma committed on
Commit
6ceede4
1 Parent(s): 0ca6de4

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +17 -0
  2. added_tokens.json +3 -0
  3. config.json +30 -0
  4. mergekit_config.yml +30 -0
  5. merges.txt +0 -0
  6. model-00001-of-00082.safetensors +3 -0
  7. model-00002-of-00082.safetensors +3 -0
  8. model-00003-of-00082.safetensors +3 -0
  9. model-00004-of-00082.safetensors +3 -0
  10. model-00005-of-00082.safetensors +3 -0
  11. model-00006-of-00082.safetensors +3 -0
  12. model-00007-of-00082.safetensors +3 -0
  13. model-00008-of-00082.safetensors +3 -0
  14. model-00009-of-00082.safetensors +3 -0
  15. model-00010-of-00082.safetensors +3 -0
  16. model-00011-of-00082.safetensors +3 -0
  17. model-00012-of-00082.safetensors +3 -0
  18. model-00013-of-00082.safetensors +3 -0
  19. model-00014-of-00082.safetensors +3 -0
  20. model-00015-of-00082.safetensors +3 -0
  21. model-00016-of-00082.safetensors +3 -0
  22. model-00017-of-00082.safetensors +3 -0
  23. model-00018-of-00082.safetensors +3 -0
  24. model-00019-of-00082.safetensors +3 -0
  25. model-00020-of-00082.safetensors +3 -0
  26. model-00021-of-00082.safetensors +3 -0
  27. model-00022-of-00082.safetensors +3 -0
  28. model-00023-of-00082.safetensors +3 -0
  29. model-00024-of-00082.safetensors +3 -0
  30. model-00025-of-00082.safetensors +3 -0
  31. model-00026-of-00082.safetensors +3 -0
  32. model-00027-of-00082.safetensors +3 -0
  33. model-00028-of-00082.safetensors +3 -0
  34. model-00029-of-00082.safetensors +3 -0
  35. model-00030-of-00082.safetensors +3 -0
  36. model-00031-of-00082.safetensors +3 -0
  37. model-00032-of-00082.safetensors +3 -0
  38. model-00033-of-00082.safetensors +3 -0
  39. model-00034-of-00082.safetensors +3 -0
  40. model-00035-of-00082.safetensors +3 -0
  41. model-00036-of-00082.safetensors +3 -0
  42. model-00037-of-00082.safetensors +3 -0
  43. model-00038-of-00082.safetensors +3 -0
  44. model-00039-of-00082.safetensors +3 -0
  45. model-00040-of-00082.safetensors +3 -0
  46. model-00041-of-00082.safetensors +3 -0
  47. model-00042-of-00082.safetensors +3 -0
  48. model-00043-of-00082.safetensors +3 -0
  49. model-00044-of-00082.safetensors +3 -0
  50. model-00045-of-00082.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - migtissera/Tess-72B-v1.5b
8
+ - abacusai/Smaug-72B-v0.1
9
+ ---
10
+
11
+ # ECE-TW3-JRGL-V3
12
+
13
+ ECE-TW3-JRGL-V3 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [migtissera/Tess-72B-v1.5b](https://huggingface.co/migtissera/Tess-72B-v1.5b)
15
+ * [abacusai/Smaug-72B-v0.1](https://huggingface.co/abacusai/Smaug-72B-v0.1)
16
+
17
+ ## 🧩 Configuration
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[PAD]": 151851
3
+ }
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "migtissera/Tess-72B-v1.5b",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": true,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128245,
9
+ "eos_token_id": 128247,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 64,
19
+ "pad_token_id": 151643,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": null,
23
+ "rope_theta": 1000000,
24
+ "seq_length": 32768,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.39.3",
28
+ "use_cache": false,
29
+ "vocab_size": 152064
30
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: migtissera/Tess-72B-v1.5b
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+ t:
6
+ - filter: self_attn
7
+ value:
8
+ - 0
9
+ - 0.5
10
+ - 0.3
11
+ - 0.7
12
+ - 1
13
+ - filter: mlp
14
+ value:
15
+ - 1
16
+ - 0.5
17
+ - 0.7
18
+ - 0.3
19
+ - 0
20
+ - value: 0.5
21
+ slices:
22
+ - sources:
23
+ - layer_range:
24
+ - 0
25
+ - 80
26
+ model: migtissera/Tess-72B-v1.5b
27
+ - layer_range:
28
+ - 0
29
+ - 80
30
+ model: abacusai/Smaug-72B-v0.1
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03c556d40850abccf7d25cf0fb1a081f51efb98af6bb627540641606be68c6b5
3
+ size 1879065656
model-00002-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67b881bbc5bc354c89978e8ec3535c1cb851b853891bb6de1ea8a0bb0ebfece0
3
+ size 402670048
model-00003-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a43130851c7ad8e89a98e9efe296ded2bde233d177d5ae3ccd92e44e3a5a9df
3
+ size 2491416720
model-00004-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f86236f418804108814d2d1791b23c7be957daa26a4c04bbbe9c93c1b13d4748
3
+ size 1879065656
model-00005-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd8b3835945902167d58e11592aebb582c7430d4e7c75bc135e5ccbd6afefde7
3
+ size 1879098632
model-00006-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b06578db796a63bc59f176f26121f8fc75c553e4562b605048382e67d27d750e
3
+ size 1610646216
model-00007-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a45576ce2744b561922a1b3da4e59da617a938b10e8c37ba66650c3778713492
3
+ size 1744864304
model-00008-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31574066e39a71fedd6073237dd92043951667b9d613e5fef5b547050092423e
3
+ size 1744864304
model-00009-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ede497a15f3235a377fe0f752c937240118f028bdf7433a35b72bcedeb0aab4b
3
+ size 1879081896
model-00010-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a4da81c5fb72d955350c4702c0f6f5f31a6903feccc00d0999560fda1012676
3
+ size 1879065656
model-00011-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b5d3f46cd504572fca62ec960adade4d7f9f0663ccf87527e76646a9c6a0139
3
+ size 1879082152
model-00012-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed723de14eacd841fb27527ffeddac58cd41e04a1d0d4e9406822165bfd7945
3
+ size 1610630200
model-00013-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0bbf6dbfb817c36d5161f3bb1c2ef12fb58e397b5b9ff8efbf2ae0b15280c88
3
+ size 1744864312
model-00014-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c73b98095d58341ec1a463dad09a2eb7f0bffc7ceb04f3b88b14105b52dffdf9
3
+ size 1879115144
model-00015-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f0e72a42be44b636d073567d86775514b7144c1c4cbcd6a0a6417a49c29e612
3
+ size 1879065664
model-00016-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3f822f03e2c9be0dc4b450bd18bebedab6356dc7d7d2896361e4874ed71ba16
3
+ size 1879082160
model-00017-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:456801ddd7d3a0d0904e0f9facf6301b6d21881691f03dd5c46122a9fdc40bc3
3
+ size 1610662944
model-00018-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4de87aeaeccc7350a6196e1d4a003d587538734318b2d957dcb66c0f9675cc3
3
+ size 1744864312
model-00019-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3821233823a0a8dadd2ecf3c6e292802653d5974e0720540f6e638f12f82744
3
+ size 1744864312
model-00020-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89b6e53e939ff3c3167f4a0579364dadb2043c046df6a26f6bc4ad1a122875bd
3
+ size 1610646216
model-00021-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47d4845f3f34c503f14a327cf8dd2de1b9cfdf69d3b77277356594e8c73afadd
3
+ size 1744864312
model-00022-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2da51f9ae3eae4028fd12ce3714e98a8d98d76707a9d4511748d59b7375ada3
3
+ size 1744864312
model-00023-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36cb3ddfc41ec7c2022bd60f7f6e045dc0503f62959647299920e2971fa1fde9
3
+ size 1879082144
model-00024-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c315034611cf7e0edfb2fb65d1a8fb5087552c0e60e6ecfb814026a2838a20bd
3
+ size 1879082152
model-00025-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c76f96266ee13b843b91084c935a935e8d77ac5a0cb3278c46f5d3ec72a2f37
3
+ size 1744864304
model-00026-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:423a2e424c479976e3a862e684bc0f82127b015d71e11e30b00c964ce4029d5b
3
+ size 1744831312
model-00027-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae121d73df2cad4057ee0e44a8fcb4938d4c92be0e4c0a2a571bdd30af6f72a
3
+ size 1744864312
model-00028-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20b84c3134ed316aa81308bd291af244f6b53904557f0cb9591bdf210e08b440
3
+ size 1879115384
model-00029-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5330afce9065b0380e1b5e14f1ff02e0f16bcba21a6416be8dad077984853b5
3
+ size 1744864304
model-00030-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f04df0219207c9ed395fd2f4f6283ec8b7023944d52159510fd3dee1bd221938
3
+ size 1744864304
model-00031-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d15ebf1489cc3594ed7e4f80b4b5d0ea89c1574c3ce7f92a5820d38598e76bdd
3
+ size 1879081912
model-00032-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f63eb3780cd0740ec1585ae836018a8731f2ba54ea9ea914a5424ffe131de8ec
3
+ size 1744864312
model-00033-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2df405a3a5bfea83001cd54db2573a1610de3335b6f696dd38a2ada17be1aca4
3
+ size 1744864312
model-00034-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b465295db14e645fe7c2a43f1a129964797b9ef0d1f3c3c1df970d9c576821d2
3
+ size 1879098416
model-00035-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad61aa98cf99902fcd255a4f6553f04fda5795b25d404c104d4859f8b621bd08
3
+ size 1879082160
model-00036-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e93a85a5ad272acdb10b14f46096ead98e342d838aca8fcdf4dacc03ff51002
3
+ size 1610662952
model-00037-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82f3751472212ddd67ebeae7340bb546eb5125c66a4b5f76307a28e7f21c65c9
3
+ size 1744831312
model-00038-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab36745bb6e06b60ab65ead009f66acc47e9c080010cdb4e9efc0663da3ceb7b
3
+ size 1744864312
model-00039-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7c0afdbf59b15dc412cca6cd76d579b1a19e101df5c025e1069dc816b92558c
3
+ size 1879082144
model-00040-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75206caa7a632d535e15871654a5c579bd385e0d534466578a53419b7387cf4f
3
+ size 1879065664
model-00041-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bcc6e409cbda48126c43cca861dd2b0fdbf6bb304150f16a8694591bdc55a4a
3
+ size 1879082160
model-00042-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72b1163ac7d9f71ff3057f7d152f58932df85687d975f388a2b1f55ff775a653
3
+ size 1879098640
model-00043-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df5504c6ea45c53a32711750f9caba3dd3801b30624884e2f4f856a2aaa3226a
3
+ size 1744864312
model-00044-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9cb1e5ff93a598e9f354d4d54af797899fed000b1762990c5309934035600c8
3
+ size 1879115144
model-00045-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:067ded147fab7f3fee24fe43a1077e16dd9a4dac457689456cb99da96c6a6d8d
3
+ size 1879082152