MatthieuJ committed on
Commit
8da87c8
1 Parent(s): d185ac1

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +17 -0
  2. config.json +30 -0
  3. mergekit_config.yml +30 -0
  4. merges.txt +0 -0
  5. model-00001-of-00082.safetensors +3 -0
  6. model-00002-of-00082.safetensors +3 -0
  7. model-00003-of-00082.safetensors +3 -0
  8. model-00004-of-00082.safetensors +3 -0
  9. model-00005-of-00082.safetensors +3 -0
  10. model-00006-of-00082.safetensors +3 -0
  11. model-00007-of-00082.safetensors +3 -0
  12. model-00008-of-00082.safetensors +3 -0
  13. model-00009-of-00082.safetensors +3 -0
  14. model-00010-of-00082.safetensors +3 -0
  15. model-00011-of-00082.safetensors +3 -0
  16. model-00012-of-00082.safetensors +3 -0
  17. model-00013-of-00082.safetensors +3 -0
  18. model-00014-of-00082.safetensors +3 -0
  19. model-00015-of-00082.safetensors +3 -0
  20. model-00016-of-00082.safetensors +3 -0
  21. model-00017-of-00082.safetensors +3 -0
  22. model-00018-of-00082.safetensors +3 -0
  23. model-00019-of-00082.safetensors +3 -0
  24. model-00020-of-00082.safetensors +3 -0
  25. model-00021-of-00082.safetensors +3 -0
  26. model-00022-of-00082.safetensors +3 -0
  27. model-00023-of-00082.safetensors +3 -0
  28. model-00024-of-00082.safetensors +3 -0
  29. model-00025-of-00082.safetensors +3 -0
  30. model-00026-of-00082.safetensors +3 -0
  31. model-00027-of-00082.safetensors +3 -0
  32. model-00028-of-00082.safetensors +3 -0
  33. model-00029-of-00082.safetensors +3 -0
  34. model-00030-of-00082.safetensors +3 -0
  35. model-00031-of-00082.safetensors +3 -0
  36. model-00032-of-00082.safetensors +3 -0
  37. model-00033-of-00082.safetensors +3 -0
  38. model-00034-of-00082.safetensors +3 -0
  39. model-00035-of-00082.safetensors +3 -0
  40. model-00036-of-00082.safetensors +3 -0
  41. model-00037-of-00082.safetensors +3 -0
  42. model-00038-of-00082.safetensors +3 -0
  43. model-00039-of-00082.safetensors +3 -0
  44. model-00040-of-00082.safetensors +3 -0
  45. model-00041-of-00082.safetensors +3 -0
  46. model-00042-of-00082.safetensors +3 -0
  47. model-00043-of-00082.safetensors +3 -0
  48. model-00044-of-00082.safetensors +3 -0
  49. model-00045-of-00082.safetensors +3 -0
  50. model-00046-of-00082.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - davidkim205/Rhea-72b-v0.5
8
+ - abacusai/Smaug-72B-v0.1
9
+ ---
10
+
11
+ # ECE-TW3-JRGL-V5
12
+
13
+ ECE-TW3-JRGL-V5 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
15
+ * [abacusai/Smaug-72B-v0.1](https://huggingface.co/abacusai/Smaug-72B-v0.1)
16
+
17
+ ## 🧩 Configuration
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "davidkim205/Rhea-72b-v0.5",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": true,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 151643,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 64,
19
+ "pad_token_id": 151643,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": null,
23
+ "rope_theta": 1000000,
24
+ "seq_length": 32768,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.39.3",
28
+ "use_cache": true,
29
+ "vocab_size": 152064
30
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: davidkim205/Rhea-72b-v0.5
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+ t:
6
+ - filter: self_attn
7
+ value:
8
+ - 0
9
+ - 0.5
10
+ - 0.3
11
+ - 0.7
12
+ - 1
13
+ - filter: mlp
14
+ value:
15
+ - 1
16
+ - 0.5
17
+ - 0.7
18
+ - 0.3
19
+ - 0
20
+ - value: 0.5
21
+ slices:
22
+ - sources:
23
+ - layer_range:
24
+ - 0
25
+ - 80
26
+ model: davidkim205/Rhea-72b-v0.5
27
+ - layer_range:
28
+ - 0
29
+ - 80
30
+ model: abacusai/Smaug-72B-v0.1
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11fad8ed89c2bfc7939a6d964c1a54efb3b420decac9896e49d6c89cc1e4c173
3
+ size 1879065656
model-00002-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4508120286cb5db852c8b6aa54290b1ac55db2fa5c4ba5e54ccae0782bf64c1b
3
+ size 402670048
model-00003-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fa1a10feeab788c76005956249f06f5be60675a35069fdde009ceea4e5574ae
3
+ size 2491416720
model-00004-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d88e6305c898738eb4ed7e9e0942305c103aa42de2184dbbd1817b2e8122515c
3
+ size 1879065656
model-00005-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:806b125b7affd60509820def010e87ae9c0e8a04254f2e852b943cb09fc9c3a8
3
+ size 1879098632
model-00006-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c54d21b47d6108c6856a402f32b07e96cdcf39a3f6ce5e3763d545318af45c3e
3
+ size 1610646216
model-00007-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a23ea0c23a212e8826f520fc3cb17fe7728c61fc695ba94220b531f9ba517854
3
+ size 1744864304
model-00008-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eb3c765f55c4c3cc3911ef3145e839e7da29d6bf7328d3325181ef14f431c1c
3
+ size 1744864304
model-00009-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5805aabdbfbd99ba40c92529c687e3d7ae3278f1708453f8acc13d691bcd69b4
3
+ size 1879081896
model-00010-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba9469d665b8e41f008c56e76f123d20d3b2fc94bbc0ed5954b02e16fc4391c6
3
+ size 1879065656
model-00011-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dc62e2a40ed15398df42acf7f093984244751dd0f8ae9f2acd1032b75d523fb
3
+ size 1879082152
model-00012-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d91ff97e66728c0ed6eeb57db771717a8ed04ae161428fbc317e5cb970371613
3
+ size 1610630200
model-00013-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8801fd14f9de87788be0ca2d6f6b88603fd9dc1485d4e4c77f09f6489cfc05ff
3
+ size 1744864312
model-00014-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88d621f86b511e5bc493bc700649aba0a8fe92e9cc355d18c8a574b57e9f0656
3
+ size 1879115144
model-00015-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8652adfb164f3b7c92ac8df15fec6ef88f7479d68ee457b3318a04814dbd4f27
3
+ size 1879065664
model-00016-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a245f2529212cba0dff28d53e2d6342a39943e542ef2115b251586a7592dd3a
3
+ size 1879082160
model-00017-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2473ffdc61b18a62bdded09bff617faacf33b9e1af86fa1805cc401e77ad248c
3
+ size 1610662944
model-00018-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:139520f6cf82173ae7aebdd0d01f0cb157bcbbacaf99cd46a736425cb3907edf
3
+ size 1744864312
model-00019-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45a4db0db3e5c10e491279e01b203eef435897fbf28f4c2be01f80fa198e5088
3
+ size 1744864312
model-00020-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f772dd83cef6c1915a67133b4aae75b9bc52e093c7cded9b09a4e2f13b57f90
3
+ size 1610646216
model-00021-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba33189ec1aa83c2258b4ecac853c0acec9f3df21ca8efd74803734c18a93f37
3
+ size 1744864312
model-00022-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4987ef1bab081bc4109da67fe4c035ad4d6aff14a0c7b10d12c7998e44751a0
3
+ size 1744864312
model-00023-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:863b0eb8c18e58fd84a1e45c7fcb9c18f77bc33792a7c034755da05357d42c06
3
+ size 1879082144
model-00024-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b77e6a742dcca08403c12db8a971f6f6014a01f89bb87376b718590ea31e4f04
3
+ size 1879082152
model-00025-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b58520e8ab5e6bf697387d15f232817d7eba29bb1216b3a58f5b55e9da91274
3
+ size 1744864304
model-00026-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c4655508ee7c7062b7a31c0d9279dfab00fa251464434578538eabf93446449
3
+ size 1744831312
model-00027-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9116577c68af520155de3b422b1460424ee0f9f289f053a57bb9a1cab030f467
3
+ size 1744864312
model-00028-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebb9a654fe4132a2f05937fd4c239c1c1e7c0d3ece27623263014bc511e90dbd
3
+ size 1879115384
model-00029-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a84794711ee8cae477a833a1dbfe4a97a076cf8016c53f471843769bd63febfe
3
+ size 1744864304
model-00030-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0cc0f59cb346addf0d447e789f1a95606f1e6a7477a75c6ec99c3531958dd63
3
+ size 1744864304
model-00031-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:203a9d0a752cf7868532ef2f0bbc045964bf950d1f687503050b21953b845ccc
3
+ size 1879081912
model-00032-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21277c586468a4dc1edccb8e3b969127bf3e0e9000a3f8d860a7e049e5affe55
3
+ size 1744864312
model-00033-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ecd438613792b1b72ca19bb4df4775396d025fa16b4aca36ea3c53dfaac1f65
3
+ size 1744864312
model-00034-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ad0a1f37f791ebdd722b42db18f4dd62d685e684bd6636a1665b53409a9902c
3
+ size 1879098416
model-00035-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:319035b3b1f024661e67a0eb416a76cab3d909b9c1f2f88834685e275576a7fb
3
+ size 1879082160
model-00036-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e41f1579001fbdbf1e47853c76ef9aa2a5abd65c0467dbeb11032e6e2131ce6a
3
+ size 1610662952
model-00037-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75e06b2a2aa85f763253c69c71ae01fdc8d0d8b9b4558a9a86c42419d50a39fe
3
+ size 1744831312
model-00038-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26e0279032fd3743156c936463cfcbf63b9bb745bf96992efcfcc2bc48c203cf
3
+ size 1744864312
model-00039-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:645659b2c32bad7dba8efb139b2cc7ce4d58a15f2fcf287c513f991cef5fa1f4
3
+ size 1879082144
model-00040-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb8b5d5498ae63cc29b17c9bc71f46ed8e0894765a8d57ba968bd01966996357
3
+ size 1879065664
model-00041-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9c613966431dc0f62e12bb15595de990f61fa1be317780ae6989467de3305e7
3
+ size 1879082160
model-00042-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51f2aa339e91ae14f8966ab9cec2560d995887f2f2af8a5eac9ad74f5be42272
3
+ size 1879098640
model-00043-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1d6987ec1773bad3d5860178cba3d39daf1b42b9e1da5af93a2784ce7b6f093
3
+ size 1744864312
model-00044-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e77cd02a226accd3715729f9ee5444d5b68e0845541b3ea0c1e385fabfe103d
3
+ size 1879115144
model-00045-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b55295d816a2076382bf058671dc5c96b94f78c4835d541436e441a02c05b30
3
+ size 1879082152
model-00046-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae1fe66737b4863d8e96fa3a030975b7bc6a3275b4f0cff85c98605fcdf26772
3
+ size 1744864304