paloalma committed on
Commit
aa4d908
1 Parent(s): cd4932b

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +17 -0
  2. config.json +30 -0
  3. mergekit_config.yml +30 -0
  4. merges.txt +0 -0
  5. model-00001-of-00082.safetensors +3 -0
  6. model-00002-of-00082.safetensors +3 -0
  7. model-00003-of-00082.safetensors +3 -0
  8. model-00004-of-00082.safetensors +3 -0
  9. model-00005-of-00082.safetensors +3 -0
  10. model-00006-of-00082.safetensors +3 -0
  11. model-00007-of-00082.safetensors +3 -0
  12. model-00008-of-00082.safetensors +3 -0
  13. model-00009-of-00082.safetensors +3 -0
  14. model-00010-of-00082.safetensors +3 -0
  15. model-00011-of-00082.safetensors +3 -0
  16. model-00012-of-00082.safetensors +3 -0
  17. model-00013-of-00082.safetensors +3 -0
  18. model-00014-of-00082.safetensors +3 -0
  19. model-00015-of-00082.safetensors +3 -0
  20. model-00016-of-00082.safetensors +3 -0
  21. model-00017-of-00082.safetensors +3 -0
  22. model-00018-of-00082.safetensors +3 -0
  23. model-00019-of-00082.safetensors +3 -0
  24. model-00020-of-00082.safetensors +3 -0
  25. model-00021-of-00082.safetensors +3 -0
  26. model-00022-of-00082.safetensors +3 -0
  27. model-00023-of-00082.safetensors +3 -0
  28. model-00024-of-00082.safetensors +3 -0
  29. model-00025-of-00082.safetensors +3 -0
  30. model-00026-of-00082.safetensors +3 -0
  31. model-00027-of-00082.safetensors +3 -0
  32. model-00028-of-00082.safetensors +3 -0
  33. model-00029-of-00082.safetensors +3 -0
  34. model-00030-of-00082.safetensors +3 -0
  35. model-00031-of-00082.safetensors +3 -0
  36. model-00032-of-00082.safetensors +3 -0
  37. model-00033-of-00082.safetensors +3 -0
  38. model-00034-of-00082.safetensors +3 -0
  39. model-00035-of-00082.safetensors +3 -0
  40. model-00036-of-00082.safetensors +3 -0
  41. model-00037-of-00082.safetensors +3 -0
  42. model-00038-of-00082.safetensors +3 -0
  43. model-00039-of-00082.safetensors +3 -0
  44. model-00040-of-00082.safetensors +3 -0
  45. model-00041-of-00082.safetensors +3 -0
  46. model-00042-of-00082.safetensors +3 -0
  47. model-00043-of-00082.safetensors +3 -0
  48. model-00044-of-00082.safetensors +3 -0
  49. model-00045-of-00082.safetensors +3 -0
  50. model-00046-of-00082.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - abacusai/Smaug-72B-v0.1
8
+ - MTSAIR/MultiVerse_70B
9
+ ---
10
+
11
+ # TW3-JRGL-v1
12
+
13
+ TW3-JRGL-v1 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [abacusai/Smaug-72B-v0.1](https://huggingface.co/abacusai/Smaug-72B-v0.1)
15
+ * [MTSAIR/MultiVerse_70B](https://huggingface.co/MTSAIR/MultiVerse_70B)
16
+
17
+ ## 🧩 Configuration
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "abacusai/Smaug-72B-v0.1",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": true,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 151643,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 64,
19
+ "pad_token_id": 151643,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": null,
23
+ "rope_theta": 1000000,
24
+ "seq_length": 32768,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.39.2",
28
+ "use_cache": true,
29
+ "vocab_size": 152064
30
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: abacusai/Smaug-72B-v0.1
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+ t:
6
+ - filter: self_attn
7
+ value:
8
+ - 0
9
+ - 0.5
10
+ - 0.3
11
+ - 0.7
12
+ - 1
13
+ - filter: mlp
14
+ value:
15
+ - 1
16
+ - 0.5
17
+ - 0.7
18
+ - 0.3
19
+ - 0
20
+ - value: 0.5
21
+ slices:
22
+ - sources:
23
+ - layer_range:
24
+ - 0
25
+ - 80
26
+ model: abacusai/Smaug-72B-v0.1
27
+ - layer_range:
28
+ - 0
29
+ - 80
30
+ model: MTSAIR/MultiVerse_70B
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d9e0ac565b7fc015dd84bd6253ba51f634e7a60c775f8957f672370c1843777
3
+ size 1879164616
model-00002-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa8ace3badd36c9671d98e11ffef705dc2195083c6978d3b68584a582d959e5
3
+ size 402703024
model-00003-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d48975c6f125467e8fe47430e4d51409a2e89e3f6b4ca527bb0f26ef297ea9c9
3
+ size 2491416720
model-00004-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e30e7f284e1bdf4bde90f88c68eccb2cc809680feb68df7fa543f4f9f5cc144
3
+ size 1879164616
model-00005-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:918bed83eecf13651e4267e65a60835b423ba226ba7c9cf9b1421ff07e9d89bf
3
+ size 1879164608
model-00006-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fe37ca317a0b2bb3615abfa9727aa003a70793098b476c89ceba1cf95517b17
3
+ size 1610646216
model-00007-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3201095441f142d1310be71966d7faf09e82396c0cdabaaec867c91d291acca
3
+ size 1744930280
model-00008-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee72f9b56ee6b3d4aad3c1b0739d034c6923d9eafe4598ec61bf083a399b3284
3
+ size 1744930280
model-00009-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23a4be6cd47a71e967bfdc9c55eb37f7bcd1078292120cdc4b8ef58bc44c5728
3
+ size 1879131376
model-00010-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42aa62ad81f8e3b84070f18ee9124d535c01379722319588e93b0eceb3088fb8
3
+ size 1879148128
model-00011-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99f9b0ea71993972967ec014fc239601f38c13e619a9c279c628f92b2a40f208
3
+ size 1879164616
model-00012-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e57ca3666c41b1df9aa36d05ea691feafdc7719ada82806c2d32896e56937b81
3
+ size 1610712664
model-00013-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5e592aa394ea939818c82eac70c975bc5fe36be14e9be08e5a6ea4c66308094
3
+ size 1744930288
model-00014-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32d5cc1a8fb9ad31b7e502a2a9432f9caf4e5b8700bec6ce57dc60a19a82a230
3
+ size 1879214112
model-00015-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78f96c160afba0c525e2b41105f6448b727cff1e918897735dca4dabc72dbe33
3
+ size 1879148136
model-00016-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61aa1fd874c2347d657b911d939da9c13d858c91d1ba35026e7d0b56d5126180
3
+ size 1879164632
model-00017-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:677b2d38f523c5edddea90291cf10fda98688c892f4cc79e3bd4eb33c7bb29b3
3
+ size 1610695936
model-00018-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5250aeaba1118087c60336e7efe9bf30a1cee521cd86ca7d39ba6683c803610
3
+ size 1744930288
model-00019-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5826e287256faf958a8b542d57450727d480b5631975c7cbe69b3171697a6226
3
+ size 1744930288
model-00020-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8993d45d2a554c8575583c4f5969b30520ab496afb0cb6e1e8b264b9181b6079
3
+ size 1610646216
model-00021-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc3e62d3ec88d6bceaeaee0e6903464fac79ef29c1f0fa7339969245dcc6220d
3
+ size 1744930288
model-00022-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f553b2989f9b60f62332eaa65d709d7dc67d7c79a873a7798ef4b4086ee6850
3
+ size 1744930288
model-00023-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bea186a14220caf882353aa44f66d137a311ffb8704b5ec93e353854386dd2f
3
+ size 1879181112
model-00024-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7601b94dbaf325d7ad5a3e9ed7e99ffdb026bfcff718a340f71fc1401b7a734b
3
+ size 1879148128
model-00025-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f3d3e02f5cb05680736e719e08d1bd0001c069a8902f6d011d377a0fabb5228
3
+ size 1744930280
model-00026-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:929270edef9fffb446f74b1022cb605a8d2398ea8f180ce03660b1edee797fd5
3
+ size 1744897296
model-00027-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1e478f6c44952cc88c23a653482be3a9fd6c5c04c1936e147cdf319e781ccbf
3
+ size 1744930288
model-00028-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c14a9bce2472c01727e23f0c616db8c1424727a62e0022824c31420b79388576
3
+ size 1879247336
model-00029-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dd103cd75191c58a2b0a4694353906d6e06582faee108a7f5c1814013e9434c
3
+ size 1744930280
model-00030-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ada0d9460bd45e4e3be720708ed75cf66b3250fc5ce2abe9f71e6178982edc98
3
+ size 1744930280
model-00031-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:511241485b6b7323cb90d6621360394d1f7e5265102a57a61691987d15e2900c
3
+ size 1879114896
model-00032-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154e0ba71abf725a142d46ec31a603df6d86a132d9fe96cb1a4761a058f074fb
3
+ size 1744930288
model-00033-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8603e947169683224d3b2a005ec3e9f32ce0efd5b2a86254dac66148e5cbbb3
3
+ size 1744930288
model-00034-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4338371cfafc69036c651599b2186c4335350188a22a80983c1b097a732700b6
3
+ size 1879147896
model-00035-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9950b8dab81b131a5208edeb49599287389fe44b98f104ba9f3e093cbdc83c44
3
+ size 1879164632
model-00036-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2d3df0f947a446b9ba25b1a9b7363e1597e803ecd014298e00db820632e3c2
3
+ size 1610695944
model-00037-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9276aae55f179f1ad8f278647bfde0fb51004920b815e6f9ed38aa22fea7e732
3
+ size 1744897296
model-00038-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7eecd2c4fa32ae5f8888b6265c360694f1fe15c920fd0f03288c5ecae5ace32b
3
+ size 1744930288
model-00039-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f6f05e7f5521e468c27eef4e5a26dd66096d66224f6f42d5d7360a7c4543899
3
+ size 1879181112
model-00040-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b9d403f58c52ce49b88e7a4ea5eda66d2ffe3108312fc356129c8ecb9c4969b
3
+ size 1879148136
model-00041-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87fd867e36b92e5d466725f35a4d51c3321f9686d53074aed1d408add0d6f7cd
3
+ size 1879164632
model-00042-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89dedab3aca8fb431997172218a3c6b5b65d3abb699a8f116a2e1e257e721fe2
3
+ size 1879164624
model-00043-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31205b520bfd03436f41929208365acfeb6c46d12594817ec6d4fa274f102c1a
3
+ size 1744930288
model-00044-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c33a8aad42b3b74c5e467e7e163123d51185190a4360614e95acd16862e6e79
3
+ size 1879214112
model-00045-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60335a84fe167c4e086c0ede093ed6e98fd9e0e1b2ac0fd7f9c5d5b5036621f4
3
+ size 1879148128
model-00046-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53a21b49dafd9ae53b552b9012ad5d612d1c9841d4c16a2abd772cb20ece3ac1
3
+ size 1744930280