Upload folder using huggingface_hub

Browse files

Files changed (7)

README.md +31 -35
config.json +2 -2
mergekit_config.yml +13 -31
model-00001-of-00004.safetensors +2 -2
model-00002-of-00004.safetensors +2 -2
model-00003-of-00004.safetensors +2 -2
model-00004-of-00004.safetensors +2 -2

README.md CHANGED Viewed

@@ -1,8 +1,16 @@
 ---
 base_model:
-- MrRobotoAI/MrRoboto-ProLong-8b-v2e
 - MrRobotoAI/MrRoboto-ProLong-8b-v2g
-- MrRobotoAI/MrRoboto-ProLong-8b-v1n
 library_name: transformers
 tags:
 - mergekit
@@ -16,51 +24,39 @@ This is a merge of pre-trained language models created using [mergekit](https://
 ## Merge Details
 ### Merge Method
-This model was merged using the linear [DARE](https://arxiv.org/abs/2311.03099) merge method using [MrRobotoAI/MrRoboto-ProLong-8b-v1n](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v1n) as a base.
 ### Models Merged
 The following models were included in the merge:
-* [MrRobotoAI/MrRoboto-ProLong-8b-v2e](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2e)
 * [MrRobotoAI/MrRoboto-ProLong-8b-v2g](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2g)
 ### Configuration
 The following YAML configuration was used to produce this model:
 ```yaml
-merge_method: dare_linear
 models:
-  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2e
-    parameters:
-      weight:
-        - filter: v_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: o_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: up_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: gate_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: down_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - value: 1
   - model: MrRobotoAI/MrRoboto-ProLong-8b-v2g
-    parameters:
-      weight:
-        - filter: v_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: o_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: up_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: gate_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: down_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - value: 0
-base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
-tokenizer_source: base
-dtype: bfloat16
 ```

 ---
 base_model:
+- akjindal53244/Llama-3.1-Storm-8B
+- nothingiisreal/L3-8B-Stheno-Horny-v3.3-32K
+- Blackroot/Llama-3-LongStory-LORA
+- cgato/L3-TheSpice-8b-v0.8.3
+- Blackroot/Llama-3-8B-Abomination-LORA
+- DeepAutoAI/ldm_soup_Llama-3.1-8B-Inst
+- MrRobotoAI/MrRoboto-ProLong-8b-v2l
+- v000000/L3.1-Sthenorm-8B
+- OpenBuddy/openbuddy-llama3.1-8b-v22.2-131k
 - MrRobotoAI/MrRoboto-ProLong-8b-v2g
+- MrRobotoAI/Thor-v1.4-8b-DARK-FICTION
 library_name: transformers
 tags:
 - mergekit
 ## Merge Details
 ### Merge Method
+This model was merged using the [Model Stock](https://arxiv.org/abs/2403.19522) merge method using [MrRobotoAI/MrRoboto-ProLong-8b-v2l](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2l) as a base.
 ### Models Merged
 The following models were included in the merge:
+* [akjindal53244/Llama-3.1-Storm-8B](https://huggingface.co/akjindal53244/Llama-3.1-Storm-8B)
+* [nothingiisreal/L3-8B-Stheno-Horny-v3.3-32K](https://huggingface.co/nothingiisreal/L3-8B-Stheno-Horny-v3.3-32K) + [Blackroot/Llama-3-LongStory-LORA](https://huggingface.co/Blackroot/Llama-3-LongStory-LORA)
+* [cgato/L3-TheSpice-8b-v0.8.3](https://huggingface.co/cgato/L3-TheSpice-8b-v0.8.3) + [Blackroot/Llama-3-8B-Abomination-LORA](https://huggingface.co/Blackroot/Llama-3-8B-Abomination-LORA)
+* [DeepAutoAI/ldm_soup_Llama-3.1-8B-Inst](https://huggingface.co/DeepAutoAI/ldm_soup_Llama-3.1-8B-Inst)
+* [v000000/L3.1-Sthenorm-8B](https://huggingface.co/v000000/L3.1-Sthenorm-8B)
+* [OpenBuddy/openbuddy-llama3.1-8b-v22.2-131k](https://huggingface.co/OpenBuddy/openbuddy-llama3.1-8b-v22.2-131k)
 * [MrRobotoAI/MrRoboto-ProLong-8b-v2g](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2g)
+* [MrRobotoAI/Thor-v1.4-8b-DARK-FICTION](https://huggingface.co/MrRobotoAI/Thor-v1.4-8b-DARK-FICTION)
 ### Configuration
 The following YAML configuration was used to produce this model:
 ```yaml
 models:
+  - model: OpenBuddy/openbuddy-llama3.1-8b-v22.2-131k
+  - model: akjindal53244/Llama-3.1-Storm-8B
+  - model: v000000/L3.1-Sthenorm-8B
+  - model: DeepAutoAI/ldm_soup_Llama-3.1-8B-Inst
+  - model: cgato/L3-TheSpice-8b-v0.8.3+Blackroot/Llama-3-8B-Abomination-LORA
   - model: MrRobotoAI/MrRoboto-ProLong-8b-v2g
+  - model: nothingiisreal/L3-8B-Stheno-Horny-v3.3-32K+Blackroot/Llama-3-LongStory-LORA
+  - model: MrRobotoAI/Thor-v1.4-8b-DARK-FICTION
+merge_method: model_stock
+base_model: MrRobotoAI/MrRoboto-ProLong-8b-v2l
+normalize: true
+dtype: float16
 ```

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "MrRobotoAI/MrRoboto-ProLong-8b-v1n",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -23,7 +23,7 @@
   "rope_scaling": null,
   "rope_theta": 2804339835.0,
   "tie_word_embeddings": false,
-  "torch_dtype": "bfloat16",
   "transformers_version": "4.46.2",
   "use_cache": true,
   "vocab_size": 128256

 {
+  "_name_or_path": "MrRobotoAI/MrRoboto-ProLong-8b-v2l",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "rope_scaling": null,
   "rope_theta": 2804339835.0,
   "tie_word_embeddings": false,
+  "torch_dtype": "float16",
   "transformers_version": "4.46.2",
   "use_cache": true,
   "vocab_size": 128256

mergekit_config.yml CHANGED Viewed

@@ -1,33 +1,15 @@
-merge_method: dare_linear
 models:
-  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2e
-    parameters:
-      weight:
-        - filter: v_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: o_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: up_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: gate_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - filter: down_proj
-          value: [0.2, 0.2, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.45, 0.2, 0.2]
-        - value: 1
   - model: MrRobotoAI/MrRoboto-ProLong-8b-v2g
-    parameters:
-      weight:
-        - filter: v_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: o_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: up_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: gate_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - filter: down_proj
-          value: [0.8, 0.8, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.55, 0.8, 0.8]
-        - value: 0
-base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
-tokenizer_source: base
-dtype: bfloat16

 models:
+  - model: OpenBuddy/openbuddy-llama3.1-8b-v22.2-131k
+  - model: akjindal53244/Llama-3.1-Storm-8B
+  - model: v000000/L3.1-Sthenorm-8B
+  - model: DeepAutoAI/ldm_soup_Llama-3.1-8B-Inst
+  - model: cgato/L3-TheSpice-8b-v0.8.3+Blackroot/Llama-3-8B-Abomination-LORA
   - model: MrRobotoAI/MrRoboto-ProLong-8b-v2g
+  - model: nothingiisreal/L3-8B-Stheno-Horny-v3.3-32K+Blackroot/Llama-3-LongStory-LORA
+  - model: MrRobotoAI/Thor-v1.4-8b-DARK-FICTION
+merge_method: model_stock
+base_model: MrRobotoAI/MrRoboto-ProLong-8b-v2l
+normalize: true
+dtype: float16

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b49c7786a0438d8c75dd2db6a3b2b9db6038dd74463cc8a0e37da2c9cfc21981
-size 4953586384

 version https://git-lfs.github.com/spec/v1
+oid sha256:87cb93d68ff5e647e19bad5adf052d3700396a4d29917583b2f36b9173011e96
+size 4953586328

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:184dab4aa343b306cf17aedeec57adae78ead74c436d134ef72046387fed606c
-size 4999819336

 version https://git-lfs.github.com/spec/v1
+oid sha256:d428e29c0d524c6e7dcf960f6eec01201748bd092bdf32e61d63486841e0b2f6
+size 4999819232

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd10bf731074047bc67a435eeef404d1c8dd99a832c1d0e4fd3ce43a8669029c
-size 4915916144

 version https://git-lfs.github.com/spec/v1
+oid sha256:c0e6e0ff38e4cbb18530d3f585fd2f4aedd6a16da7a2f071634dc888ebee2ca0
+size 4915916048

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0bf4d79d52512f7cda4779f4ff0ac40fd6e3d9f9e3815534dd10ee181febbe99
-size 1191234472

 version https://git-lfs.github.com/spec/v1
+oid sha256:f7a93c6812ac2d967509bb31248b0145eacf0d4adc4eead3b6dd5fe7eec09675
+size 1191234448