MrRobotoAI
committed on
Commit
•
34d8512
1
Parent(s):
8771b08
Upload folder using huggingface_hub
Browse files
- README.md +12 -1
- mergekit_config.yml +5 -1
- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
README.md
CHANGED
@@ -1,8 +1,12 @@
|
|
1 |
---
|
2 |
base_model:
|
3 |
-
- MrRobotoAI/MrRoboto-ProLong-8b-v1p
|
4 |
- MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
|
|
5 |
- MrRobotoAI/MrRoboto-ProLong-8b-v2a
|
|
|
|
|
|
|
|
|
6 |
library_name: transformers
|
7 |
tags:
|
8 |
- mergekit
|
@@ -23,6 +27,8 @@ This model was merged using the [Model Stock](https://arxiv.org/abs/2403.19522)
|
|
23 |
The following models were included in the merge:
|
24 |
* [MrRobotoAI/MrRoboto-ProLong-8b-v1p](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v1p)
|
25 |
* [MrRobotoAI/MrRoboto-ProLong-8b-v2a](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2a)
|
|
|
|
|
26 |
|
27 |
### Configuration
|
28 |
|
@@ -31,9 +37,14 @@ The following YAML configuration was used to produce this model:
|
|
31 |
```yaml
|
32 |
models:
|
33 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v1p
|
|
|
|
|
34 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v2a
|
|
|
|
|
35 |
merge_method: model_stock
|
36 |
base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
37 |
normalize: true
|
38 |
dtype: float16
|
|
|
39 |
```
|
|
|
1 |
---
|
2 |
base_model:
|
|
|
3 |
- MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
4 |
+
- MrRobotoAI/MrRoboto-ProLong-8b-v1p
|
5 |
- MrRobotoAI/MrRoboto-ProLong-8b-v2a
|
6 |
+
- princeton-nlp/Llama-3-8B-ProLong-512k-Instruct
|
7 |
+
- ResplendentAI/NoWarning_Llama3
|
8 |
+
- princeton-nlp/Llama-3-8B-ProLong-512k-Base
|
9 |
+
- ResplendentAI/NoWarning_Llama3
|
10 |
library_name: transformers
|
11 |
tags:
|
12 |
- mergekit
|
|
|
27 |
The following models were included in the merge:
|
28 |
* [MrRobotoAI/MrRoboto-ProLong-8b-v1p](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v1p)
|
29 |
* [MrRobotoAI/MrRoboto-ProLong-8b-v2a](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2a)
|
30 |
+
* [princeton-nlp/Llama-3-8B-ProLong-512k-Instruct](https://huggingface.co/princeton-nlp/Llama-3-8B-ProLong-512k-Instruct) + [ResplendentAI/NoWarning_Llama3](https://huggingface.co/ResplendentAI/NoWarning_Llama3)
|
31 |
+
* [princeton-nlp/Llama-3-8B-ProLong-512k-Base](https://huggingface.co/princeton-nlp/Llama-3-8B-ProLong-512k-Base) + [ResplendentAI/NoWarning_Llama3](https://huggingface.co/ResplendentAI/NoWarning_Llama3)
|
32 |
|
33 |
### Configuration
|
34 |
|
|
|
37 |
```yaml
|
38 |
models:
|
39 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v1p
|
40 |
+
- model: princeton-nlp/Llama-3-8B-ProLong-512k-Instruct+ResplendentAI/NoWarning_Llama3
|
41 |
+
- model: princeton-nlp/Llama-3-8B-ProLong-512k-Base+ResplendentAI/NoWarning_Llama3
|
42 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v2a
|
43 |
+
- model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
44 |
+
|
45 |
merge_method: model_stock
|
46 |
base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
47 |
normalize: true
|
48 |
dtype: float16
|
49 |
+
|
50 |
```
|
mergekit_config.yml
CHANGED
@@ -1,7 +1,11 @@
|
|
1 |
models:
|
2 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v1p
|
|
|
|
|
3 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v2a
|
|
|
|
|
4 |
merge_method: model_stock
|
5 |
base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
6 |
normalize: true
|
7 |
-
dtype: float16
|
|
|
1 |
models:
|
2 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v1p
|
3 |
+
- model: princeton-nlp/Llama-3-8B-ProLong-512k-Instruct+ResplendentAI/NoWarning_Llama3
|
4 |
+
- model: princeton-nlp/Llama-3-8B-ProLong-512k-Base+ResplendentAI/NoWarning_Llama3
|
5 |
- model: MrRobotoAI/MrRoboto-ProLong-8b-v2a
|
6 |
+
- model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
7 |
+
|
8 |
merge_method: model_stock
|
9 |
base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
|
10 |
normalize: true
|
11 |
+
dtype: float16
|
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4953586328
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92cb552475b0187e17fdb980fa0765c942d6a27885c4b67f00983d9bddfcaf1d
|
3 |
size 4953586328
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b00997fb334656caff8c1a584ba77fb91d1da02c73a29c69543bed649c1606ec
|
3 |
size 4999819232
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916048
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a3c660fe754c7dec80be8128e20321606ef950eb2f4827dfab66bba725b95c6
|
3 |
size 4915916048
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1191234448
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8494f1e8fc14242ba69803ca9fedc5172d0b67795ffde392651501382537863e
|
3 |
size 1191234448
|