Steelskull committed on
Commit
8fd8d3c
1 Parent(s): 2e727f6

Upload folder using huggingface_hub

Browse files
Files changed (22) hide show
  1. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/config.json +30 -0
  2. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/mergekit_moe_config.yml +120 -0
  3. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00001-of-00015.safetensors +3 -0
  4. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00002-of-00015.safetensors +3 -0
  5. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00003-of-00015.safetensors +3 -0
  6. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00004-of-00015.safetensors +3 -0
  7. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00005-of-00015.safetensors +3 -0
  8. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00006-of-00015.safetensors +3 -0
  9. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00007-of-00015.safetensors +3 -0
  10. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00008-of-00015.safetensors +3 -0
  11. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00009-of-00015.safetensors +3 -0
  12. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00010-of-00015.safetensors +3 -0
  13. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00011-of-00015.safetensors +3 -0
  14. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00012-of-00015.safetensors +3 -0
  15. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00013-of-00015.safetensors +3 -0
  16. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00014-of-00015.safetensors +3 -0
  17. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00015-of-00015.safetensors +3 -0
  18. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model.safetensors.index.json +0 -0
  19. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/special_tokens_map.json +24 -0
  20. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/tokenizer.json +0 -0
  21. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/tokenizer.model +3 -0
  22. https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/tokenizer_config.json +43 -0
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "vicgalle/CarbonBeagle-11B",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 4096,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 14336,
13
+ "max_position_embeddings": 32768,
14
+ "model_type": "mixtral",
15
+ "num_attention_heads": 32,
16
+ "num_experts_per_tok": 2,
17
+ "num_hidden_layers": 48,
18
+ "num_key_value_heads": 8,
19
+ "num_local_experts": 8,
20
+ "output_router_logits": false,
21
+ "rms_norm_eps": 1e-05,
22
+ "rope_theta": 10000.0,
23
+ "router_aux_loss_coef": 0.001,
24
+ "sliding_window": null,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.37.1",
28
+ "use_cache": false,
29
+ "vocab_size": 32000
30
+ }
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/mergekit_moe_config.yml ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ base_model: vicgalle/CarbonBeagle-11B
3
+ gate_mode: hidden
4
+ dtype: bfloat16
5
+
6
+ experts:
7
+ - source_model: Sao10K/Fimbulvetr-10.7B-v1
8
+ positive_prompts:
9
+ - "Complex narrative development in fantasy and sci-fi genres"
10
+ - "Character-driven storytelling with deep emotional layers"
11
+ - "Interactive and dynamic role-playing game scenarios"
12
+ - "Developing intricate plot twists in fictional stories"
13
+ - "Crafting dialogues with rich and diverse character backgrounds"
14
+ - "Elaborate world-building in creative writing"
15
+ - "Integrating myths and legends into modern storytelling"
16
+ - "Designing engaging story arcs with unexpected endings"
17
+ negative_prompts:
18
+ - "Technical, scientific, or academic writing"
19
+ - "Factual reporting and data-based inquiries"
20
+
21
+ - source_model: maywell/PiVoT-10.7B-Mistral-v0.2-RP
22
+ positive_prompts:
23
+ - "Introductory-level creative writing and storytelling"
24
+ - "Basic character creation and simple plot lines"
25
+ - "Guiding new writers in developing narrative skills"
26
+ - "Role-play scenarios for language learning purposes"
27
+ - "Crafting straightforward and linear stories"
28
+ - "Simple dialogue writing for beginner storytellers"
29
+ - "Assisting in basic storyboarding and scene setting"
30
+ - "Creative exercises for amateur writers and role-players"
31
+ negative_prompts:
32
+ - "Complex literary analysis or critique"
33
+ - "Advanced academic content and technical writing"
34
+
35
+ - source_model: fblgit/UNA-POLAR-10.7B-InstructMath-v2
36
+ positive_prompts:
37
+ - "Advanced mathematical theories and problem-solving"
38
+ - "Instructional content on higher-level math topics"
39
+ - "Explaining mathematical concepts in applied sciences"
40
+ - "Guidance on complex STEM-based academic projects"
41
+ - "Quantitative analysis in economics and finance"
42
+ - "Logical reasoning in computer science and engineering"
43
+ - "Mathematical modeling and statistical analysis"
44
+ - "Developing educational STEM content for advanced learners"
45
+ negative_prompts:
46
+ - "Creative and narrative writing tasks"
47
+ - "General knowledge queries outside of STEM"
48
+
49
+ - source_model: Yhyu13/LMCocktail-10.7B-v1
50
+ positive_prompts:
51
+ - "Practical applications of scientific knowledge in everyday life"
52
+ - "Instructional guides on basic to intermediate STEM topics"
53
+ - "Explaining scientific phenomena to non-experts"
54
+ - "STEM-focused educational content for high school level"
55
+ - "Guidance on science fair projects and experiments"
56
+ - "Simple to moderate math problem-solving for educational purposes"
57
+ - "Answering common science and technology questions"
58
+ - "Providing clear explanations of scientific concepts"
59
+ negative_prompts:
60
+ - "In-depth literary or creative writing"
61
+ - "Advanced theoretical or abstract scientific research"
62
+
63
+ - source_model: vicgalle/CarbonBeagle-11B
64
+ positive_prompts:
65
+ - "Complex real-world problem-solving across various domains"
66
+ - "Interdisciplinary knowledge inquiries blending science, history, and culture"
67
+ - "In-depth discussions on historical events and their impact"
68
+ - "Exploring global issues and their socio-economic aspects"
69
+ - "Comprehensive explanations of contemporary topics"
70
+ - "Multifaceted analysis of current affairs"
71
+ - "Insights into cultural phenomena and trends"
72
+ - "Detailed explorations of technological advancements"
73
+ negative_prompts:
74
+ - "Highly technical scientific research"
75
+ - "Creative fiction and narrative story creation"
76
+
77
+ - source_model: DopeorNope/SOLARC-M-10.7B
78
+ positive_prompts:
79
+ - "Factual information and data analysis across a variety of topics"
80
+ - "Clarifying misconceptions in popular science and history"
81
+ - "Answering trivia and general inquiries with detailed explanations"
82
+ - "Providing nuanced perspectives on current events"
83
+ - "Exploring the intersection of technology and society"
84
+ - "Educational content on general health and wellness"
85
+ - "Guidance on everyday legal and financial questions"
86
+ - "Overview of global cultural and geographical knowledge"
87
+ negative_prompts:
88
+ - "Deeply technical or niche academic subjects"
89
+ - "Elaborate fictional writing and creative storytelling"
90
+
91
+ - source_model: bn22/Nous-Hermes-2-SOLAR-10.7B-MISALIGNED
92
+ positive_prompts:
93
+ - "In-depth academic research support in social sciences"
94
+ - "Logical analysis in economics and business studies"
95
+ - "Scientific explanations in environmental studies"
96
+ - "Data interpretation in political science and sociology"
97
+ - "Assistance with academic writing in humanities"
98
+ - "Problem-solving in logic-based disciplines"
99
+ - "Critical thinking and argumentation in philosophy"
100
+ - "Analyzing historical data and trends"
101
+ negative_prompts:
102
+ - "Creative story and character development"
103
+ - "Day-to-day general knowledge questions"
104
+ - "Mathematical calculations and STEM-focused queries"
105
+
106
+ - source_model: jeonsworld/CarbonVillain-en-10.7B-v4
107
+ positive_prompts:
108
+ - "Detailed scientific inquiry and research in technical fields"
109
+ - "Advanced data analysis and interpretation in STEM"
110
+ - "Complex problem-solving in physics and engineering"
111
+ - "In-depth exploration of biological and chemical concepts"
112
+ - "Technology-focused discussions and analyses"
113
+ - "Statistical modeling and data science applications"
114
+ - "Rigorous academic research in hard sciences"
115
+ - "Critical evaluations of scientific theories and studies"
116
+ negative_prompts:
117
+ - "Narrative writing and fictional storytelling"
118
+ - "Non-technical general knowledge inquiries"
119
+ - "Simple, everyday problem-solving tasks"
120
+
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00001-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd2ebcd672fa4e6c844e6425503549630d0afd19980a23d573e7c295f8d015f9
3
+ size 9919946528
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00002-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56c922f3b6edbdd700f2c5c757665a4867487408a312bbb9af85d9dad15507c4
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00003-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f1ccedc9169440feb9de29d716f1c9791fc54234035aa971201e29b2f610fd6
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00004-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0282d54081868ceb720faccedc9d702c7db7069987529de708e890ff025d6000
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00005-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4960ac38dd79bbe49d8c32ca16f3240955bf61565781f1d24733a5954ec9fbe
3
+ size 9982454720
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00006-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c7bbe0c20c9c95b534c63f9e6d4ad3c615ce16173b68ddb65bf5eff1da9e214
3
+ size 9982454712
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00007-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:693cdff8c21e690760d51fdd205e97fa6062bfa80352b8a7762efa1eb638c2ce
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00008-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd74497359c46df1c1cfdb3d5e24d8f783515e79f64ca96f6001fc7f3bbf428
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00009-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a220d3f0e053443678950fc667a86f54ce5d504f3a20d22c3416aee549a1a05
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00010-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe7eba3c7436997eadcf1c72b1f65bffa9e7a46cc07760d76c9a8afa9dc0d3e9
3
+ size 9982454680
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00011-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e93010792883f8fe7e4b762493c1b73ec9b5ec3355244d4810392925fb3a543d
3
+ size 9982454752
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00012-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e22180a213ce901d58a4cab9f73f02842936f53dc3fd3c621807c3cbe04ffff
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00013-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0226337c83a38389f109b093d0ca8621e966044ac5cc02f46c61e817ed781a54
3
+ size 9982454760
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00014-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5a93b3693f0c7fe86320663831e0653d2a230230b7dfa9f2447800446ec1ce6
3
+ size 9999648648
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model-00015-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b82d78fa11b4d34bd70f0901a7d553c60ddb1ef11fdcb2e8c3f642e38033fa2
3
+ size 137369408
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<s>",
17
+ "unk_token": {
18
+ "content": "<unk>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
https://huggingface.co/Steelskull/Celestria-MoE-8x10.7b/tree/main/tokenizer_config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "added_tokens_decoder": {
5
+ "0": {
6
+ "content": "<unk>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "1": {
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "2": {
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ }
29
+ },
30
+ "additional_special_tokens": [],
31
+ "bos_token": "<s>",
32
+ "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{% if message['content']%}{{'### System:\n' + message['content']+'\n\n'}}{% endif %}{% elif message['role'] == 'user' %}{{'### User:\n' + message['content']+'\n\n'}}{% elif message['role'] == 'assistant' %}{{'### Assistant:\n' + message['content']}}{% endif %}{% if loop.last and add_generation_prompt %}{{ '### Assistant:\n' }}{% endif %}{% endfor %}",
33
+ "clean_up_tokenization_spaces": false,
34
+ "eos_token": "</s>",
35
+ "legacy": true,
36
+ "model_max_length": 1000000000000000019884624838656,
37
+ "pad_token": "<s>",
38
+ "sp_model_kwargs": {},
39
+ "spaces_between_special_tokens": false,
40
+ "tokenizer_class": "LlamaTokenizer",
41
+ "unk_token": "<unk>",
42
+ "use_default_system_prompt": false
43
+ }