LoneStriker committed on
Commit
8dec3d1
1 Parent(s): e8715ca

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -1,35 +1,9 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
+ KafkaLM-8x7b-German-V0.1-DPO-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
2
+ KafkaLM-8x7b-German-V0.1-DPO-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
3
+ KafkaLM-8x7b-German-V0.1-DPO-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
4
+ KafkaLM-8x7b-German-V0.1-DPO-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
5
+ KafkaLM-8x7b-German-V0.1-DPO-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
6
+ KafkaLM-8x7b-German-V0.1-DPO-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
7
+ KafkaLM-8x7b-German-V0.1-DPO-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
8
+ KafkaLM-8x7b-German-V0.1-DPO-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
9
+ KafkaLM-8x7b-German-V0.1-DPO-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
KafkaLM-8x7b-German-V0.1-DPO-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ff784695db69fa0d15c9beb21fb73a5d50416384cecf9d03c82b2765e6dca88
3
+ size 17309173152
KafkaLM-8x7b-German-V0.1-DPO-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae8c09a1839e7f58c99d2658311d2960dbeee2dd661e91cfaf44d49c71439ec5
3
+ size 24167589280
KafkaLM-8x7b-German-V0.1-DPO-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa46a893bdd43d6feb2888cb9c49700e09f71753d8b86d908ce9cb99373e9650
3
+ size 22544393632
KafkaLM-8x7b-German-V0.1-DPO-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:603aa7d853fd04d326c281a9e8dfe5d533c12affa77a49d8ec2ef9db76a0a4e5
3
+ size 20430464416
KafkaLM-8x7b-German-V0.1-DPO-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f32b2fae36c67670dcbf23ba2bafc72ede27cc19938d0f61396d605d24712521
3
+ size 28446410144
KafkaLM-8x7b-German-V0.1-DPO-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4bd67e389e9be836bbfe3ca9df076be47bead6811c4934e9598695152efed84
3
+ size 26743522720
KafkaLM-8x7b-German-V0.1-DPO-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7836a380a8171a15317033637304eca39e2b4fabe9d8f8d5f7512473c511e8ce
3
+ size 33227523488
KafkaLM-8x7b-German-V0.1-DPO-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:924e00e69c70a24fcf40a85394662a1e3c9dcb8664810cb23b91848e3f8788d7
3
+ size 32229279136
KafkaLM-8x7b-German-V0.1-DPO-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d4c22a1f56906b31a90c9f06be04c85175cc93e88bf5af571d6e1e6390bd1f8
3
+ size 38378759584
README.md ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ tags:
4
+ - deutsch
5
+ - german
6
+ - seedbox
7
+ - mistral
8
+ - mixtral
9
+ license: apache-2.0
10
+ datasets:
11
+ - seedboxai/multitask_german_examples_32k
12
+ - seedboxai/ultra_feedback_german_modified_v1
13
+ language:
14
+ - de
15
+ pipeline_tag: text-generation
16
+ ---
17
+
18
+ ![image/jpeg](https://cdn-uploads.huggingface.co/production/uploads/645ded34a45b4182d7f5c385/9QywLGTbRrHYSq-m6fQmJ.jpeg)
19
+
20
+
21
+ # KafkaLM-8x7b-German-V0.1
22
+
23
+ **KafkaLM 8x7b** is a MoE model based on [Mistral AI's Mixtral 8x7b](https://mistral.ai/news/mixtral-of-experts/) which was finetuned on an ensemble of popular high-quality open-source instruction sets (translated from English to German).
24
+
25
+ KafkaLM 8x7b is a [Seedbox](https://huggingface.co/seedboxai) project trained by [Dennis Dickmann](https://huggingface.co/doubledsbv).
26
+
27
+ **Why Kafka?**
28
+ The models are proficient yet creative, and have a tendency to push linguistic boundaries 😊
29
+
30
+
31
+ ## Model Details
32
+
33
+ The purpose of releasing the **KafkaLM series** is to contribute to the German AI community with a set of fine-tuned LLMs that are easy to use in everyday applications across a variety of tasks.
34
+
35
+ The main goal was to provide LLMs proficient in German, especially to be used in German-speaking business contexts where English alone is not sufficient.
36
+
37
+ ### DPO
38
+
39
+ The model has been aligned with a modified German version of the UltraFeedback dataset from Hugging Face.
40
+
41
+ ### Dataset
42
+
43
+ I used an 8k filtered version of the following dataset: [seedboxai/multitask_german_examples_32k](https://huggingface.co/datasets/seedboxai/multitask_german_examples_32k)
44
+
45
+ ### Prompt Format
46
+
47
+
48
+ This model uses the following prompt format:
49
+
50
+ ```
51
+ <|system|>
52
+ Du bist ein freundlicher und hilfsbereiter KI-Assistent. Du beantwortest Fragen faktenorientiert und präzise, ohne dabei relevante Fakten auszulassen.</s>
53
+ <|user|>
54
+ Welche Möglichkeiten der energetischen Sanierung habe ich neben Solar und Energiespeicher?</s>
55
+ <|assistant|>
56
+ ```
57
+
58
+ ### Inference
59
+
60
+ Getting started with the model is straightforward:
61
+
62
+ ```python
63
+ import transformers
+ from transformers import AutoModelForCausalLM, AutoTokenizer
64
+
65
+ model_id = "seedboxai/KafkaLM-8x7B-German-V0.1-DPO"
66
+
67
+ model = AutoModelForCausalLM.from_pretrained(model_id, load_in_4bit=True, trust_remote_code=True)
68
+
69
+ tokenizer = AutoTokenizer.from_pretrained(model_id)
70
+
71
+ def generate_prompt(input):
72
+ prompt = ''
73
+ sys_prompt = "Du bist ein freundlicher und hilfsbereiter KI-Assistent. Du beantwortest Fragen faktenorientiert und präzise, ohne dabei relevante Fakten auszulassen."
74
+
75
+ prompt += f"<|system|>\n{sys_prompt.strip()}</s>\n"
76
+ prompt += f"<|user|>\n{input.strip()}</s>\n"
77
+ prompt += f"<|assistant|>\n"
78
+
79
+ return prompt.strip()
80
+
81
+
82
+ generate_text = transformers.pipeline(
83
+ model=model, tokenizer=tokenizer,
84
+ return_full_text=True,
85
+ task='text-generation',
86
+ temperature=0.5,
87
+ max_new_tokens=512,
88
+ top_p=0.95,
89
+ top_k=50,
90
+ do_sample=True,
91
+ )
92
+
93
+ print(generate_text(generate_prompt("Wer ist eigentlich dieser Kafka?")))
94
+
95
+ ```
96
+
97
+ ## Disclaimer
98
+
99
+ The license on this model does not constitute legal advice. We are not responsible for the actions of third parties who use this model.
100
+ This model should only be used for research purposes. The original Llama2 license and all restrictions of datasets used to train this model apply.
huggingface-metadata.txt ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ url: https://huggingface.co/seedboxai/KafkaLM-8x7b-German-V0.1-DPO
2
+ branch: main
3
+ download date: 2024-02-15 10:26:37
4
+ sha256sum:
5
+ 5c990c6ea3bdfcde5d6fa97a20f7bb8489e8c7338644e2b22f8cf25818ce9e11 model-00001-of-00039.safetensors
6
+ fe7646c12dd730078c98f2d44297b44458307dd12767b467b4f86a2984f1de47 model-00002-of-00039.safetensors
7
+ 13f19a49293abe99a576b0ce3929cc07ef41f27d0c9baaa3f52f68970b6720d4 model-00003-of-00039.safetensors
8
+ d518bfaaaed4ab6745318fd3547c4a30ad8f5dc9ed3880e23597976d34c68554 model-00004-of-00039.safetensors
9
+ 7cadcd62f958377f8c6ecd2a8d91789b39d947608ef5966dcbe1c4a1f47049d0 model-00005-of-00039.safetensors
10
+ 0db04d581cc8843ee905224a263c533aea2bc040df93ebd9e21f7485ea753132 model-00006-of-00039.safetensors
11
+ ff5119411700efc0b0d80b0e7b364eddbfb9847f91c3296e0b344acd981fcbd2 model-00007-of-00039.safetensors
12
+ f2d6314b97e43abad0e93d8fb3fdf2a1ff8dc7dd1e18d56abf07334ca1b56096 model-00008-of-00039.safetensors
13
+ b83d7e18dfbcca682465e23367fcb93655e2d5fe60ff00371b49844cdeb98b8b model-00009-of-00039.safetensors
14
+ 040485aa8f9d4d146e0b248ddcf16d2593ab47a156f026543ba659783bee51d8 model-00010-of-00039.safetensors
15
+ f9fda815c4e401d63794a75664e4454086808cada111685d56ccf9590e6fe54b model-00011-of-00039.safetensors
16
+ e7ac62fa7b4945beaa9aa2541df84b1b3df5cdce7d1af1accd308384ce7ddc9c model-00012-of-00039.safetensors
17
+ 41f87398271754733a0667682eb8ef4d211d1aab970ab86cff5bdca322f8a8df model-00013-of-00039.safetensors
18
+ b1c4e598453fdcc597b6291e8b4788b21cab23be4f1b806e0871ab4140680603 model-00014-of-00039.safetensors
19
+ eb037b28ce4cd25ae3f235c22a40735520ec542c14da4c335de353b6155e1835 model-00015-of-00039.safetensors
20
+ 0e2e178b8bedb7d402569aa1a1dbfa1fe3161944d2854b255eee94c73162015f model-00016-of-00039.safetensors
21
+ 76943d899f6924da8272f4cc50d02e8864de99158d355bc35f5ba0e8915a858e model-00017-of-00039.safetensors
22
+ 434c588897cde14211182cfd7d2eade857b0addd8c9c409655f72b1d005b910e model-00018-of-00039.safetensors
23
+ c5bdbc41a8f2386b2ecfb6ff9844e26deec4023ada34b3f2dd555506f5ef9d73 model-00019-of-00039.safetensors
24
+ d58562d1f02dd718c7ed1da1fd0ca6f73c9e356cb3bffcc5d93106b61a9359a3 model-00020-of-00039.safetensors
25
+ 26fab439fad7a239ae79a27dad2dbc7ca9ff1c35ffaad6c28922f7a1f91f81b2 model-00021-of-00039.safetensors
26
+ f809057c08a390638024321e4c22d68c25dc5de15033bf875ccb4e3f807d1dd9 model-00022-of-00039.safetensors
27
+ 24141d66049ad3723104e8f55a99b90afb2e1dfe74cf42919ae4ef4c8a117ee0 model-00023-of-00039.safetensors
28
+ 25d5c910e8270ede8c48a189549fc8818e26913f1a7421ba02b5b95e8e4e22ee model-00024-of-00039.safetensors
29
+ 64dec72f25781d1370290a1a67c908fe326e6e088b544e5c3598810d25fa4160 model-00025-of-00039.safetensors
30
+ f5c3a336a71bee7c2eb841c8a4a26b05ad034d691124108c7773b4b42809f0be model-00026-of-00039.safetensors
31
+ 4878787645006ae7b52fd7c53bbb26ff450d0ebdd179292d0bc532b6586492d2 model-00027-of-00039.safetensors
32
+ 0b7b39c7adc025284ad8e514487ecd4939bafc7386ae9deea94c528970b145d8 model-00028-of-00039.safetensors
33
+ 1e588bb3ca105a72e84a20e4230eb799e86539bd5e5e27009446af45ce139dff model-00029-of-00039.safetensors
34
+ 58294165ab3abb9ef2a73e7d93aaab5b638bdb419aae60249c50bd7deb088188 model-00030-of-00039.safetensors
35
+ c14e641970ea2f713977d63036547814ccd243f2681352ec941570d9df17312a model-00031-of-00039.safetensors
36
+ 2b2c94d4d9fd8996474fde5ff1b568fbbdafeb130c7a7027dd48acfbf2413274 model-00032-of-00039.safetensors
37
+ 03f06fe39f9c0fa4dd8dd18894a9c54ffc0267a5b29c677c8fc65ce7d4542010 model-00033-of-00039.safetensors
38
+ f241bf09bf2c482c01267eaca0d609ca76897ebb095f5811d17885bf376584b6 model-00034-of-00039.safetensors
39
+ 7dc056901ca382f1411315fdb058f5e81d94c84891eccd84f52f7305b55ce2af model-00035-of-00039.safetensors
40
+ 906664c2b302d64f59ac8b77f1574f96b4a8e050fd30a127d57ef3af119a68a1 model-00036-of-00039.safetensors
41
+ 57525a3d3d422788d35b394624fea656a5d8f7d1cc987d8377b7963bf006d34d model-00037-of-00039.safetensors
42
+ 1f6c9be67ffd7c39216759c94e4eb835ae455b9a1f15d3d2facd28a90774a0ce model-00038-of-00039.safetensors
43
+ cf35d1c660a0ff1e3715fafc0b3575c26e9ed2bc1a9ba618db23aaab1bd44cb2 model-00039-of-00039.safetensors