LoneStriker committed on
Commit
fdb7934
1 Parent(s): 368a4b1

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -1,35 +1,5 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
+ zephyr-7b-gemma-sft-v0.1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
2
+ zephyr-7b-gemma-sft-v0.1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
3
+ zephyr-7b-gemma-sft-v0.1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
4
+ zephyr-7b-gemma-sft-v0.1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
5
+ zephyr-7b-gemma-sft-v0.1-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
README.md ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: other
3
+ license_name: gemma-terms-of-use
4
+ license_link: https://ai.google.dev/gemma/terms
5
+ base_model: google/gemma-7b
6
+ tags:
7
+ - alignment-handbook
8
+ - trl
9
+ - sft
10
+ - generated_from_trainer
11
+ - trl
12
+ - sft
13
+ - generated_from_trainer
14
+ datasets:
15
+ - HuggingFaceH4/deita-10k-v0-sft
16
+ model-index:
17
+ - name: zephyr-7b-gemma-sft
18
+ results: []
19
+ language:
20
+ - en
21
+ ---
22
+
23
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
24
+ should probably proofread and complete it, then remove this comment. -->
25
+
26
+ # zephyr-7b-gemma-sft
27
+
28
+ This model is a fine-tuned version of [google/gemma-7b](https://huggingface.co/google/gemma-7b) on the [HuggingFaceH4/deita-10k-v0-sft](https://huggingface.co/datasets/HuggingFaceH4/deita-10k-v0-sft) dataset.
29
+ It achieves the following results on the evaluation set:
30
+ - Loss: 0.9732
31
+
32
+ ## Model description
33
+
34
+ More information needed
35
+
36
+ ## Intended uses & limitations
37
+
38
+ More information needed
39
+
40
+ ## Training and evaluation data
41
+
42
+ More information needed
43
+
44
+ ## Training procedure
45
+
46
+ ### Training hyperparameters
47
+
48
+ The following hyperparameters were used during training:
49
+ - learning_rate: 2e-05
50
+ - train_batch_size: 4
51
+ - eval_batch_size: 4
52
+ - seed: 42
53
+ - distributed_type: multi-GPU
54
+ - num_devices: 16
55
+ - gradient_accumulation_steps: 2
56
+ - total_train_batch_size: 128
57
+ - total_eval_batch_size: 64
58
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
59
+ - lr_scheduler_type: cosine
60
+ - lr_scheduler_warmup_ratio: 0.1
61
+ - num_epochs: 3
62
+
63
+ ### Training results
64
+
65
+ | Training Loss | Epoch | Step | Validation Loss |
66
+ |:-------------:|:-----:|:----:|:---------------:|
67
+ | 0.9482 | 1.0 | 299 | 0.9848 |
68
+ | 0.8139 | 2.0 | 599 | 0.9610 |
69
+ | 0.7220 | 2.99 | 897 | 0.9732 |
70
+
71
+
72
+ ### Framework versions
73
+
74
+ - Transformers 4.39.0.dev0
75
+ - Pytorch 2.1.2+cu121
76
+ - Datasets 2.14.6
77
+ - Tokenizers 0.15.1
huggingface-metadata.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ url: https://huggingface.co/HuggingFaceH4/zephyr-7b-gemma-sft-v0.1
2
+ branch: main
3
+ download date: 2024-03-01 22:09:44
4
+ sha256sum:
5
+ 10276a0f87e08f62e2829230be70ff541d6e234ffe356ddbf25abeb57433c01b model-00001-of-00004.safetensors
6
+ ad38dd72c60feb83f5f94b7c637f876a74d27a50fc122da30bf35b3213802a41 model-00002-of-00004.safetensors
7
+ 291250b5d90bd318addab6e1df790bf70cb702814540fbeff26a67d06ee5371c model-00003-of-00004.safetensors
8
+ 809106cf81c8dfa99d1e3e223e42289fc3b51f1227bfdf9070c4fd113858a448 model-00004-of-00004.safetensors
9
+ 22449cb9ef4bad0db7dd93b46ddff7ab7d6a654dd4f903e130ddb6361eac3af5 tokenizer.json
zephyr-7b-gemma-sft-v0.1-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c007c6196700d1fbebbd42c3cbd8449a716201451fa1f293b8231bb548101f85
3
+ size 4401867488
zephyr-7b-gemma-sft-v0.1-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4618148cb74c4e0f8d495116fb2101169d59e46847c6c0a09805ba067e4e1d10
3
+ size 5127006944
zephyr-7b-gemma-sft-v0.1-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9af8f99fe03d289e8c7fa3ad0cc9741e991fb8ed3958d7fe41d2be087051593
3
+ size 6040054496
zephyr-7b-gemma-sft-v0.1-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b93cf53fc921cbec1fb2f80596b5bc8d19d998b41dea26fe3ffd8077e91a8128
3
+ size 7010167520
zephyr-7b-gemma-sft-v0.1-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc567366cd5dab0b6985d06c10a983a292836744d6936cc1c79b8b994f6e7ad0
3
+ size 9077844704