nblinh63 committed on
Commit
869aff3
·
verified ·
1 Parent(s): 729386f

End of training

Browse files
README.md CHANGED
@@ -96,7 +96,7 @@ xformers_attention: true
96
 
97
  This model is a fine-tuned version of [princeton-nlp/gemma-2-9b-it-SimPO](https://huggingface.co/princeton-nlp/gemma-2-9b-it-SimPO) on the None dataset.
98
  It achieves the following results on the evaluation set:
99
- - Loss: 2.9580
100
 
101
  ## Model description
102
 
@@ -128,7 +128,7 @@ The following hyperparameters were used during training:
128
 
129
  | Training Loss | Epoch | Step | Validation Loss |
130
  |:-------------:|:------:|:----:|:---------------:|
131
- | 2.9045 | 0.0002 | 10 | 2.9580 |
132
 
133
 
134
  ### Framework versions
 
96
 
97
  This model is a fine-tuned version of [princeton-nlp/gemma-2-9b-it-SimPO](https://huggingface.co/princeton-nlp/gemma-2-9b-it-SimPO) on the None dataset.
98
  It achieves the following results on the evaluation set:
99
+ - Loss: 2.9671
100
 
101
  ## Model description
102
 
 
128
 
129
  | Training Loss | Epoch | Step | Validation Loss |
130
  |:-------------:|:------:|:----:|:---------------:|
131
+ | 2.8899 | 0.0002 | 10 | 2.9671 |
132
 
133
 
134
  ### Framework versions
adapter_config.json CHANGED
@@ -21,12 +21,12 @@
21
  "revision": null,
22
  "target_modules": [
23
  "k_proj",
24
- "q_proj",
25
- "up_proj",
26
  "gate_proj",
 
 
27
  "o_proj",
28
- "down_proj",
29
- "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
21
  "revision": null,
22
  "target_modules": [
23
  "k_proj",
24
+ "down_proj",
 
25
  "gate_proj",
26
+ "q_proj",
27
+ "v_proj",
28
  "o_proj",
29
+ "up_proj"
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d87ee4da3889f67b16eedcdaacb3cabd224705b415104dba08bfbb8e0d31c73b
3
  size 216284090
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5588ed546ef6da45bfd35c12b2ff9441e49ac19faeb3df6a31632df2304b163
3
  size 216284090
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfc4a7fc2e1a6f01d3c26dbd53f738d0dff2feaad7c5d23971468e32c6433cdc
3
  size 216151256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d36e12e1b7633339c50968901f943f5adb35fc727228026cf3163878f2ecca6f
3
  size 216151256
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e9874ead154c1a0a17075a08fb08acdd5dfa5877d65694ee03b49336cadfd53
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52a22b0f5c5928fba83552206be6cfa499a233f428eef8f31fb1b44e7059a810
3
  size 6776