baltop committed on
Commit
81e224a
·
1 Parent(s): 53b532d

baltop/mistral-instruct-finetune

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.0305
20
 
21
  ## Model description
22
 
@@ -48,18 +48,18 @@ The following hyperparameters were used during training:
48
 
49
  | Training Loss | Epoch | Step | Validation Loss |
50
  |:-------------:|:-----:|:----:|:---------------:|
51
- | 1.1899 | 0.17 | 25 | 0.3116 |
52
- | 0.1795 | 0.33 | 50 | 0.1088 |
53
- | 0.0819 | 0.5 | 75 | 0.0425 |
54
- | 0.0453 | 0.67 | 100 | 0.0419 |
55
- | 0.0534 | 0.83 | 125 | 0.0382 |
56
- | 0.0338 | 1.0 | 150 | 0.0315 |
57
- | 0.0358 | 1.17 | 175 | 0.0345 |
58
- | 0.0336 | 1.33 | 200 | 0.0334 |
59
- | 0.0401 | 1.5 | 225 | 0.0322 |
60
- | 0.0326 | 1.67 | 250 | 0.0308 |
61
- | 0.0396 | 1.83 | 275 | 0.0309 |
62
- | 0.0307 | 2.0 | 300 | 0.0305 |
63
 
64
 
65
  ### Framework versions
 
16
 
17
  This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.0307
20
 
21
  ## Model description
22
 
 
48
 
49
  | Training Loss | Epoch | Step | Validation Loss |
50
  |:-------------:|:-----:|:----:|:---------------:|
51
+ | 1.1806 | 0.17 | 25 | 0.3104 |
52
+ | 0.1789 | 0.33 | 50 | 0.1074 |
53
+ | 0.0665 | 0.5 | 75 | 0.0420 |
54
+ | 0.0444 | 0.67 | 100 | 0.0414 |
55
+ | 0.05 | 0.83 | 125 | 0.0351 |
56
+ | 0.0322 | 1.0 | 150 | 0.0311 |
57
+ | 0.0361 | 1.17 | 175 | 0.0343 |
58
+ | 0.0338 | 1.33 | 200 | 0.0319 |
59
+ | 0.039 | 1.5 | 225 | 0.0322 |
60
+ | 0.0324 | 1.67 | 250 | 0.0304 |
61
+ | 0.0392 | 1.83 | 275 | 0.0309 |
62
+ | 0.0305 | 2.0 | 300 | 0.0307 |
63
 
64
 
65
  ### Framework versions
adapter_config.json CHANGED
@@ -19,13 +19,13 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
 
22
  "k_proj",
23
  "up_proj",
24
- "down_proj",
25
  "q_proj",
26
  "lm_head",
27
  "gate_proj",
28
- "v_proj",
29
  "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "v_proj",
23
+ "down_proj",
24
  "k_proj",
25
  "up_proj",
 
26
  "q_proj",
27
  "lm_head",
28
  "gate_proj",
 
29
  "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8818e6ea4830b84464c905ac6f94cfe80a63f77e51c2638d2bd0bcefa4dc7252
3
  size 864513616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fc6264c501532bf987ee0a4a8b3abe92f6cd9f3401bd7a759de754e4ec0e795
3
  size 864513616
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3590f49eb926244738eba44f5a2a5b93f3455bb0c8fe39c90b692c6cf1ea1736
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e21b1c43d06392b0c9b0f537763c90b02516bd21d3eed626cd2a59d8380ef01a
3
  size 4664