laquythang committed on
Commit
9e1f312
1 Parent(s): 37ac2cc

End of training

Browse files
README.md CHANGED
@@ -105,7 +105,7 @@ xformers_attention: null
105
 
106
  This model is a fine-tuned version of [EleutherAI/pythia-1b](https://huggingface.co/EleutherAI/pythia-1b) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
- - Loss: 3.6513
109
 
110
  ## Model description
111
 
@@ -140,9 +140,9 @@ The following hyperparameters were used during training:
140
  | Training Loss | Epoch | Step | Validation Loss |
141
  |:-------------:|:------:|:----:|:---------------:|
142
  | 26.2925 | 0.0022 | 1 | 6.3621 |
143
- | 31.4505 | 0.0065 | 3 | 6.0551 |
144
- | 24.3794 | 0.0130 | 6 | 4.7808 |
145
- | 17.7134 | 0.0196 | 9 | 3.6513 |
146
 
147
 
148
  ### Framework versions
 
105
 
106
  This model is a fine-tuned version of [EleutherAI/pythia-1b](https://huggingface.co/EleutherAI/pythia-1b) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
+ - Loss: 3.6329
109
 
110
  ## Model description
111
 
 
140
  | Training Loss | Epoch | Step | Validation Loss |
141
  |:-------------:|:------:|:----:|:---------------:|
142
  | 26.2925 | 0.0022 | 1 | 6.3621 |
143
+ | 31.458 | 0.0065 | 3 | 6.0527 |
144
+ | 24.4518 | 0.0130 | 6 | 4.7729 |
145
+ | 17.4177 | 0.0196 | 9 | 3.6329 |
146
 
147
 
148
  ### Framework versions
adapter_config.json CHANGED
@@ -20,10 +20,10 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "dense",
24
  "query_key_value",
25
- "dense_4h_to_h",
26
- "dense_h_to_4h"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "dense_h_to_4h",
24
  "query_key_value",
25
+ "dense",
26
+ "dense_4h_to_h"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4f0d76be970bf2f086a9c154c6862f40882b7c43e1ee9100da508ad548e0ab6
3
  size 33601418
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5c4e31bdc6eb971f3f287de0adbcee7bc937f71022a21c6ecf8a82af24e1f51
3
  size 33601418
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57d10411134e4e8b7edda32ed065076e3056c883ffa784c0858322790cbad7b6
3
  size 33572288
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d45b8f2e0055ebb30f1397db12b068ac241a6c0352338292f386717953cc3b0d
3
  size 33572288
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7039ee5e93e39ae75f53f38b044442799d1e30cd7ff9a83e519c275615c657cc
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5626cd2613597d38b016ac503b35d867aeed1b5b31a1151465dc38b87f3fc7b
3
  size 6776