ingeniumacademy committed on
Commit
a6a46c9
1 Parent(s): 4770313

End of training

Browse files
README.md CHANGED
@@ -1,8 +1,9 @@
1
  ---
2
  license: mit
3
- base_model: ingeniumacademy/bart-cnn-samsum-finetuned
4
  tags:
5
  - generated_from_trainer
 
6
  datasets:
7
  - samsum
8
  model-index:
@@ -17,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [ingeniumacademy/bart-cnn-samsum-finetuned](https://huggingface.co/ingeniumacademy/bart-cnn-samsum-finetuned) on the samsum dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.2259
21
 
22
  ## Model description
23
 
@@ -48,16 +49,17 @@ The following hyperparameters were used during training:
48
 
49
  | Training Loss | Epoch | Step | Validation Loss |
50
  |:-------------:|:-----:|:----:|:---------------:|
51
- | 0.0766 | 1.0 | 74 | 0.2375 |
52
- | 0.0976 | 2.0 | 148 | 0.2499 |
53
- | 0.0684 | 3.0 | 222 | 0.2361 |
54
- | 0.085 | 4.0 | 296 | 0.2273 |
55
- | 0.0898 | 5.0 | 370 | 0.2259 |
56
 
57
 
58
  ### Framework versions
59
 
60
- - Transformers 4.33.1
61
- - Pytorch 2.0.1+cu118
62
- - Datasets 2.14.5
63
- - Tokenizers 0.13.3
 
 
1
  ---
2
  license: mit
3
+ library_name: peft
4
  tags:
5
  - generated_from_trainer
6
+ base_model: ingeniumacademy/bart-cnn-samsum-finetuned
7
  datasets:
8
  - samsum
9
  model-index:
 
18
 
19
  This model is a fine-tuned version of [ingeniumacademy/bart-cnn-samsum-finetuned](https://huggingface.co/ingeniumacademy/bart-cnn-samsum-finetuned) on the samsum dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.1345
22
 
23
  ## Model description
24
 
 
49
 
50
  | Training Loss | Epoch | Step | Validation Loss |
51
  |:-------------:|:-----:|:----:|:---------------:|
52
+ | 0.0788 | 1.0 | 19 | 0.1344 |
53
+ | 0.0873 | 2.0 | 38 | 0.1345 |
54
+ | 0.0777 | 3.0 | 57 | 0.1345 |
55
+ | 0.0796 | 4.0 | 76 | 0.1345 |
56
+ | 0.0924 | 5.0 | 95 | 0.1345 |
57
 
58
 
59
  ### Framework versions
60
 
61
+ - PEFT 0.11.1
62
+ - Transformers 4.41.1
63
+ - Pytorch 2.3.0+cu121
64
+ - Datasets 2.19.2
65
+ - Tokenizers 0.19.1
adapter_config.json CHANGED
@@ -1,21 +1,29 @@
1
  {
 
2
  "auto_mapping": null,
3
  "base_model_name_or_path": "ingeniumacademy/bart-cnn-samsum-finetuned",
4
  "bias": "none",
5
  "fan_in_fan_out": false,
6
  "inference_mode": true,
7
  "init_lora_weights": true,
 
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
 
10
  "lora_alpha": 32,
11
  "lora_dropout": 0.05,
 
 
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
  "r": 32,
 
15
  "revision": null,
16
  "target_modules": [
17
- "q_proj",
18
- "v_proj"
19
  ],
20
- "task_type": "SEQ_2_SEQ_LM"
 
 
21
  }
 
1
  {
2
+ "alpha_pattern": {},
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "ingeniumacademy/bart-cnn-samsum-finetuned",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
9
+ "layer_replication": null,
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
+ "loftq_config": {},
13
  "lora_alpha": 32,
14
  "lora_dropout": 0.05,
15
+ "megatron_config": null,
16
+ "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
  "r": 32,
20
+ "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "v_proj",
24
+ "q_proj"
25
  ],
26
+ "task_type": "SEQ_2_SEQ_LM",
27
+ "use_dora": false,
28
+ "use_rslora": false
29
  }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f14af5af655aaaff69b44b1ee96dd0a677628792760c7ce34ff77b02ca7a0a41
3
+ size 18894856
runs/Jun04_22-07-00_cc5be8c71c42/events.out.tfevents.1717538832.cc5be8c71c42.1105.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c39ab76bf910ce9020dcdd8c915d6428d7cd9643557227ebbd408d09a5a0d8d
3
+ size 9428
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:764892d477e05d8518acbe79d09ab1449f98bf0df54f3f33bd5e0402781b9c23
3
- size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad94524b00b5316b85621bf7860a5ae3d6ba8f096f76583efc55c36c3983bea8
3
+ size 5176