nandavikas16 committed on
Commit
1eb2d66
1 Parent(s): 4eb5543

Model save

Browse files
README.md CHANGED
@@ -17,11 +17,11 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [facebook/bart-large-cnn](https://huggingface.co/facebook/bart-large-cnn) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.1209
21
- - Rouge1: 55.1221
22
- - Rouge2: 41.5118
23
- - Rougel: 44.1055
24
- - Rougelsum: 44.1111
25
 
26
  ## Model description
27
 
@@ -52,21 +52,21 @@ The following hyperparameters were used during training:
52
 
53
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
54
  |:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|
55
- | 0.6833 | 1.0 | 40 | 0.2361 | 49.6521 | 32.0116 | 37.6798 | 37.6414 |
56
- | 0.2662 | 2.0 | 80 | 0.2113 | 51.0105 | 34.9383 | 38.5987 | 38.7128 |
57
- | 0.2372 | 3.0 | 120 | 0.1899 | 49.9708 | 34.1358 | 39.2319 | 39.256 |
58
- | 0.2295 | 4.0 | 160 | 0.1781 | 52.0623 | 36.7753 | 39.7153 | 39.7944 |
59
- | 0.2022 | 5.0 | 200 | 0.1613 | 53.525 | 37.8889 | 42.8148 | 42.8252 |
60
- | 0.204 | 6.0 | 240 | 0.1561 | 54.6369 | 39.0632 | 42.0898 | 42.0239 |
61
- | 0.1801 | 7.0 | 280 | 0.1409 | 54.6083 | 39.9751 | 43.8491 | 43.8897 |
62
- | 0.175 | 8.0 | 320 | 0.1329 | 54.9258 | 40.6335 | 44.7135 | 44.6887 |
63
- | 0.1715 | 9.0 | 360 | 0.1331 | 56.8449 | 41.313 | 43.4297 | 43.56 |
64
- | 0.1551 | 10.0 | 400 | 0.1209 | 55.1221 | 41.5118 | 44.1055 | 44.1111 |
65
 
66
 
67
  ### Framework versions
68
 
69
- - Transformers 4.40.1
70
- - Pytorch 2.3.0+cu121
71
- - Datasets 2.19.0
72
  - Tokenizers 0.19.1
 
17
 
18
  This model is a fine-tuned version of [facebook/bart-large-cnn](https://huggingface.co/facebook/bart-large-cnn) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.1309
21
+ - Rouge1: 52.6236
22
+ - Rouge2: 39.8632
23
+ - Rougel: 43.4607
24
+ - Rougelsum: 43.3561
25
 
26
  ## Model description
27
 
 
52
 
53
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
54
  |:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|
55
+ | 0.5104 | 1.0 | 34 | 0.2207 | 41.732 | 26.7717 | 31.2807 | 31.3611 |
56
+ | 0.2181 | 2.0 | 68 | 0.2001 | 44.5268 | 30.0523 | 34.7912 | 35.0095 |
57
+ | 0.1824 | 3.0 | 102 | 0.1995 | 45.4038 | 32.6808 | 36.3856 | 36.4004 |
58
+ | 0.1851 | 4.0 | 136 | 0.1728 | 48.85 | 35.9202 | 39.2826 | 39.1813 |
59
+ | 0.1692 | 5.0 | 170 | 0.1663 | 47.1374 | 34.5505 | 37.8192 | 37.8176 |
60
+ | 0.164 | 6.0 | 204 | 0.1594 | 50.3895 | 37.8751 | 40.4181 | 40.3778 |
61
+ | 0.1534 | 7.0 | 238 | 0.1526 | 50.7178 | 38.8207 | 41.5719 | 41.6111 |
62
+ | 0.1421 | 8.0 | 272 | 0.1424 | 51.3382 | 38.6796 | 40.4545 | 40.3891 |
63
+ | 0.1423 | 9.0 | 306 | 0.1354 | 53.8161 | 41.0736 | 45.1571 | 45.0427 |
64
+ | 0.1336 | 10.0 | 340 | 0.1309 | 52.6236 | 39.8632 | 43.4607 | 43.3561 |
65
 
66
 
67
  ### Framework versions
68
 
69
+ - Transformers 4.41.2
70
+ - Pytorch 2.3.1+cu121
71
+ - Datasets 2.20.0
72
  - Tokenizers 0.19.1
config.json CHANGED
@@ -65,7 +65,7 @@
65
  }
66
  },
67
  "torch_dtype": "float32",
68
- "transformers_version": "4.40.1",
69
  "use_cache": false,
70
  "vocab_size": 50264
71
  }
 
65
  }
66
  },
67
  "torch_dtype": "float32",
68
+ "transformers_version": "4.41.2",
69
  "use_cache": false,
70
  "vocab_size": 50264
71
  }
generation_config.json CHANGED
@@ -11,6 +11,6 @@
11
  "no_repeat_ngram_size": 3,
12
  "num_beams": 4,
13
  "pad_token_id": 1,
14
- "transformers_version": "4.40.1",
15
  "use_cache": false
16
  }
 
11
  "no_repeat_ngram_size": 3,
12
  "num_beams": 4,
13
  "pad_token_id": 1,
14
+ "transformers_version": "4.41.2",
15
  "use_cache": false
16
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:238de40f0c150736b32683a76be68b3534141f618d53da8a915d68df4040939b
3
  size 1625422896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f8a2b7a5c5d36dea3021ffa0a2ea474abb1d9a6c6c749acbbd8bca4543f3be2
3
  size 1625422896
runs/Jun18_20-50-06_nhva9sd5jo/events.out.tfevents.1718744436.nhva9sd5jo.455.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc26455f2d0ef6e2932a122fbb051c3f2d8d9d1e5bc356125c4ca1d00878f5be
3
+ size 13207
runs/Jun18_20-50-06_nhva9sd5jo/events.out.tfevents.1718748010.nhva9sd5jo.455.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f198a789ca896f4b46742a20d9ffc0b1c4e4e34e2a56a857e44a37a2727a6ac4
3
+ size 514
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a944bc09dc8d916d3117d2a2992809bdb3357cb5a3741bc4ec716fdf4988dc5
3
- size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e84ce033218d186f2869281b79882a8cfc2a7a820ecc77b553552f0ac2b342e
3
+ size 5304