nandavikas16 committed on
Commit
1c222d4
1 Parent(s): 0e9e5da

Model save

Browse files
README.md CHANGED
@@ -16,11 +16,11 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [transformer3/H2-keywordextractor](https://huggingface.co/transformer3/H2-keywordextractor) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.0530
20
- - Rouge1: 27.6565
21
- - Rouge2: 24.482
22
- - Rougel: 27.5611
23
- - Rougelsum: 27.679
24
 
25
  ## Model description
26
 
@@ -51,31 +51,31 @@ The following hyperparameters were used during training:
51
 
52
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
53
  |:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|
54
- | 1.1006 | 1.0 | 23 | 0.4121 | 21.1334 | 15.2908 | 21.0076 | 21.0354 |
55
- | 0.4296 | 2.0 | 46 | 0.3515 | 23.1524 | 16.6481 | 23.1602 | 23.1359 |
56
- | 0.366 | 3.0 | 69 | 0.3156 | 24.2342 | 17.9896 | 24.1637 | 24.1872 |
57
- | 0.3263 | 4.0 | 92 | 0.2776 | 25.3692 | 20.5006 | 25.2976 | 25.3696 |
58
- | 0.2951 | 5.0 | 115 | 0.2587 | 25.929 | 21.3159 | 25.7701 | 25.7813 |
59
- | 0.2798 | 6.0 | 138 | 0.2455 | 27.017 | 23.0395 | 26.8045 | 26.8927 |
60
- | 0.2495 | 7.0 | 161 | 0.2234 | 27.5471 | 24.2424 | 27.3809 | 27.4542 |
61
- | 0.2442 | 8.0 | 184 | 0.2100 | 27.1387 | 23.3789 | 27.0447 | 27.141 |
62
- | 0.2203 | 9.0 | 207 | 0.1937 | 27.4281 | 24.1191 | 27.3809 | 27.4542 |
63
- | 0.2138 | 10.0 | 230 | 0.1733 | 27.2385 | 23.6012 | 27.1529 | 27.2287 |
64
- | 0.1921 | 11.0 | 253 | 0.1512 | 27.5491 | 24.2352 | 27.4878 | 27.5915 |
65
- | 0.1687 | 12.0 | 276 | 0.1339 | 27.5491 | 24.2352 | 27.4878 | 27.5915 |
66
- | 0.1615 | 13.0 | 299 | 0.1153 | 27.3214 | 23.9474 | 27.2381 | 27.3508 |
67
- | 0.1367 | 14.0 | 322 | 0.0990 | 27.3214 | 23.8383 | 27.2381 | 27.3508 |
68
- | 0.1282 | 15.0 | 345 | 0.0845 | 27.3214 | 23.8383 | 27.2381 | 27.3508 |
69
- | 0.1085 | 16.0 | 368 | 0.0784 | 27.4178 | 24.1053 | 27.3275 | 27.4506 |
70
- | 0.1018 | 17.0 | 391 | 0.0631 | 27.4471 | 24.1378 | 27.3612 | 27.4531 |
71
- | 0.085 | 18.0 | 414 | 0.0576 | 27.6565 | 24.482 | 27.5611 | 27.679 |
72
- | 0.0814 | 19.0 | 437 | 0.0545 | 27.6565 | 24.482 | 27.5611 | 27.679 |
73
- | 0.0708 | 20.0 | 460 | 0.0530 | 27.6565 | 24.482 | 27.5611 | 27.679 |
74
 
75
 
76
  ### Framework versions
77
 
78
- - Transformers 4.38.2
79
- - Pytorch 2.2.1+cu121
80
  - Datasets 2.18.0
81
  - Tokenizers 0.15.2
 
16
 
17
  This model is a fine-tuned version of [transformer3/H2-keywordextractor](https://huggingface.co/transformer3/H2-keywordextractor) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.2073
20
+ - Rouge1: 13.0222
21
+ - Rouge2: 10.4851
22
+ - Rougel: 13.0872
23
+ - Rougelsum: 13.1095
24
 
25
  ## Model description
26
 
 
51
 
52
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
53
  |:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|
54
+ | 0.8852 | 1.0 | 23 | 0.3103 | 10.3278 | 6.2988 | 10.3528 | 10.3293 |
55
+ | 0.2901 | 2.0 | 46 | 0.2825 | 10.8308 | 7.5214 | 10.8428 | 10.8103 |
56
+ | 0.2625 | 3.0 | 69 | 0.2711 | 12.0182 | 8.6415 | 12.0115 | 12.0537 |
57
+ | 0.2453 | 4.0 | 92 | 0.2550 | 12.9535 | 9.6936 | 12.9952 | 13.0384 |
58
+ | 0.2353 | 5.0 | 115 | 0.2464 | 11.2808 | 7.8603 | 11.3196 | 11.281 |
59
+ | 0.2338 | 6.0 | 138 | 0.2389 | 12.6604 | 9.6355 | 12.6519 | 12.6377 |
60
+ | 0.2183 | 7.0 | 161 | 0.2307 | 13.2591 | 10.6628 | 13.2399 | 13.2554 |
61
+ | 0.2143 | 8.0 | 184 | 0.2252 | 13.537 | 11.1632 | 13.5668 | 13.5957 |
62
+ | 0.2055 | 9.0 | 207 | 0.2206 | 13.7032 | 11.6575 | 13.7226 | 13.774 |
63
+ | 0.2022 | 10.0 | 230 | 0.2158 | 13.7727 | 11.5365 | 13.7404 | 13.8018 |
64
+ | 0.1961 | 11.0 | 253 | 0.2166 | 13.4062 | 11.2919 | 13.4698 | 13.4854 |
65
+ | 0.2018 | 12.0 | 276 | 0.2116 | 13.8406 | 11.852 | 13.8309 | 13.8995 |
66
+ | 0.1946 | 13.0 | 299 | 0.2131 | 12.5757 | 9.5775 | 12.5738 | 12.6535 |
67
+ | 0.1943 | 14.0 | 322 | 0.2142 | 11.617 | 9.0291 | 11.5311 | 11.7201 |
68
+ | 0.2068 | 15.0 | 345 | 0.2080 | 12.9136 | 10.2865 | 12.9659 | 12.9787 |
69
+ | 0.2051 | 16.0 | 368 | 0.2041 | 13.6492 | 11.6388 | 13.6506 | 13.7041 |
70
+ | 0.1887 | 17.0 | 391 | 0.2119 | 11.4317 | 8.2482 | 11.386 | 11.4313 |
71
+ | 0.1886 | 18.0 | 414 | 0.2097 | 13.0287 | 10.6547 | 13.0829 | 13.118 |
72
+ | 0.1887 | 19.0 | 437 | 0.2079 | 13.0073 | 10.5381 | 13.0514 | 13.1089 |
73
+ | 0.186 | 20.0 | 460 | 0.2073 | 13.0222 | 10.4851 | 13.0872 | 13.1095 |
74
 
75
 
76
  ### Framework versions
77
 
78
+ - Transformers 4.39.3
79
+ - Pytorch 2.2.2+cu121
80
  - Datasets 2.18.0
81
  - Tokenizers 0.15.2
config.json CHANGED
@@ -68,7 +68,7 @@
68
  }
69
  },
70
  "torch_dtype": "float32",
71
- "transformers_version": "4.38.2",
72
  "use_cache": false,
73
  "vocab_size": 50265
74
  }
 
68
  }
69
  },
70
  "torch_dtype": "float32",
71
+ "transformers_version": "4.39.3",
72
  "use_cache": false,
73
  "vocab_size": 50265
74
  }
generation_config.json CHANGED
@@ -7,6 +7,6 @@
7
  "no_repeat_ngram_size": 3,
8
  "num_beams": 4,
9
  "pad_token_id": 1,
10
- "transformers_version": "4.38.2",
11
  "use_cache": false
12
  }
 
7
  "no_repeat_ngram_size": 3,
8
  "num_beams": 4,
9
  "pad_token_id": 1,
10
+ "transformers_version": "4.39.3",
11
  "use_cache": false
12
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e59cbf7a1946d155989146a15398f61611bb82d64d60fa2729e7eaf3e5618487
3
  size 1625426996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd223c94e8561eeddc6f992bf6ce7b86a2c53d50f8cc607ac210ea3b4e572f7b
3
  size 1625426996
runs/Apr13_21-13-22_n7nm3al89c/events.out.tfevents.1713042808.n7nm3al89c.401.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd0df98880928abbe6c9e2c7a7a767d44fb4c3db89ad6cf0a08c36dfeab8884f
3
+ size 19917
runs/Apr13_21-13-22_n7nm3al89c/events.out.tfevents.1713044210.n7nm3al89c.401.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7009be83269c9e7f2f6df71273ebcf94b65e770e555071afc35052ad2053dee9
3
+ size 514
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 128,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 128
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 512,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 512
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:191a52283965306150907b02097ad74aebf797219a79dff27f12075ac6f90e25
3
- size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:253e502d761ea5b1935a8c4f23099ce53d0cf6afcbe227c2dd155d59191ca693
3
+ size 5176