cdcvd committed on
Commit
d60176e
1 Parent(s): 06cb419

End of training

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [roberta-large](https://huggingface.co/roberta-large) on the cdcvd/ejpfepj dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 1.0886
20
 
21
  ## Model description
22
 
@@ -45,58 +45,58 @@ The following hyperparameters were used during training:
45
 
46
  ### Training results
47
 
48
- | Training Loss | Epoch | Step | Validation Loss |
49
- |:-------------:|:-----:|:----:|:---------------:|
50
- | No log | 1.0 | 13 | 0.2459 |
51
- | No log | 2.0 | 26 | 0.1373 |
52
- | No log | 3.0 | 39 | 0.1105 |
53
- | No log | 4.0 | 52 | 0.1414 |
54
- | No log | 5.0 | 65 | 0.1707 |
55
- | No log | 6.0 | 78 | 0.1172 |
56
- | No log | 7.0 | 91 | 0.3309 |
57
- | No log | 8.0 | 104 | 0.5585 |
58
- | No log | 9.0 | 117 | 0.5192 |
59
- | No log | 10.0 | 130 | 0.5445 |
60
- | No log | 11.0 | 143 | 0.6039 |
61
- | No log | 12.0 | 156 | 0.5424 |
62
- | No log | 13.0 | 169 | 0.5210 |
63
- | No log | 14.0 | 182 | 0.5190 |
64
- | No log | 15.0 | 195 | 0.5433 |
65
- | No log | 16.0 | 208 | 0.5199 |
66
- | No log | 17.0 | 221 | 0.5309 |
67
- | No log | 18.0 | 234 | 0.5507 |
68
- | No log | 19.0 | 247 | 0.5427 |
69
- | No log | 20.0 | 260 | 0.5223 |
70
- | No log | 21.0 | 273 | 0.5194 |
71
- | No log | 22.0 | 286 | 0.5216 |
72
- | No log | 23.0 | 299 | 0.5248 |
73
- | No log | 24.0 | 312 | 0.5192 |
74
- | No log | 25.0 | 325 | 0.5409 |
75
- | No log | 26.0 | 338 | 0.5223 |
76
- | No log | 27.0 | 351 | 0.5719 |
77
- | No log | 28.0 | 364 | 0.5307 |
78
- | No log | 29.0 | 377 | 0.5576 |
79
- | No log | 30.0 | 390 | 0.5272 |
80
- | No log | 31.0 | 403 | 0.5193 |
81
- | No log | 32.0 | 416 | 0.5489 |
82
- | No log | 33.0 | 429 | 0.5215 |
83
- | No log | 34.0 | 442 | 0.5359 |
84
- | No log | 35.0 | 455 | 0.5728 |
85
- | No log | 36.0 | 468 | 0.5560 |
86
- | No log | 37.0 | 481 | 0.5765 |
87
- | No log | 38.0 | 494 | 0.5562 |
88
- | 0.4913 | 39.0 | 507 | 0.6608 |
89
- | 0.4913 | 40.0 | 520 | 0.7299 |
90
- | 0.4913 | 41.0 | 533 | 0.5850 |
91
- | 0.4913 | 42.0 | 546 | 0.7992 |
92
- | 0.4913 | 43.0 | 559 | 0.7670 |
93
- | 0.4913 | 44.0 | 572 | 0.9654 |
94
- | 0.4913 | 45.0 | 585 | 1.0347 |
95
- | 0.4913 | 46.0 | 598 | 0.9568 |
96
- | 0.4913 | 47.0 | 611 | 1.0205 |
97
- | 0.4913 | 48.0 | 624 | 1.0679 |
98
- | 0.4913 | 49.0 | 637 | 1.1054 |
99
- | 0.4913 | 50.0 | 650 | 1.0886 |
100
 
101
 
102
  ### Framework versions
 
16
 
17
  This model is a fine-tuned version of [roberta-large](https://huggingface.co/roberta-large) on the cdcvd/ejpfepj dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 1.0401
20
 
21
  ## Model description
22
 
 
45
 
46
  ### Training results
47
 
48
+ | Training Loss | Epoch | Step | Validation Loss |
49
+ |:-------------:|:-----:|:-----:|:---------------:|
50
+ | No log | 1.0 | 282 | 0.2349 |
51
+ | 0.3151 | 2.0 | 564 | 0.2351 |
52
+ | 0.3151 | 3.0 | 846 | 1.0534 |
53
+ | 0.7392 | 4.0 | 1128 | 1.0375 |
54
+ | 0.7392 | 5.0 | 1410 | 1.0487 |
55
+ | 1.0405 | 6.0 | 1692 | 1.0723 |
56
+ | 1.0405 | 7.0 | 1974 | 1.0318 |
57
+ | 1.0417 | 8.0 | 2256 | 1.0493 |
58
+ | 1.0345 | 9.0 | 2538 | 1.0539 |
59
+ | 1.0345 | 10.0 | 2820 | 1.0324 |
60
+ | 1.0339 | 11.0 | 3102 | 1.0663 |
61
+ | 1.0339 | 12.0 | 3384 | 1.0691 |
62
+ | 1.0303 | 13.0 | 3666 | 1.0563 |
63
+ | 1.0303 | 14.0 | 3948 | 1.0330 |
64
+ | 1.0369 | 15.0 | 4230 | 1.0519 |
65
+ | 1.0312 | 16.0 | 4512 | 1.0440 |
66
+ | 1.0312 | 17.0 | 4794 | 1.0440 |
67
+ | 1.0321 | 18.0 | 5076 | 1.0376 |
68
+ | 1.0321 | 19.0 | 5358 | 1.0358 |
69
+ | 1.0246 | 20.0 | 5640 | 1.0331 |
70
+ | 1.0246 | 21.0 | 5922 | 1.0538 |
71
+ | 1.0343 | 22.0 | 6204 | 1.0440 |
72
+ | 1.0343 | 23.0 | 6486 | 1.0444 |
73
+ | 1.0273 | 24.0 | 6768 | 1.0497 |
74
+ | 1.0277 | 25.0 | 7050 | 1.0471 |
75
+ | 1.0277 | 26.0 | 7332 | 1.0393 |
76
+ | 1.0216 | 27.0 | 7614 | 1.0835 |
77
+ | 1.0216 | 28.0 | 7896 | 1.0508 |
78
+ | 1.0312 | 29.0 | 8178 | 1.0246 |
79
+ | 1.0312 | 30.0 | 8460 | 1.0448 |
80
+ | 1.0297 | 31.0 | 8742 | 1.0344 |
81
+ | 1.0288 | 32.0 | 9024 | 1.0446 |
82
+ | 1.0288 | 33.0 | 9306 | 1.0415 |
83
+ | 1.0252 | 34.0 | 9588 | 1.0460 |
84
+ | 1.0252 | 35.0 | 9870 | 1.0295 |
85
+ | 1.0274 | 36.0 | 10152 | 1.0508 |
86
+ | 1.0274 | 37.0 | 10434 | 1.0470 |
87
+ | 1.0263 | 38.0 | 10716 | 1.0345 |
88
+ | 1.0263 | 39.0 | 10998 | 1.0322 |
89
+ | 1.0275 | 40.0 | 11280 | 1.0398 |
90
+ | 1.0263 | 41.0 | 11562 | 1.0496 |
91
+ | 1.0263 | 42.0 | 11844 | 1.0449 |
92
+ | 1.0248 | 43.0 | 12126 | 1.0404 |
93
+ | 1.0248 | 44.0 | 12408 | 1.0387 |
94
+ | 1.025 | 45.0 | 12690 | 1.0455 |
95
+ | 1.025 | 46.0 | 12972 | 1.0415 |
96
+ | 1.0222 | 47.0 | 13254 | 1.0497 |
97
+ | 1.0233 | 48.0 | 13536 | 1.0362 |
98
+ | 1.0233 | 49.0 | 13818 | 1.0392 |
99
+ | 1.0273 | 50.0 | 14100 | 1.0401 |
100
 
101
 
102
  ### Framework versions
adapter_config.json CHANGED
@@ -19,10 +19,10 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "value",
23
- "key",
24
  "query",
25
- "dense"
 
26
  ],
27
  "task_type": "TOKEN_CLS"
28
  }
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "dense",
 
23
  "query",
24
+ "value",
25
+ "key"
26
  ],
27
  "task_type": "TOKEN_CLS"
28
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c26b6150126b58ea3e42ffeedd71144ebb62028417f004de571da6f028b48c3
3
- size 28361760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75f8e9df83d7f584b872e3fe1928cfdb79b2e589b48ae00d70554425871b5d2b
3
+ size 28402776
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:457e660e78bee391797114873ca0ae5a1e385c88c7a29845907ac5623a01b3bb
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a055807ccad94dd2d8b4c734004e2df3b97d3ce636914eb3f45e999638a3366f
3
  size 4792