gyr66 committed on
Commit
fcc7a18
•
1 Parent(s): df70323

End of training

Browse files
Files changed (4) hide show
  1. README.md +27 -10
  2. config.json +2 -5
  3. model.safetensors +1 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -1,6 +1,11 @@
1
  ---
2
  tags:
3
  - generated_from_trainer
 
 
 
 
 
4
  model-index:
5
  - name: RoBERTa-ext-large-crf-chinese-finetuned-ner
6
  results: []
@@ -13,15 +18,11 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
- - eval_loss: 93.6921
17
- - eval_precision: 0.6788
18
- - eval_recall: 0.7538
19
- - eval_f1: 0.7143
20
- - eval_accuracy: 0.9634
21
- - eval_runtime: 23.7231
22
- - eval_samples_per_second: 21.203
23
- - eval_steps_per_second: 2.656
24
- - step: 0
25
 
26
  ## Model description
27
 
@@ -46,7 +47,23 @@ The following hyperparameters were used during training:
46
  - seed: 42
47
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
48
  - lr_scheduler_type: linear
49
- - num_epochs: 1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
 
51
  ### Framework versions
52
 
 
1
  ---
2
  tags:
3
  - generated_from_trainer
4
+ metrics:
5
+ - precision
6
+ - recall
7
+ - f1
8
+ - accuracy
9
  model-index:
10
  - name: RoBERTa-ext-large-crf-chinese-finetuned-ner
11
  results: []
 
18
 
19
  This model was trained from scratch on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.7186
22
+ - Precision: 0.6813
23
+ - Recall: 0.7573
24
+ - F1: 0.7173
25
+ - Accuracy: 0.9639
 
 
 
 
26
 
27
  ## Model description
28
 
 
47
  - seed: 42
48
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
49
  - lr_scheduler_type: linear
50
+ - num_epochs: 10
51
+
52
+ ### Training results
53
+
54
+ | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
55
+ |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
56
+ | 0.0197 | 1.0 | 503 | 0.6375 | 0.6663 | 0.7314 | 0.6973 | 0.9621 |
57
+ | 0.0251 | 2.0 | 1006 | 0.6048 | 0.6494 | 0.7435 | 0.6933 | 0.9611 |
58
+ | 0.0176 | 3.0 | 1509 | 0.6196 | 0.6669 | 0.7389 | 0.7011 | 0.9618 |
59
+ | 0.0116 | 4.0 | 2012 | 0.6361 | 0.6511 | 0.7560 | 0.6997 | 0.9624 |
60
+ | 0.0082 | 5.0 | 2515 | 0.6682 | 0.6746 | 0.7387 | 0.7052 | 0.9622 |
61
+ | 0.0067 | 6.0 | 3018 | 0.6587 | 0.6715 | 0.7409 | 0.7045 | 0.9635 |
62
+ | 0.0046 | 7.0 | 3521 | 0.6846 | 0.6770 | 0.7613 | 0.7167 | 0.9636 |
63
+ | 0.0019 | 8.0 | 4024 | 0.7081 | 0.6766 | 0.7510 | 0.7118 | 0.9630 |
64
+ | 0.0014 | 9.0 | 4527 | 0.7064 | 0.6812 | 0.7553 | 0.7163 | 0.9641 |
65
+ | 0.001 | 10.0 | 5030 | 0.7186 | 0.6813 | 0.7573 | 0.7173 | 0.9639 |
66
+
67
 
68
  ### Framework versions
69
 
config.json CHANGED
@@ -1,12 +1,9 @@
1
  {
2
- "_name_or_path": "gyr66/RoBERTa-ext-large-crf-chinese-finetuned-ner",
3
  "architectures": [
4
  "BertCrfForTokenClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "auto_map": {
8
- "AutoModelForTokenClassification": "model.BertCrfForTokenClassification"
9
- },
10
  "bos_token_id": 0,
11
  "classifier_dropout": null,
12
  "directionality": "bidi",
@@ -92,7 +89,7 @@
92
  "pooler_type": "first_token_transform",
93
  "position_embedding_type": "absolute",
94
  "torch_dtype": "float32",
95
- "transformers_version": "4.36.2",
96
  "type_vocab_size": 2,
97
  "use_cache": true,
98
  "vocab_size": 21128
 
1
  {
2
+ "_name_or_path": "./RoBERTa-ext-large-chinese-finetuned-ner",
3
  "architectures": [
4
  "BertCrfForTokenClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
 
 
7
  "bos_token_id": 0,
8
  "classifier_dropout": null,
9
  "directionality": "bidi",
 
89
  "pooler_type": "first_token_transform",
90
  "position_embedding_type": "absolute",
91
  "torch_dtype": "float32",
92
+ "transformers_version": "4.35.2",
93
  "type_vocab_size": 2,
94
  "use_cache": true,
95
  "vocab_size": 21128
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74054eb7525f1811fa4d9eb645e99008be1db9a50cf9a058f271ef4bbf641458
3
  size 1298060872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e59832720d5c9f592f83c8d61fb253d5ae9b360190d7833f8d214c8017e0050
3
  size 1298060872
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dca0bbb1c7d575f8c093b1d4826a8230a7cb1937f36a0f5b4f0536003486723
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d8ac636c9476822572910e287b4304549222e1270ea149729a3156f35fb5841
3
  size 4600