lltala committed on
Commit
a2fed2a
1 Parent(s): 9882a6e

End of training

Browse files
Files changed (5)
  1. README.md +21 -1
  2. all_results.json +30 -0
  3. eval_results.json +24 -0
  4. train_results.json +9 -0
  5. trainer_state.json +28 -0
README.md CHANGED
@@ -3,6 +3,8 @@ license: mit
3
  base_model: roberta-base
4
  tags:
5
  - generated_from_trainer
 
 
6
  model-index:
7
  - name: ner__edgar_all_4-simple-no-valid-roberta-base__roberta-base
8
  results: []
@@ -13,7 +15,25 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # ner__edgar_all_4-simple-no-valid-roberta-base__roberta-base
15
 
16
- This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on an unknown dataset.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
 
18
  ## Model description
19
 
 
3
  base_model: roberta-base
4
  tags:
5
  - generated_from_trainer
6
+ datasets:
7
+ - lltala/edgar_all_4-simple-no-valid-roberta-base
8
  model-index:
9
  - name: ner__edgar_all_4-simple-no-valid-roberta-base__roberta-base
10
  results: []
 
15
 
16
  # ner__edgar_all_4-simple-no-valid-roberta-base__roberta-base
17
 
18
+ This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on the lltala/edgar_all_4-simple-no-valid-roberta-base dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - Loss: 0.0045
21
+ - Loc Precision: 0.8614
22
+ - Loc Recall: 0.9355
23
+ - Loc F1: 0.8969
24
+ - Loc Number: 93
25
+ - Org Precision: 0.9807
26
+ - Org Recall: 0.9880
27
+ - Org F1: 0.9844
28
+ - Org Number: 669
29
+ - Per Precision: 0.9432
30
+ - Per Recall: 0.9881
31
+ - Per F1: 0.9651
32
+ - Per Number: 84
33
+ - Overall Precision: 0.9629
34
+ - Overall Recall: 0.9823
35
+ - Overall F1: 0.9725
36
+ - Overall Accuracy: 0.9987
37
 
38
  ## Model description
39
 
all_results.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_LOC_f1": 0.8969072164948454,
4
+ "eval_LOC_number": 93,
5
+ "eval_LOC_precision": 0.8613861386138614,
6
+ "eval_LOC_recall": 0.9354838709677419,
7
+ "eval_ORG_f1": 0.9843633655994043,
8
+ "eval_ORG_number": 669,
9
+ "eval_ORG_precision": 0.9807121661721068,
10
+ "eval_ORG_recall": 0.9880418535127056,
11
+ "eval_PER_f1": 0.9651162790697674,
12
+ "eval_PER_number": 84,
13
+ "eval_PER_precision": 0.9431818181818182,
14
+ "eval_PER_recall": 0.9880952380952381,
15
+ "eval_loss": 0.0044641378335654736,
16
+ "eval_overall_accuracy": 0.9986757283494079,
17
+ "eval_overall_f1": 0.9724985371562317,
18
+ "eval_overall_precision": 0.9629200463499421,
19
+ "eval_overall_recall": 0.9822695035460993,
20
+ "eval_runtime": 4.1653,
21
+ "eval_samples": 90,
22
+ "eval_samples_per_second": 21.607,
23
+ "eval_steps_per_second": 1.44,
24
+ "total_flos": 729031133306880.0,
25
+ "train_loss": 0.039226553534383826,
26
+ "train_runtime": 272.0205,
27
+ "train_samples": 930,
28
+ "train_samples_per_second": 10.257,
29
+ "train_steps_per_second": 0.651
30
+ }
eval_results.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_LOC_f1": 0.8969072164948454,
4
+ "eval_LOC_number": 93,
5
+ "eval_LOC_precision": 0.8613861386138614,
6
+ "eval_LOC_recall": 0.9354838709677419,
7
+ "eval_ORG_f1": 0.9843633655994043,
8
+ "eval_ORG_number": 669,
9
+ "eval_ORG_precision": 0.9807121661721068,
10
+ "eval_ORG_recall": 0.9880418535127056,
11
+ "eval_PER_f1": 0.9651162790697674,
12
+ "eval_PER_number": 84,
13
+ "eval_PER_precision": 0.9431818181818182,
14
+ "eval_PER_recall": 0.9880952380952381,
15
+ "eval_loss": 0.0044641378335654736,
16
+ "eval_overall_accuracy": 0.9986757283494079,
17
+ "eval_overall_f1": 0.9724985371562317,
18
+ "eval_overall_precision": 0.9629200463499421,
19
+ "eval_overall_recall": 0.9822695035460993,
20
+ "eval_runtime": 4.1653,
21
+ "eval_samples": 90,
22
+ "eval_samples_per_second": 21.607,
23
+ "eval_steps_per_second": 1.44
24
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "total_flos": 729031133306880.0,
4
+ "train_loss": 0.039226553534383826,
5
+ "train_runtime": 272.0205,
6
+ "train_samples": 930,
7
+ "train_samples_per_second": 10.257,
8
+ "train_steps_per_second": 0.651
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
+ "eval_steps": 500,
6
+ "global_step": 177,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 3.0,
13
+ "step": 177,
14
+ "total_flos": 729031133306880.0,
15
+ "train_loss": 0.039226553534383826,
16
+ "train_runtime": 272.0205,
17
+ "train_samples_per_second": 10.257,
18
+ "train_steps_per_second": 0.651
19
+ }
20
+ ],
21
+ "logging_steps": 500,
22
+ "max_steps": 177,
23
+ "num_train_epochs": 3,
24
+ "save_steps": 500,
25
+ "total_flos": 729031133306880.0,
26
+ "trial_name": null,
27
+ "trial_params": null
28
+ }