napsternxg committed on
Commit
dfd648e
1 Parent(s): e70cca1

End of training

Browse files
README.md CHANGED
@@ -17,16 +17,16 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [sentence-transformers/paraphrase-MiniLM-L3-v2](https://huggingface.co/sentence-transformers/paraphrase-MiniLM-L3-v2) on the nyt_ingredients dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 10.2590
21
- - Comment: {'precision': 0.03657262277951933, 'recall': 0.0264750378214826, 'f1': 0.030715225976305396, 'number': 1322}
22
- - Name: {'precision': 0.5238095238095238, 'recall': 0.01245753114382786, 'f1': 0.024336283185840708, 'number': 1766}
23
- - Qty: {'precision': 0.0234375, 'recall': 0.0020920502092050207, 'f1': 0.003841229193341869, 'number': 1434}
24
- - Range End: {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 17}
25
- - Unit: {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1166}
26
- - Overall Precision: 0.0419
27
- - Overall Recall: 0.0105
28
- - Overall F1: 0.0168
29
- - Overall Accuracy: 0.1284
30
 
31
  ## Model description
32
 
@@ -55,10 +55,10 @@ The following hyperparameters were used during training:
55
 
56
  ### Training results
57
 
58
- | Training Loss | Epoch | Step | Validation Loss | Comment | Name | Qty | Range End | Unit | Overall Precision | Overall Recall | Overall F1 | Overall Accuracy |
59
- |:-------------:|:-----:|:----:|:---------------:|:------------------------------------------------------------------------------------------------------------:|:-------------------------------------------------------------------------------------------------------------:|:-----------------------------------------------------------------------------------------------------:|:----------------------------------------------------------:|:------------------------------------------------------------:|:-----------------:|:--------------:|:----------:|:----------------:|
60
- | No log | 1.0 | 54 | 11.5992 | {'precision': 0.03826530612244898, 'recall': 0.0340393343419062, 'f1': 0.036028823058446756, 'number': 1322} | {'precision': 0.9047619047619048, 'recall': 0.010758776896942242, 'f1': 0.021264689423614997, 'number': 1766} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1434} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 17} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1166} | 0.0526 | 0.0112 | 0.0185 | 0.1319 |
61
- | No log | 2.0 | 108 | 10.2590 | {'precision': 0.03657262277951933, 'recall': 0.0264750378214826, 'f1': 0.030715225976305396, 'number': 1322} | {'precision': 0.5238095238095238, 'recall': 0.01245753114382786, 'f1': 0.024336283185840708, 'number': 1766} | {'precision': 0.0234375, 'recall': 0.0020920502092050207, 'f1': 0.003841229193341869, 'number': 1434} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 17} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1166} | 0.0419 | 0.0105 | 0.0168 | 0.1284 |
62
 
63
 
64
  ### Framework versions
 
17
 
18
  This model is a fine-tuned version of [sentence-transformers/paraphrase-MiniLM-L3-v2](https://huggingface.co/sentence-transformers/paraphrase-MiniLM-L3-v2) on the nyt_ingredients dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 11.3870
21
+ - Comment: {'precision': 0.018842530282637954, 'recall': 0.010174418604651164, 'f1': 0.01321378008494573, 'number': 1376}
22
+ - Name: {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1758}
23
+ - Qty: {'precision': 0.1499119991717569, 'recall': 0.9986206896551724, 'f1': 0.26068953101089204, 'number': 1450}
24
+ - Range End: {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 14}
25
+ - Unit: {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1163}
26
+ - Overall Precision: 0.1405
27
+ - Overall Recall: 0.2538
28
+ - Overall F1: 0.1809
29
+ - Overall Accuracy: 0.1528
30
 
31
  ## Model description
32
 
 
55
 
56
  ### Training results
57
 
58
+ | Training Loss | Epoch | Step | Validation Loss | Comment | Name | Qty | Range End | Unit | Overall Precision | Overall Recall | Overall F1 | Overall Accuracy |
59
+ |:-------------:|:-----:|:----:|:---------------:|:----------------------------------------------------------------------------------------------------------------:|:------------------------------------------------------------:|:----------------------------------------------------------------------------------------------------------:|:----------------------------------------------------------:|:------------------------------------------------------------:|:-----------------:|:--------------:|:----------:|:----------------:|
60
+ | No log | 1.0 | 54 | 13.0360 | {'precision': 0.003246753246753247, 'recall': 0.0007267441860465116, 'f1': 0.001187648456057007, 'number': 1376} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1758} | {'precision': 0.142309205350118, 'recall': 0.9979310344827587, 'f1': 0.24909622998794975, 'number': 1450} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 14} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1163} | 0.1382 | 0.2513 | 0.1784 | 0.1432 |
61
+ | No log | 2.0 | 108 | 11.3870 | {'precision': 0.018842530282637954, 'recall': 0.010174418604651164, 'f1': 0.01321378008494573, 'number': 1376} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1758} | {'precision': 0.1499119991717569, 'recall': 0.9986206896551724, 'f1': 0.26068953101089204, 'number': 1450} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 14} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 1163} | 0.1405 | 0.2538 | 0.1809 | 0.1528 |
62
 
63
 
64
  ### Framework versions
all_results.json CHANGED
@@ -1,41 +1,41 @@
1
  {
2
  "epoch": 2.0,
3
  "eval_COMMENT": {
4
- "f1": 0.030715225976305396,
5
- "number": 1322,
6
- "precision": 0.03657262277951933,
7
- "recall": 0.0264750378214826
8
  },
9
  "eval_NAME": {
10
- "f1": 0.024336283185840708,
11
- "number": 1766,
12
- "precision": 0.5238095238095238,
13
- "recall": 0.01245753114382786
14
  },
15
  "eval_QTY": {
16
- "f1": 0.003841229193341869,
17
- "number": 1434,
18
- "precision": 0.0234375,
19
- "recall": 0.0020920502092050207
20
  },
21
  "eval_RANGE_END": {
22
  "f1": 0.0,
23
- "number": 17,
24
  "precision": 0.0,
25
  "recall": 0.0
26
  },
27
  "eval_UNIT": {
28
  "f1": 0.0,
29
- "number": 1166,
30
  "precision": 0.0,
31
  "recall": 0.0
32
  },
33
- "eval_loss": 10.259025573730469,
34
- "eval_overall_accuracy": 0.12838815472171314,
35
- "eval_overall_f1": 0.016813787305590584,
36
- "eval_overall_precision": 0.04189944134078212,
37
- "eval_overall_recall": 0.010517090271691499,
38
- "eval_runtime": 15.7061,
39
- "eval_samples_per_second": 108.365,
40
- "eval_steps_per_second": 3.438
41
  }
 
1
  {
2
  "epoch": 2.0,
3
  "eval_COMMENT": {
4
+ "f1": 0.01321378008494573,
5
+ "number": 1376,
6
+ "precision": 0.018842530282637954,
7
+ "recall": 0.010174418604651164
8
  },
9
  "eval_NAME": {
10
+ "f1": 0.0,
11
+ "number": 1758,
12
+ "precision": 0.0,
13
+ "recall": 0.0
14
  },
15
  "eval_QTY": {
16
+ "f1": 0.26068953101089204,
17
+ "number": 1450,
18
+ "precision": 0.1499119991717569,
19
+ "recall": 0.9986206896551724
20
  },
21
  "eval_RANGE_END": {
22
  "f1": 0.0,
23
+ "number": 14,
24
  "precision": 0.0,
25
  "recall": 0.0
26
  },
27
  "eval_UNIT": {
28
  "f1": 0.0,
29
+ "number": 1163,
30
  "precision": 0.0,
31
  "recall": 0.0
32
  },
33
+ "eval_loss": 11.38698959350586,
34
+ "eval_overall_accuracy": 0.15278303672851193,
35
+ "eval_overall_f1": 0.1809070098372827,
36
+ "eval_overall_precision": 0.14054989425110556,
37
+ "eval_overall_recall": 0.25377538621767054,
38
+ "eval_runtime": 15.4103,
39
+ "eval_samples_per_second": 110.445,
40
+ "eval_steps_per_second": 3.504
41
  }
config.json CHANGED
@@ -4,9 +4,6 @@
4
  "PretrainedCRFModel"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "auto_map": {
8
- "AutoModel": "crf_model.PretrainedCRFModel"
9
- },
10
  "classifier_dropout": null,
11
  "gradient_checkpointing": false,
12
  "hidden_act": "gelu",
 
4
  "PretrainedCRFModel"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
 
 
7
  "classifier_dropout": null,
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:957a43de6de74f7ecd4ba71f7c05807847718572ae4a3af8cd70c7f799baf978
3
  size 69004255
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bc0aa155e841d43ed8fb5a8293f148b0505c438f359a802417121f401313821
3
  size 69004255
trainer_state.json CHANGED
@@ -11,102 +11,102 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_COMMENT": {
14
- "f1": 0.036028823058446756,
15
- "number": 1322,
16
- "precision": 0.03826530612244898,
17
- "recall": 0.0340393343419062
18
  },
19
  "eval_NAME": {
20
- "f1": 0.021264689423614997,
21
- "number": 1766,
22
- "precision": 0.9047619047619048,
23
- "recall": 0.010758776896942242
24
- },
25
- "eval_QTY": {
26
  "f1": 0.0,
27
- "number": 1434,
28
  "precision": 0.0,
29
  "recall": 0.0
30
  },
 
 
 
 
 
 
31
  "eval_RANGE_END": {
32
  "f1": 0.0,
33
- "number": 17,
34
  "precision": 0.0,
35
  "recall": 0.0
36
  },
37
  "eval_UNIT": {
38
  "f1": 0.0,
39
- "number": 1166,
40
  "precision": 0.0,
41
  "recall": 0.0
42
  },
43
- "eval_loss": 11.59915828704834,
44
- "eval_overall_accuracy": 0.13186071187421627,
45
- "eval_overall_f1": 0.018494437220054907,
46
- "eval_overall_precision": 0.05263157894736842,
47
- "eval_overall_recall": 0.011218229623137599,
48
- "eval_runtime": 14.249,
49
- "eval_samples_per_second": 119.447,
50
- "eval_steps_per_second": 3.79,
51
  "step": 54
52
  },
53
  {
54
  "epoch": 2.0,
55
  "eval_COMMENT": {
56
- "f1": 0.030715225976305396,
57
- "number": 1322,
58
- "precision": 0.03657262277951933,
59
- "recall": 0.0264750378214826
60
  },
61
  "eval_NAME": {
62
- "f1": 0.024336283185840708,
63
- "number": 1766,
64
- "precision": 0.5238095238095238,
65
- "recall": 0.01245753114382786
66
  },
67
  "eval_QTY": {
68
- "f1": 0.003841229193341869,
69
- "number": 1434,
70
- "precision": 0.0234375,
71
- "recall": 0.0020920502092050207
72
  },
73
  "eval_RANGE_END": {
74
  "f1": 0.0,
75
- "number": 17,
76
  "precision": 0.0,
77
  "recall": 0.0
78
  },
79
  "eval_UNIT": {
80
  "f1": 0.0,
81
- "number": 1166,
82
  "precision": 0.0,
83
  "recall": 0.0
84
  },
85
- "eval_loss": 10.259025573730469,
86
- "eval_overall_accuracy": 0.12838815472171314,
87
- "eval_overall_f1": 0.016813787305590584,
88
- "eval_overall_precision": 0.04189944134078212,
89
- "eval_overall_recall": 0.010517090271691499,
90
- "eval_runtime": 15.3099,
91
- "eval_samples_per_second": 111.17,
92
- "eval_steps_per_second": 3.527,
93
  "step": 108
94
  },
95
  {
96
  "epoch": 2.0,
97
  "step": 108,
98
- "total_flos": 3334407253032.0,
99
- "train_loss": 12.8824462890625,
100
- "train_runtime": 151.3626,
101
- "train_samples_per_second": 22.489,
102
- "train_steps_per_second": 0.714
103
  }
104
  ],
105
  "logging_steps": 500,
106
  "max_steps": 108,
107
  "num_train_epochs": 2,
108
  "save_steps": 500,
109
- "total_flos": 3334407253032.0,
110
  "trial_name": null,
111
  "trial_params": null
112
  }
 
11
  {
12
  "epoch": 1.0,
13
  "eval_COMMENT": {
14
+ "f1": 0.001187648456057007,
15
+ "number": 1376,
16
+ "precision": 0.003246753246753247,
17
+ "recall": 0.0007267441860465116
18
  },
19
  "eval_NAME": {
 
 
 
 
 
 
20
  "f1": 0.0,
21
+ "number": 1758,
22
  "precision": 0.0,
23
  "recall": 0.0
24
  },
25
+ "eval_QTY": {
26
+ "f1": 0.24909622998794975,
27
+ "number": 1450,
28
+ "precision": 0.142309205350118,
29
+ "recall": 0.9979310344827587
30
+ },
31
  "eval_RANGE_END": {
32
  "f1": 0.0,
33
+ "number": 14,
34
  "precision": 0.0,
35
  "recall": 0.0
36
  },
37
  "eval_UNIT": {
38
  "f1": 0.0,
39
+ "number": 1163,
40
  "precision": 0.0,
41
  "recall": 0.0
42
  },
43
+ "eval_loss": 13.036046981811523,
44
+ "eval_overall_accuracy": 0.1432222642938281,
45
+ "eval_overall_f1": 0.17835807107224239,
46
+ "eval_overall_precision": 0.13822069492172584,
47
+ "eval_overall_recall": 0.25134525256031937,
48
+ "eval_runtime": 14.6529,
49
+ "eval_samples_per_second": 116.155,
50
+ "eval_steps_per_second": 3.685,
51
  "step": 54
52
  },
53
  {
54
  "epoch": 2.0,
55
  "eval_COMMENT": {
56
+ "f1": 0.01321378008494573,
57
+ "number": 1376,
58
+ "precision": 0.018842530282637954,
59
+ "recall": 0.010174418604651164
60
  },
61
  "eval_NAME": {
62
+ "f1": 0.0,
63
+ "number": 1758,
64
+ "precision": 0.0,
65
+ "recall": 0.0
66
  },
67
  "eval_QTY": {
68
+ "f1": 0.26068953101089204,
69
+ "number": 1450,
70
+ "precision": 0.1499119991717569,
71
+ "recall": 0.9986206896551724
72
  },
73
  "eval_RANGE_END": {
74
  "f1": 0.0,
75
+ "number": 14,
76
  "precision": 0.0,
77
  "recall": 0.0
78
  },
79
  "eval_UNIT": {
80
  "f1": 0.0,
81
+ "number": 1163,
82
  "precision": 0.0,
83
  "recall": 0.0
84
  },
85
+ "eval_loss": 11.38698959350586,
86
+ "eval_overall_accuracy": 0.15278303672851193,
87
+ "eval_overall_f1": 0.1809070098372827,
88
+ "eval_overall_precision": 0.14054989425110556,
89
+ "eval_overall_recall": 0.25377538621767054,
90
+ "eval_runtime": 17.2137,
91
+ "eval_samples_per_second": 98.875,
92
+ "eval_steps_per_second": 3.137,
93
  "step": 108
94
  },
95
  {
96
  "epoch": 2.0,
97
  "step": 108,
98
+ "total_flos": 3333512058648.0,
99
+ "train_loss": 14.639327437789351,
100
+ "train_runtime": 158.5609,
101
+ "train_samples_per_second": 21.468,
102
+ "train_steps_per_second": 0.681
103
  }
104
  ],
105
  "logging_steps": 500,
106
  "max_steps": 108,
107
  "num_train_epochs": 2,
108
  "save_steps": 500,
109
+ "total_flos": 3333512058648.0,
110
  "trial_name": null,
111
  "trial_params": null
112
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c5254dbe381bcf40ffb21d73c66be21031100bd1243da923a4f4347812cc60c
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96c214e97b6f20cd8938a61602e67132038a6f6d693fd46193ea1ba0693eda35
3
  size 4155
validation_results.json CHANGED
@@ -1,41 +1,41 @@
1
  {
2
  "epoch": 2.0,
3
  "eval_COMMENT": {
4
- "f1": 0.030715225976305396,
5
- "number": 1322,
6
- "precision": 0.03657262277951933,
7
- "recall": 0.0264750378214826
8
  },
9
  "eval_NAME": {
10
- "f1": 0.024336283185840708,
11
- "number": 1766,
12
- "precision": 0.5238095238095238,
13
- "recall": 0.01245753114382786
14
  },
15
  "eval_QTY": {
16
- "f1": 0.003841229193341869,
17
- "number": 1434,
18
- "precision": 0.0234375,
19
- "recall": 0.0020920502092050207
20
  },
21
  "eval_RANGE_END": {
22
  "f1": 0.0,
23
- "number": 17,
24
  "precision": 0.0,
25
  "recall": 0.0
26
  },
27
  "eval_UNIT": {
28
  "f1": 0.0,
29
- "number": 1166,
30
  "precision": 0.0,
31
  "recall": 0.0
32
  },
33
- "eval_loss": 10.259025573730469,
34
- "eval_overall_accuracy": 0.12838815472171314,
35
- "eval_overall_f1": 0.016813787305590584,
36
- "eval_overall_precision": 0.04189944134078212,
37
- "eval_overall_recall": 0.010517090271691499,
38
- "eval_runtime": 15.7061,
39
- "eval_samples_per_second": 108.365,
40
- "eval_steps_per_second": 3.438
41
  }
 
1
  {
2
  "epoch": 2.0,
3
  "eval_COMMENT": {
4
+ "f1": 0.01321378008494573,
5
+ "number": 1376,
6
+ "precision": 0.018842530282637954,
7
+ "recall": 0.010174418604651164
8
  },
9
  "eval_NAME": {
10
+ "f1": 0.0,
11
+ "number": 1758,
12
+ "precision": 0.0,
13
+ "recall": 0.0
14
  },
15
  "eval_QTY": {
16
+ "f1": 0.26068953101089204,
17
+ "number": 1450,
18
+ "precision": 0.1499119991717569,
19
+ "recall": 0.9986206896551724
20
  },
21
  "eval_RANGE_END": {
22
  "f1": 0.0,
23
+ "number": 14,
24
  "precision": 0.0,
25
  "recall": 0.0
26
  },
27
  "eval_UNIT": {
28
  "f1": 0.0,
29
+ "number": 1163,
30
  "precision": 0.0,
31
  "recall": 0.0
32
  },
33
+ "eval_loss": 11.38698959350586,
34
+ "eval_overall_accuracy": 0.15278303672851193,
35
+ "eval_overall_f1": 0.1809070098372827,
36
+ "eval_overall_precision": 0.14054989425110556,
37
+ "eval_overall_recall": 0.25377538621767054,
38
+ "eval_runtime": 15.4103,
39
+ "eval_samples_per_second": 110.445,
40
+ "eval_steps_per_second": 3.504
41
  }