napsternxg committed on
Commit
05ed773
1 Parent(s): ca2e188

End of training

Browse files
README.md ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: napsternxg/gte-small-L3-ingredient-v2
3
+ tags:
4
+ - generated_from_trainer
5
+ datasets:
6
+ - nyt_ingredients
7
+ model-index:
8
+ - name: nyt_ingredients-tagger-gte-small-L3-ingredient-v2
9
+ results: []
10
+ ---
11
+
12
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
+ should probably proofread and complete it, then remove this comment. -->
14
+
15
+ # nyt_ingredients-tagger-gte-small-L3-ingredient-v2
16
+
17
+ This model is a fine-tuned version of [napsternxg/gte-small-L3-ingredient-v2](https://huggingface.co/napsternxg/gte-small-L3-ingredient-v2) on the nyt_ingredients dataset.
18
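+ It achieves the following results on the evaluation set (the per-entity `number` counts reported here differ from those in the training results table below, so these figures appear to come from a different split than the per-step validation runs):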
19
+ - Loss: 0.4705
20
+ - Comment: {'precision': 0.6653720111664037, 'recall': 0.7644679960953842, 'f1': 0.7114860480207656, 'number': 7171}
21
+ - Name: {'precision': 0.7963734889537307, 'recall': 0.8212788823213326, 'f1': 0.8086344637849849, 'number': 9305}
22
+ - Qty: {'precision': 0.981755684822845, 'recall': 0.9907938625750501, 'f1': 0.9862540673351484, 'number': 7495}
23
+ - Range End: {'precision': 0.6240601503759399, 'recall': 0.9222222222222223, 'f1': 0.7443946188340806, 'number': 90}
24
+ - Unit: {'precision': 0.923100969052829, 'recall': 0.9861412589747871, 'f1': 0.95358036651328, 'number': 5989}
25
+ - Overall Precision: 0.8312
26
+ - Overall Recall: 0.8832
27
+ - Overall F1: 0.8564
28
+ - Overall Accuracy: 0.8350
29
+
30
+ ## Model description
31
+
32
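+ A token-classification tagger fine-tuned from `napsternxg/gte-small-L3-ingredient-v2` on the nyt_ingredients dataset. It assigns BIO tags (`O`, `B-*`, `I-*`) for five entity types: `COMMENT`, `NAME`, `QTY`, `RANGE_END`, and `UNIT`. More information needed.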
33
+
34
+ ## Intended uses & limitations
35
+
36
+ More information needed
37
+
38
+ ## Training and evaluation data
39
+
40
+ More information needed
41
+
42
+ ## Training procedure
43
+
44
+ ### Training hyperparameters
45
+
46
+ The following hyperparameters were used during training:
47
+ - learning_rate: 5e-05
48
+ - train_batch_size: 32
49
+ - eval_batch_size: 32
50
+ - seed: 42
51
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
52
+ - lr_scheduler_type: linear
53
+ - num_epochs: 10
54
+
55
+ ### Training results
56
+
57
+ | Training Loss | Epoch | Step | Validation Loss | Comment | Name | Qty | Range End | Unit | Overall Precision | Overall Recall | Overall F1 | Overall Accuracy |
58
+ |:-------------:|:-----:|:-----:|:---------------:|:---------------------------------------------------------------------------------------------------------:|:---------------------------------------------------------------------------------------------------------:|:---------------------------------------------------------------------------------------------------------:|:-------------------------------------------------------------------------------------------------------:|:---------------------------------------------------------------------------------------------------------:|:-----------------:|:--------------:|:----------:|:----------------:|
59
+ | 0.6931 | 0.2 | 1000 | 0.6230 | {'precision': 0.5236127508854782, 'recall': 0.6426604839878278, 'f1': 0.5770606987183658, 'number': 6901} | {'precision': 0.7773012207192346, 'recall': 0.7980128711753416, 'f1': 0.7875208913649026, 'number': 8857} | {'precision': 0.9824561403508771, 'recall': 0.9737098344693281, 'f1': 0.9780634343998882, 'number': 7189} | {'precision': 0.0, 'recall': 0.0, 'f1': 0.0, 'number': 92} | {'precision': 0.9192320423700762, 'recall': 0.9689462665736218, 'f1': 0.9434346865975879, 'number': 5732} | 0.7829 | 0.8362 | 0.8086 | 0.7986 |
60
+ | 0.5826 | 0.4 | 2000 | 0.5531 | {'precision': 0.5435365427205968, 'recall': 0.6756991740327489, 'f1': 0.602454780361757, 'number': 6901} | {'precision': 0.7757141305528402, 'recall': 0.8063678446426555, 'f1': 0.7907440212577502, 'number': 8857} | {'precision': 0.9659028914348063, 'recall': 0.9851161496731117, 'f1': 0.9754149163280765, 'number': 7189} | {'precision': 0.6055045871559633, 'recall': 0.717391304347826, 'f1': 0.6567164179104478, 'number': 92} | {'precision': 0.9177049180327869, 'recall': 0.9766224703419399, 'f1': 0.9462474645030426, 'number': 5732} | 0.7837 | 0.8533 | 0.8170 | 0.8079 |
61
+ | 0.5435 | 0.59 | 3000 | 0.5327 | {'precision': 0.5801165331391115, 'recall': 0.6925083321257789, 'f1': 0.6313494946826079, 'number': 6901} | {'precision': 0.7839085513299626, 'recall': 0.8052387941740996, 'f1': 0.7944305207463102, 'number': 8857} | {'precision': 0.9771436487048067, 'recall': 0.9812213103352344, 'f1': 0.9791782343142699, 'number': 7189} | {'precision': 0.6302521008403361, 'recall': 0.8152173913043478, 'f1': 0.7109004739336493, 'number': 92} | {'precision': 0.9126637554585153, 'recall': 0.9844731332868109, 'f1': 0.9472093999160722, 'number': 5732} | 0.7999 | 0.8579 | 0.8279 | 0.8150 |
62
+ | 0.5333 | 0.79 | 4000 | 0.5212 | {'precision': 0.5875760104924288, 'recall': 0.7140994058832053, 'f1': 0.6446886446886447, 'number': 6901} | {'precision': 0.786660777385159, 'recall': 0.8043355537992548, 'f1': 0.7953999888349244, 'number': 8857} | {'precision': 0.9837716843872412, 'recall': 0.9781610794269022, 'f1': 0.9809583594894328, 'number': 7189} | {'precision': 0.6390977443609023, 'recall': 0.9239130434782609, 'f1': 0.7555555555555556, 'number': 92} | {'precision': 0.9263366992219831, 'recall': 0.9762735519888346, 'f1': 0.9506497918967128, 'number': 5732} | 0.8050 | 0.8608 | 0.8319 | 0.8183 |
63
+ | 0.5199 | 0.99 | 5000 | 0.5121 | {'precision': 0.5873457536898137, 'recall': 0.7035212288074192, 'f1': 0.6402057097646205, 'number': 6901} | {'precision': 0.7890984865101996, 'recall': 0.812351812126002, 'f1': 0.8005563282336579, 'number': 8857} | {'precision': 0.978519955654102, 'recall': 0.9821950201697037, 'f1': 0.9803540437348144, 'number': 7189} | {'precision': 0.6615384615384615, 'recall': 0.9347826086956522, 'f1': 0.7747747747747747, 'number': 92} | {'precision': 0.9197843489625878, 'recall': 0.9822051639916259, 'f1': 0.9499704716105627, 'number': 5732} | 0.8047 | 0.8629 | 0.8328 | 0.8186 |
64
+ | 0.4983 | 1.19 | 6000 | 0.5088 | {'precision': 0.6041901894367081, 'recall': 0.6978698739313143, 'f1': 0.6476600322754169, 'number': 6901} | {'precision': 0.7801047120418848, 'recall': 0.8074968951112115, 'f1': 0.7935644937586686, 'number': 8857} | {'precision': 0.980998613037448, 'recall': 0.983864237028794, 'f1': 0.9824293353705119, 'number': 7189} | {'precision': 0.6511627906976745, 'recall': 0.9130434782608695, 'f1': 0.7601809954751132, 'number': 92} | {'precision': 0.9193864229765013, 'recall': 0.9829030006978368, 'f1': 0.9500843170320405, 'number': 5732} | 0.8090 | 0.8606 | 0.8340 | 0.8192 |
65
+ | 0.5031 | 1.39 | 7000 | 0.5031 | {'precision': 0.6055345911949686, 'recall': 0.6975800608607449, 'f1': 0.6483065113460373, 'number': 6901} | {'precision': 0.7835422343324251, 'recall': 0.8116743818448685, 'f1': 0.797360248447205, 'number': 8857} | {'precision': 0.9752815160670145, 'recall': 0.9878981777715955, 'f1': 0.9815493055075669, 'number': 7189} | {'precision': 0.6666666666666666, 'recall': 0.9130434782608695, 'f1': 0.7706422018348623, 'number': 92} | {'precision': 0.9269467043001827, 'recall': 0.9740055826936497, 'f1': 0.9498936622713738, 'number': 5732} | 0.8107 | 0.8610 | 0.8351 | 0.8199 |
66
+ | 0.492 | 1.58 | 8000 | 0.5041 | {'precision': 0.6209482341557814, 'recall': 0.743950152151862, 'f1': 0.6769068494956819, 'number': 6901} | {'precision': 0.7778260869565218, 'recall': 0.8079485152986339, 'f1': 0.7926012072880323, 'number': 8857} | {'precision': 0.983001254005852, 'recall': 0.9813604117401585, 'f1': 0.9821801475706529, 'number': 7189} | {'precision': 0.6423357664233577, 'recall': 0.9565217391304348, 'f1': 0.7685589519650656, 'number': 92} | {'precision': 0.9215493188905302, 'recall': 0.9795882763433357, 'f1': 0.9496828752642706, 'number': 5732} | 0.8113 | 0.8706 | 0.8399 | 0.8246 |
67
+ | 0.4817 | 1.78 | 9000 | 0.4901 | {'precision': 0.6196705426356589, 'recall': 0.7413418345167367, 'f1': 0.6750676255195619, 'number': 6901} | {'precision': 0.7891447368421053, 'recall': 0.8125776222197132, 'f1': 0.8006897702620014, 'number': 8857} | {'precision': 0.9798370390829996, 'recall': 0.9869244679371262, 'f1': 0.9833679833679833, 'number': 7189} | {'precision': 0.6474820143884892, 'recall': 0.9782608695652174, 'f1': 0.7792207792207793, 'number': 92} | {'precision': 0.9168422758956071, 'recall': 0.9867411025819958, 'f1': 0.9505083606419629, 'number': 5732} | 0.8134 | 0.8743 | 0.8427 | 0.8293 |
68
+ | 0.4905 | 1.98 | 10000 | 0.4892 | {'precision': 0.6241463414634146, 'recall': 0.7416316475873062, 'f1': 0.6778359049069598, 'number': 6901} | {'precision': 0.7911287653095002, 'recall': 0.8095291859546122, 'f1': 0.8002232142857143, 'number': 8857} | {'precision': 0.9846860643185299, 'recall': 0.983864237028794, 'f1': 0.9842749791260784, 'number': 7189} | {'precision': 0.6717557251908397, 'recall': 0.9565217391304348, 'f1': 0.789237668161435, 'number': 92} | {'precision': 0.9170723790976956, 'recall': 0.9858688066992324, 'f1': 0.9502270052127123, 'number': 5732} | 0.8166 | 0.8724 | 0.8436 | 0.8288 |
69
+ | 0.4757 | 2.18 | 11000 | 0.4954 | {'precision': 0.6271186440677966, 'recall': 0.7398927691638892, 'f1': 0.6788539520042544, 'number': 6901} | {'precision': 0.7921020789792103, 'recall': 0.8130292424071356, 'f1': 0.802429240026744, 'number': 8857} | {'precision': 0.9801077496891836, 'recall': 0.9869244679371262, 'f1': 0.9835042971998891, 'number': 7189} | {'precision': 0.6428571428571429, 'recall': 0.9782608695652174, 'f1': 0.7758620689655172, 'number': 92} | {'precision': 0.9226609864001311, 'recall': 0.9823796231681786, 'f1': 0.9515842839036756, 'number': 5732} | 0.8179 | 0.8732 | 0.8447 | 0.8274 |
70
+ | 0.4691 | 2.38 | 12000 | 0.4903 | {'precision': 0.6292872780345414, 'recall': 0.7497464135632517, 'f1': 0.6842557693579316, 'number': 6901} | {'precision': 0.7935547734271887, 'recall': 0.8146099130631139, 'f1': 0.803944509443423, 'number': 8857} | {'precision': 0.9806816613771215, 'recall': 0.9885936847962165, 'f1': 0.984621778886118, 'number': 7189} | {'precision': 0.6544117647058824, 'recall': 0.967391304347826, 'f1': 0.780701754385965, 'number': 92} | {'precision': 0.9238204456094364, 'recall': 0.9837752965806001, 'f1': 0.9528556944913822, 'number': 5732} | 0.8189 | 0.8767 | 0.8468 | 0.8301 |
71
+ | 0.4765 | 2.57 | 13000 | 0.4846 | {'precision': 0.6338439095550693, 'recall': 0.7555426749746413, 'f1': 0.6893633899649634, 'number': 6901} | {'precision': 0.7977640026566305, 'recall': 0.8137066726882691, 'f1': 0.805656475322788, 'number': 8857} | {'precision': 0.9850891861761427, 'recall': 0.9833078314090973, 'f1': 0.9841977027497391, 'number': 7189} | {'precision': 0.6774193548387096, 'recall': 0.9130434782608695, 'f1': 0.7777777777777777, 'number': 92} | {'precision': 0.9219950940310712, 'recall': 0.9836008374040475, 'f1': 0.9518021440027011, 'number': 5732} | 0.8219 | 0.8763 | 0.8482 | 0.8307 |
72
+ | 0.4747 | 2.77 | 14000 | 0.4844 | {'precision': 0.6380844929171368, 'recall': 0.7375742645993334, 'f1': 0.6842317515795134, 'number': 6901} | {'precision': 0.791246160596753, 'recall': 0.8143841029694028, 'f1': 0.8026484170700496, 'number': 8857} | {'precision': 0.9796255506607929, 'recall': 0.9898455974405341, 'f1': 0.9847090569431951, 'number': 7189} | {'precision': 0.6546762589928058, 'recall': 0.9891304347826086, 'f1': 0.7878787878787878, 'number': 92} | {'precision': 0.9195252804422045, 'recall': 0.9867411025819958, 'f1': 0.9519481612387444, 'number': 5732} | 0.8212 | 0.8747 | 0.8471 | 0.8314 |
73
+ | 0.4654 | 2.97 | 15000 | 0.4808 | {'precision': 0.6453574975173784, 'recall': 0.7533690769453703, 'f1': 0.6951928862739855, 'number': 6901} | {'precision': 0.7925608011444921, 'recall': 0.8131421474539912, 'f1': 0.8027195720017833, 'number': 8857} | {'precision': 0.9827013562136728, 'recall': 0.9877590763666713, 'f1': 0.9852237252861602, 'number': 7189} | {'precision': 0.6641221374045801, 'recall': 0.9456521739130435, 'f1': 0.7802690582959643, 'number': 92} | {'precision': 0.9255791030064071, 'recall': 0.9829030006978368, 'f1': 0.9533801506049582, 'number': 5732} | 0.8246 | 0.8767 | 0.8499 | 0.8332 |
74
+ | 0.4586 | 3.17 | 16000 | 0.4827 | {'precision': 0.6517362858580775, 'recall': 0.7506158527749601, 'f1': 0.6976900801400768, 'number': 6901} | {'precision': 0.7901383703052932, 'recall': 0.812351812126002, 'f1': 0.8010911317708622, 'number': 8857} | {'precision': 0.979906413432425, 'recall': 0.990402003060231, 'f1': 0.9851262538913871, 'number': 7189} | {'precision': 0.6641221374045801, 'recall': 0.9456521739130435, 'f1': 0.7802690582959643, 'number': 92} | {'precision': 0.9193364774760123, 'recall': 0.9862177250523377, 'f1': 0.9516034003871727, 'number': 5732} | 0.8247 | 0.8771 | 0.8501 | 0.8317 |
75
+ | 0.4612 | 3.37 | 17000 | 0.4869 | {'precision': 0.6441053408811224, 'recall': 0.7584408056803362, 'f1': 0.6966127636920211, 'number': 6901} | {'precision': 0.7845718637797846, 'recall': 0.8141582928756915, 'f1': 0.7990913120567377, 'number': 8857} | {'precision': 0.9844271412680756, 'recall': 0.9848379468632633, 'f1': 0.9846325012168833, 'number': 7189} | {'precision': 0.6641221374045801, 'recall': 0.9456521739130435, 'f1': 0.7802690582959643, 'number': 92} | {'precision': 0.9158439877002751, 'recall': 0.9872644801116539, 'f1': 0.9502140878179833, 'number': 5732} | 0.8200 | 0.8783 | 0.8482 | 0.8308 |
76
+ | 0.4546 | 3.56 | 18000 | 0.4806 | {'precision': 0.6482188295165394, 'recall': 0.7382987972757571, 'f1': 0.6903326332904275, 'number': 6901} | {'precision': 0.788654181184669, 'recall': 0.8177712543750706, 'f1': 0.8029488387561666, 'number': 8857} | {'precision': 0.9817704736914791, 'recall': 0.9888718876060648, 'f1': 0.9853083853083853, 'number': 7189} | {'precision': 0.6854838709677419, 'recall': 0.9239130434782609, 'f1': 0.787037037037037, 'number': 92} | {'precision': 0.9236179260713118, 'recall': 0.9851709699930217, 'f1': 0.9534019922336655, 'number': 5732} | 0.8249 | 0.8752 | 0.8493 | 0.8315 |
77
+ | 0.4471 | 3.76 | 19000 | 0.4823 | {'precision': 0.6466100652147164, 'recall': 0.7614838429213158, 'f1': 0.6993611924407772, 'number': 6901} | {'precision': 0.7929254092057564, 'recall': 0.8149486282036807, 'f1': 0.8037861915367484, 'number': 8857} | {'precision': 0.983906770255272, 'recall': 0.9865071637223536, 'f1': 0.9852052510939778, 'number': 7189} | {'precision': 0.676923076923077, 'recall': 0.9565217391304348, 'f1': 0.7927927927927929, 'number': 92} | {'precision': 0.9211943220753793, 'recall': 0.984996510816469, 'f1': 0.9520276536548351, 'number': 5732} | 0.8242 | 0.8793 | 0.8508 | 0.8328 |
78
+ | 0.4542 | 3.96 | 20000 | 0.4758 | {'precision': 0.6508980521123198, 'recall': 0.7456890305752789, 'f1': 0.6950766529344229, 'number': 6901} | {'precision': 0.7868081382629621, 'recall': 0.8121260020322908, 'f1': 0.7992666259236624, 'number': 8857} | {'precision': 0.9829734219269103, 'recall': 0.9877590763666713, 'f1': 0.9853604384930272, 'number': 7189} | {'precision': 0.6744186046511628, 'recall': 0.9456521739130435, 'f1': 0.7873303167420815, 'number': 92} | {'precision': 0.920559986977047, 'recall': 0.9865666434054431, 'f1': 0.9524210526315788, 'number': 5732} | 0.8244 | 0.8753 | 0.8491 | 0.8326 |
79
+ | 0.4452 | 4.16 | 21000 | 0.4833 | {'precision': 0.6566687938736439, 'recall': 0.7455441240399941, 'f1': 0.6982899022801302, 'number': 6901} | {'precision': 0.7843478260869565, 'recall': 0.8147228181099695, 'f1': 0.7992468294844105, 'number': 8857} | {'precision': 0.981750311074243, 'recall': 0.9877590763666713, 'f1': 0.9847455276660656, 'number': 7189} | {'precision': 0.6854838709677419, 'recall': 0.9239130434782609, 'f1': 0.787037037037037, 'number': 92} | {'precision': 0.9249303392886412, 'recall': 0.9844731332868109, 'f1': 0.9537733457280487, 'number': 5732} | 0.8261 | 0.8755 | 0.8501 | 0.8339 |
80
+ | 0.4412 | 4.36 | 22000 | 0.4888 | {'precision': 0.6534954407294833, 'recall': 0.7477177220692653, 'f1': 0.6974386700006758, 'number': 6901} | {'precision': 0.7870067582297798, 'recall': 0.8151744382973919, 'f1': 0.8008429926238145, 'number': 8857} | {'precision': 0.9839268394069558, 'recall': 0.9877590763666713, 'f1': 0.9858392336526447, 'number': 7189} | {'precision': 0.6717557251908397, 'recall': 0.9565217391304348, 'f1': 0.789237668161435, 'number': 92} | {'precision': 0.9248280379954144, 'recall': 0.9851709699930217, 'f1': 0.9540462916033113, 'number': 5732} | 0.8261 | 0.8764 | 0.8505 | 0.8325 |
81
+ | 0.4423 | 4.55 | 23000 | 0.4827 | {'precision': 0.6532828282828282, 'recall': 0.7497464135632517, 'f1': 0.6981985021253626, 'number': 6901} | {'precision': 0.7874007180937874, 'recall': 0.817093824093937, 'f1': 0.8019725177304966, 'number': 8857} | {'precision': 0.9835202880487467, 'recall': 0.9878981777715955, 'f1': 0.9857043719639139, 'number': 7189} | {'precision': 0.6766917293233082, 'recall': 0.9782608695652174, 'f1': 0.7999999999999999, 'number': 92} | {'precision': 0.9264850672792911, 'recall': 0.984996510816469, 'f1': 0.9548452562151193, 'number': 5732} | 0.8262 | 0.8776 | 0.8511 | 0.8338 |
82
+ | 0.4507 | 4.75 | 24000 | 0.4740 | {'precision': 0.6584520600693108, 'recall': 0.7433705260107231, 'f1': 0.69833923223523, 'number': 6901} | {'precision': 0.7933530766699572, 'recall': 0.8166422039065147, 'f1': 0.8048291977300545, 'number': 8857} | {'precision': 0.9801898472967395, 'recall': 0.9910975100848518, 'f1': 0.9856135011758197, 'number': 7189} | {'precision': 0.6692307692307692, 'recall': 0.9456521739130435, 'f1': 0.7837837837837838, 'number': 92} | {'precision': 0.922976501305483, 'recall': 0.9867411025819958, 'f1': 0.9537942664418213, 'number': 5732} | 0.8290 | 0.8770 | 0.8523 | 0.8347 |
83
+ | 0.4452 | 4.95 | 25000 | 0.4791 | {'precision': 0.6528792569659443, 'recall': 0.7639472540211564, 'f1': 0.7040598290598291, 'number': 6901} | {'precision': 0.7875054513737462, 'recall': 0.8155131534379587, 'f1': 0.8012646292084975, 'number': 8857} | {'precision': 0.9825798423890502, 'recall': 0.9885936847962165, 'f1': 0.9855775897933713, 'number': 7189} | {'precision': 0.6640625, 'recall': 0.9239130434782609, 'f1': 0.7727272727272728, 'number': 92} | {'precision': 0.9227881162259223, 'recall': 0.9862177250523377, 'f1': 0.953449148254343, 'number': 5732} | 0.8245 | 0.8807 | 0.8517 | 0.8352 |
84
+ | 0.4274 | 5.15 | 26000 | 0.4807 | {'precision': 0.6607946026986506, 'recall': 0.766410665120997, 'f1': 0.7096947333109694, 'number': 6901} | {'precision': 0.795727342803656, 'recall': 0.8158518685785254, 'f1': 0.8056639536180176, 'number': 8857} | {'precision': 0.9844660194174757, 'recall': 0.9873417721518988, 'f1': 0.9859017987360232, 'number': 7189} | {'precision': 0.6935483870967742, 'recall': 0.9347826086956522, 'f1': 0.7962962962962964, 'number': 92} | {'precision': 0.9229010127409344, 'recall': 0.9856943475226797, 'f1': 0.9532647207693606, 'number': 5732} | 0.8300 | 0.8811 | 0.8548 | 0.8361 |
85
+ | 0.4312 | 5.35 | 27000 | 0.4861 | {'precision': 0.6542461005199307, 'recall': 0.7658310389798579, 'f1': 0.7056545830829829, 'number': 6901} | {'precision': 0.7903508771929825, 'recall': 0.8138195777351248, 'f1': 0.8019135562107137, 'number': 8857} | {'precision': 0.981501932633904, 'recall': 0.989010989010989, 'f1': 0.9852421533984619, 'number': 7189} | {'precision': 0.6717557251908397, 'recall': 0.9565217391304348, 'f1': 0.789237668161435, 'number': 92} | {'precision': 0.9154405820533549, 'recall': 0.9877878576413119, 'f1': 0.9502391541495343, 'number': 5732} | 0.8243 | 0.8812 | 0.8518 | 0.8335 |
86
+ | 0.4315 | 5.54 | 28000 | 0.4820 | {'precision': 0.6583983883152859, 'recall': 0.7577162730039124, 'f1': 0.7045745469244761, 'number': 6901} | {'precision': 0.7930996593780903, 'recall': 0.8149486282036807, 'f1': 0.8038757099899767, 'number': 8857} | {'precision': 0.9831328632655882, 'recall': 0.9891500904159132, 'f1': 0.9861322978782415, 'number': 7189} | {'precision': 0.6796875, 'recall': 0.9456521739130435, 'f1': 0.7909090909090909, 'number': 92} | {'precision': 0.9204878048780488, 'recall': 0.9876133984647593, 'f1': 0.9528698872243729, 'number': 5732} | 0.8282 | 0.8796 | 0.8531 | 0.8341 |
87
+ | 0.4316 | 5.74 | 29000 | 0.4762 | {'precision': 0.6612373737373738, 'recall': 0.7588755252861904, 'f1': 0.7066999527697188, 'number': 6901} | {'precision': 0.7980441709702231, 'recall': 0.8200293553121825, 'f1': 0.8088874039425326, 'number': 8857} | {'precision': 0.9830040071852978, 'recall': 0.9895673946306858, 'f1': 0.9862747816442535, 'number': 7189} | {'precision': 0.672, 'recall': 0.9130434782608695, 'f1': 0.7741935483870968, 'number': 92} | {'precision': 0.9263813739957371, 'recall': 0.9856943475226797, 'f1': 0.955117910573916, 'number': 5732} | 0.8316 | 0.8810 | 0.8556 | 0.8370 |
88
+ | 0.4278 | 5.94 | 30000 | 0.4823 | {'precision': 0.6596223583843942, 'recall': 0.7643819736270105, 'f1': 0.7081487447979596, 'number': 6901} | {'precision': 0.7918309242225142, 'recall': 0.8164163938128034, 'f1': 0.8039357385068653, 'number': 8857} | {'precision': 0.9835339698353397, 'recall': 0.9887327862011406, 'f1': 0.9861265260821309, 'number': 7189} | {'precision': 0.68, 'recall': 0.9239130434782609, 'f1': 0.783410138248848, 'number': 92} | {'precision': 0.9244109947643979, 'recall': 0.9856943475226797, 'f1': 0.9540695710908478, 'number': 5732} | 0.8286 | 0.8811 | 0.8540 | 0.8348 |
89
+ | 0.4211 | 6.14 | 31000 | 0.4794 | {'precision': 0.6637281206081512, 'recall': 0.7527894508042313, 'f1': 0.705458989679522, 'number': 6901} | {'precision': 0.7826885671061162, 'recall': 0.8177712543750706, 'f1': 0.7998453978245265, 'number': 8857} | {'precision': 0.9804649883065071, 'recall': 0.9913757128947003, 'f1': 0.9858901646147462, 'number': 7189} | {'precision': 0.6854838709677419, 'recall': 0.9239130434782609, 'f1': 0.787037037037037, 'number': 92} | {'precision': 0.925495333224169, 'recall': 0.9860432658757851, 'f1': 0.9548103724976772, 'number': 5732} | 0.8274 | 0.8794 | 0.8526 | 0.8356 |
90
+ | 0.4231 | 6.34 | 32000 | 0.4757 | {'precision': 0.6627510420613869, 'recall': 0.7603245906390378, 'f1': 0.7081927385612093, 'number': 6901} | {'precision': 0.7868816735672259, 'recall': 0.815400248391103, 'f1': 0.8008871638480732, 'number': 8857} | {'precision': 0.9844875346260388, 'recall': 0.9887327862011406, 'f1': 0.9866055937261433, 'number': 7189} | {'precision': 0.696, 'recall': 0.9456521739130435, 'f1': 0.8018433179723502, 'number': 92} | {'precision': 0.9235918367346939, 'recall': 0.9869155617585486, 'f1': 0.9542042675212956, 'number': 5732} | 0.8284 | 0.8801 | 0.8535 | 0.8364 |
91
+ | 0.4302 | 6.53 | 33000 | 0.4786 | {'precision': 0.6624333248666497, 'recall': 0.7558324880452109, 'f1': 0.706057529610829, 'number': 6901} | {'precision': 0.7953421948808085, 'recall': 0.8174325392345038, 'f1': 0.8062360801781736, 'number': 8857} | {'precision': 0.9832664914949523, 'recall': 0.989010989010989, 'f1': 0.986130374479889, 'number': 7189} | {'precision': 0.7017543859649122, 'recall': 0.8695652173913043, 'f1': 0.7766990291262136, 'number': 92} | {'precision': 0.9243216737495914, 'recall': 0.9865666434054431, 'f1': 0.9544303797468354, 'number': 5732} | 0.8312 | 0.8794 | 0.8546 | 0.8355 |
92
+ | 0.4223 | 6.73 | 34000 | 0.4795 | {'precision': 0.6597820577800304, 'recall': 0.7545283292276481, 'f1': 0.703981612925032, 'number': 6901} | {'precision': 0.7922049485439019, 'recall': 0.8169809190470814, 'f1': 0.8044022011005503, 'number': 8857} | {'precision': 0.9832664914949523, 'recall': 0.989010989010989, 'f1': 0.986130374479889, 'number': 7189} | {'precision': 0.6904761904761905, 'recall': 0.9456521739130435, 'f1': 0.7981651376146789, 'number': 92} | {'precision': 0.923730197615548, 'recall': 0.9867411025819958, 'f1': 0.9541965415436525, 'number': 5732} | 0.8292 | 0.8792 | 0.8535 | 0.8363 |
93
+ | 0.4184 | 6.93 | 35000 | 0.4803 | {'precision': 0.6614741641337386, 'recall': 0.7568468337922041, 'f1': 0.7059539095762654, 'number': 6901} | {'precision': 0.788057099269914, 'recall': 0.8165292988596591, 'f1': 0.8020405899966729, 'number': 8857} | {'precision': 0.9823472624465591, 'recall': 0.9908193072750034, 'f1': 0.9865650969529086, 'number': 7189} | {'precision': 0.6821705426356589, 'recall': 0.9565217391304348, 'f1': 0.7963800904977375, 'number': 92} | {'precision': 0.9216229428059313, 'recall': 0.9867411025819958, 'f1': 0.9530710253601821, 'number': 5732} | 0.8278 | 0.8801 | 0.8532 | 0.8356 |
94
+ | 0.4071 | 7.13 | 36000 | 0.4882 | {'precision': 0.6610340479192938, 'recall': 0.7596000579626141, 'f1': 0.7068977142471848, 'number': 6901} | {'precision': 0.7952072111685171, 'recall': 0.8167551089533702, 'f1': 0.8058371393561323, 'number': 8857} | {'precision': 0.9823423920540765, 'recall': 0.9905411044651551, 'f1': 0.9864247125640672, 'number': 7189} | {'precision': 0.6904761904761905, 'recall': 0.9456521739130435, 'f1': 0.7981651376146789, 'number': 92} | {'precision': 0.9252826478780928, 'recall': 0.9851709699930217, 'f1': 0.9542881284326151, 'number': 5732} | 0.8304 | 0.8804 | 0.8547 | 0.8358 |
95
+ | 0.4093 | 7.33 | 37000 | 0.4856 | {'precision': 0.6579605098725319, 'recall': 0.7629329082741632, 'f1': 0.7065691471515801, 'number': 6901} | {'precision': 0.794249972566663, 'recall': 0.8172067291407926, 'f1': 0.8055648302726766, 'number': 8857} | {'precision': 0.9832734310201825, 'recall': 0.9894282932257615, 'f1': 0.9863412604867227, 'number': 7189} | {'precision': 0.7, 'recall': 0.9130434782608695, 'f1': 0.7924528301886793, 'number': 92} | {'precision': 0.9225248735932148, 'recall': 0.9867411025819958, 'f1': 0.9535530641490347, 'number': 5732} | 0.8286 | 0.8813 | 0.8542 | 0.8367 |
96
+ | 0.4124 | 7.52 | 38000 | 0.4802 | {'precision': 0.6584084084084084, 'recall': 0.762498188668309, 'f1': 0.7066407036862955, 'number': 6901} | {'precision': 0.7942951179374658, 'recall': 0.8174325392345038, 'f1': 0.8056977520587582, 'number': 8857} | {'precision': 0.9831375259156876, 'recall': 0.9894282932257615, 'f1': 0.9862728785357736, 'number': 7189} | {'precision': 0.6821705426356589, 'recall': 0.9565217391304348, 'f1': 0.7963800904977375, 'number': 92} | {'precision': 0.9221244705115673, 'recall': 0.9874389392882066, 'f1': 0.9536647009267059, 'number': 5732} | 0.8286 | 0.8815 | 0.8543 | 0.8362 |
97
+ | 0.414 | 7.72 | 39000 | 0.4830 | {'precision': 0.6575084681972149, 'recall': 0.7594551514273293, 'f1': 0.7048144163528779, 'number': 6901} | {'precision': 0.7878721779910568, 'recall': 0.8156260584848143, 'f1': 0.8015089315433264, 'number': 8857} | {'precision': 0.9819235545743066, 'recall': 0.9898455974405341, 'f1': 0.9858686616791354, 'number': 7189} | {'precision': 0.6850393700787402, 'recall': 0.9456521739130435, 'f1': 0.7945205479452054, 'number': 92} | {'precision': 0.925229057591623, 'recall': 0.9865666434054431, 'f1': 0.9549138804457953, 'number': 5732} | 0.8268 | 0.8802 | 0.8527 | 0.8366 |
98
+ | 0.4212 | 7.92 | 40000 | 0.4803 | {'precision': 0.6614674319940105, 'recall': 0.7681495435444139, 'f1': 0.7108280254777071, 'number': 6901} | {'precision': 0.7921052631578948, 'recall': 0.8156260584848143, 'f1': 0.8036936084997496, 'number': 8857} | {'precision': 0.9846089850249584, 'recall': 0.9877590763666713, 'f1': 0.9861815151725575, 'number': 7189} | {'precision': 0.6854838709677419, 'recall': 0.9239130434782609, 'f1': 0.787037037037037, 'number': 92} | {'precision': 0.9240444299248611, 'recall': 0.9869155617585486, 'f1': 0.9544457567065969, 'number': 5732} | 0.8292 | 0.8817 | 0.8547 | 0.8373 |
99
+ | 0.3994 | 8.12 | 41000 | 0.4923 | {'precision': 0.6586345381526104, 'recall': 0.7604694971743226, 'f1': 0.7058981774161006, 'number': 6901} | {'precision': 0.7905782052683353, 'recall': 0.8166422039065147, 'f1': 0.8033988670443185, 'number': 8857} | {'precision': 0.9830016583747927, 'recall': 0.9894282932257615, 'f1': 0.9862045060658579, 'number': 7189} | {'precision': 0.6821705426356589, 'recall': 0.9565217391304348, 'f1': 0.7963800904977375, 'number': 92} | {'precision': 0.9232903541700669, 'recall': 0.9869155617585486, 'f1': 0.9540433426089888, 'number': 5732} | 0.8278 | 0.8807 | 0.8535 | 0.8355 |
100
+ | 0.4052 | 8.32 | 42000 | 0.4866 | {'precision': 0.6577553593947036, 'recall': 0.7558324880452109, 'f1': 0.7033915447373744, 'number': 6901} | {'precision': 0.7920087575259989, 'recall': 0.8168680140002258, 'f1': 0.8042463317029791, 'number': 8857} | {'precision': 0.9823326432022084, 'recall': 0.9899846988454584, 'f1': 0.9861438270749618, 'number': 7189} | {'precision': 0.6846153846153846, 'recall': 0.967391304347826, 'f1': 0.8018018018018018, 'number': 92} | {'precision': 0.9250531827851416, 'recall': 0.9862177250523377, 'f1': 0.9546567592670776, 'number': 5732} | 0.8285 | 0.8797 | 0.8533 | 0.8360 |
101
+ | 0.4042 | 8.51 | 43000 | 0.4866 | {'precision': 0.663912546078556, 'recall': 0.7568468337922041, 'f1': 0.7073401950162513, 'number': 6901} | {'precision': 0.7910823838737949, 'recall': 0.8152873433442475, 'f1': 0.8030025020850708, 'number': 8857} | {'precision': 0.980462300495322, 'recall': 0.991236611489776, 'f1': 0.9858200179843675, 'number': 7189} | {'precision': 0.6796875, 'recall': 0.9456521739130435, 'f1': 0.7909090909090909, 'number': 92} | {'precision': 0.921961550993809, 'recall': 0.9872644801116539, 'f1': 0.9534962089300758, 'number': 5732} | 0.8292 | 0.8799 | 0.8538 | 0.8365 |
102
+ | 0.4135 | 8.71 | 44000 | 0.4830 | {'precision': 0.664262212098203, 'recall': 0.7606144037096073, 'f1': 0.7091805715057758, 'number': 6901} | {'precision': 0.7914884282110344, 'recall': 0.8147228181099695, 'f1': 0.802937576499388, 'number': 8857} | {'precision': 0.9812594736116853, 'recall': 0.9905411044651551, 'f1': 0.985878443859892, 'number': 7189} | {'precision': 0.6829268292682927, 'recall': 0.9130434782608695, 'f1': 0.7813953488372093, 'number': 92} | {'precision': 0.9230141901810471, 'recall': 0.9872644801116539, 'f1': 0.9540588384051252, 'number': 5732} | 0.8296 | 0.8804 | 0.8543 | 0.8368 |
103
+ | 0.3958 | 8.91 | 45000 | 0.4859 | {'precision': 0.6619275289380976, 'recall': 0.7623532821330242, 'f1': 0.7085999057175567, 'number': 6901} | {'precision': 0.7909240021869874, 'recall': 0.8166422039065147, 'f1': 0.8035773802910788, 'number': 8857} | {'precision': 0.9831445150594087, 'recall': 0.9898455974405341, 'f1': 0.9864836764400082, 'number': 7189} | {'precision': 0.6910569105691057, 'recall': 0.9239130434782609, 'f1': 0.7906976744186046, 'number': 92} | {'precision': 0.9235543939888925, 'recall': 0.9863921842288904, 'f1': 0.9539395984477813, 'number': 5732} | 0.8290 | 0.8811 | 0.8543 | 0.8371 |
104
+ | 0.3985 | 9.11 | 46000 | 0.4897 | {'precision': 0.6627135934710533, 'recall': 0.7530792638748007, 'f1': 0.7050125483280201, 'number': 6901} | {'precision': 0.7878688881629097, 'recall': 0.8168680140002258, 'f1': 0.8021064301552105, 'number': 8857} | {'precision': 0.9842192691029901, 'recall': 0.989010989010989, 'f1': 0.9866093110386457, 'number': 7189} | {'precision': 0.6771653543307087, 'recall': 0.9347826086956522, 'f1': 0.7853881278538813, 'number': 92} | {'precision': 0.9269413889344935, 'recall': 0.984996510816469, 'f1': 0.9550875412331895, 'number': 5732} | 0.8296 | 0.8785 | 0.8533 | 0.8352 |
105
+ | 0.3944 | 9.31 | 47000 | 0.4890 | {'precision': 0.6661152818424736, 'recall': 0.7585857122156209, 'f1': 0.709349593495935, 'number': 6901} | {'precision': 0.7902785363189514, 'recall': 0.8168680140002258, 'f1': 0.8033533200088829, 'number': 8857} | {'precision': 0.9839535205422604, 'recall': 0.9894282932257615, 'f1': 0.9866833125260092, 'number': 7189} | {'precision': 0.6854838709677419, 'recall': 0.9239130434782609, 'f1': 0.787037037037037, 'number': 92} | {'precision': 0.9251923391717138, 'recall': 0.9860432658757851, 'f1': 0.954649100582721, 'number': 5732} | 0.8308 | 0.8801 | 0.8547 | 0.8369 |
106
+ | 0.3959 | 9.5 | 48000 | 0.4869 | {'precision': 0.6632755589047978, 'recall': 0.765251412838719, 'f1': 0.7106236964273699, 'number': 6901} | {'precision': 0.7917122239230264, 'recall': 0.8175454442813593, 'f1': 0.8044214853080043, 'number': 8857} | {'precision': 0.9835476289229919, 'recall': 0.9895673946306858, 'f1': 0.9865483289418943, 'number': 7189} | {'precision': 0.688, 'recall': 0.9347826086956522, 'f1': 0.7926267281105991, 'number': 92} | {'precision': 0.9240196078431373, 'recall': 0.9865666434054431, 'f1': 0.9542693216334796, 'number': 5732} | 0.8297 | 0.8820 | 0.8551 | 0.8369 |
107
+ | 0.3979 | 9.7 | 49000 | 0.4878 | {'precision': 0.666244939271255, 'recall': 0.7630778148094479, 'f1': 0.7113812901046943, 'number': 6901} | {'precision': 0.7906239755218009, 'recall': 0.8168680140002258, 'f1': 0.8035317636605953, 'number': 8857} | {'precision': 0.9835453539823009, 'recall': 0.9894282932257615, 'f1': 0.9864780528396089, 'number': 7189} | {'precision': 0.6829268292682927, 'recall': 0.9130434782608695, 'f1': 0.7813953488372093, 'number': 92} | {'precision': 0.9240071907174375, 'recall': 0.9863921842288904, 'f1': 0.9541810817652518, 'number': 5732} | 0.8304 | 0.8812 | 0.8550 | 0.8369 |
108
+ | 0.4095 | 9.9 | 50000 | 0.4862 | {'precision': 0.665783497350492, 'recall': 0.7646717866975801, 'f1': 0.7118095366561004, 'number': 6901} | {'precision': 0.7912472647702407, 'recall': 0.8165292988596591, 'f1': 0.80368950380619, 'number': 8857} | {'precision': 0.9832734310201825, 'recall': 0.9894282932257615, 'f1': 0.9863412604867227, 'number': 7189} | {'precision': 0.6829268292682927, 'recall': 0.9130434782608695, 'f1': 0.7813953488372093, 'number': 92} | {'precision': 0.9244604316546763, 'recall': 0.9863921842288904, 'f1': 0.9544226873733964, 'number': 5732} | 0.8304 | 0.8814 | 0.8552 | 0.8373 |
109
+
110
+
111
+ ### Framework versions
112
+
113
+ - Transformers 4.34.1
114
+ - Pytorch 2.1.0+cu118
115
+ - Datasets 2.14.5
116
+ - Tokenizers 0.14.1
all_results.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "eval_COMMENT": {
4
+ "f1": 0.7114860480207656,
5
+ "number": 7171,
6
+ "precision": 0.6653720111664037,
7
+ "recall": 0.7644679960953842
8
+ },
9
+ "eval_NAME": {
10
+ "f1": 0.8086344637849849,
11
+ "number": 9305,
12
+ "precision": 0.7963734889537307,
13
+ "recall": 0.8212788823213326
14
+ },
15
+ "eval_QTY": {
16
+ "f1": 0.9862540673351484,
17
+ "number": 7495,
18
+ "precision": 0.981755684822845,
19
+ "recall": 0.9907938625750501
20
+ },
21
+ "eval_RANGE_END": {
22
+ "f1": 0.7443946188340806,
23
+ "number": 90,
24
+ "precision": 0.6240601503759399,
25
+ "recall": 0.9222222222222223
26
+ },
27
+ "eval_UNIT": {
28
+ "f1": 0.95358036651328,
29
+ "number": 5989,
30
+ "precision": 0.923100969052829,
31
+ "recall": 0.9861412589747871
32
+ },
33
+ "eval_loss": 0.4705313444137573,
34
+ "eval_overall_accuracy": 0.8349855394073885,
35
+ "eval_overall_f1": 0.8563730235559858,
36
+ "eval_overall_precision": 0.8311619166927654,
37
+ "eval_overall_recall": 0.8831613976705491,
38
+ "eval_runtime": 8.4988,
39
+ "eval_samples_per_second": 1053.557,
40
+ "eval_steps_per_second": 32.946
41
+ }
config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "napsternxg/gte-small-L3-ingredient-v2",
3
+ "architectures": [
4
+ "PretrainedTaggerModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 384,
11
+ "id2label": {
12
+ "0": "O",
13
+ "1": "B-COMMENT",
14
+ "2": "I-COMMENT",
15
+ "3": "B-NAME",
16
+ "4": "I-NAME",
17
+ "5": "B-RANGE_END",
18
+ "6": "I-RANGE_END",
19
+ "7": "B-QTY",
20
+ "8": "I-QTY",
21
+ "9": "B-UNIT",
22
+ "10": "I-UNIT"
23
+ },
24
+ "initializer_range": 0.02,
25
+ "intermediate_size": 1536,
26
+ "label2id": {
27
+ "B-COMMENT": 1,
28
+ "B-NAME": 3,
29
+ "B-QTY": 7,
30
+ "B-RANGE_END": 5,
31
+ "B-UNIT": 9,
32
+ "I-COMMENT": 2,
33
+ "I-NAME": 4,
34
+ "I-QTY": 8,
35
+ "I-RANGE_END": 6,
36
+ "I-UNIT": 10,
37
+ "O": 0
38
+ },
39
+ "layer_norm_eps": 1e-12,
40
+ "max_position_embeddings": 512,
41
+ "model_type": "bert",
42
+ "num_attention_heads": 12,
43
+ "num_hidden_layers": 3,
44
+ "pad_token_id": 0,
45
+ "position_embedding_type": "absolute",
46
+ "torch_dtype": "float32",
47
+ "transformers_version": "4.34.1",
48
+ "type_vocab_size": 2,
49
+ "use_cache": true,
50
+ "vocab_size": 30522
51
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2395ae8a9abeffa945966cd12ef3f2d1b87f42814c0ff25275981260c3d1ed2b
3
+ size 69004115
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
test_results.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "eval_COMMENT": {
4
+ "f1": 0.7114860480207656,
5
+ "number": 7171,
6
+ "precision": 0.6653720111664037,
7
+ "recall": 0.7644679960953842
8
+ },
9
+ "eval_NAME": {
10
+ "f1": 0.8086344637849849,
11
+ "number": 9305,
12
+ "precision": 0.7963734889537307,
13
+ "recall": 0.8212788823213326
14
+ },
15
+ "eval_QTY": {
16
+ "f1": 0.9862540673351484,
17
+ "number": 7495,
18
+ "precision": 0.981755684822845,
19
+ "recall": 0.9907938625750501
20
+ },
21
+ "eval_RANGE_END": {
22
+ "f1": 0.7443946188340806,
23
+ "number": 90,
24
+ "precision": 0.6240601503759399,
25
+ "recall": 0.9222222222222223
26
+ },
27
+ "eval_UNIT": {
28
+ "f1": 0.95358036651328,
29
+ "number": 5989,
30
+ "precision": 0.923100969052829,
31
+ "recall": 0.9861412589747871
32
+ },
33
+ "eval_loss": 0.4705313444137573,
34
+ "eval_overall_accuracy": 0.8349855394073885,
35
+ "eval_overall_f1": 0.8563730235559858,
36
+ "eval_overall_precision": 0.8311619166927654,
37
+ "eval_overall_recall": 0.8831613976705491,
38
+ "eval_runtime": 8.4988,
39
+ "eval_samples_per_second": 1053.557,
40
+ "eval_steps_per_second": 32.946
41
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "max_length": 128,
50
+ "model_max_length": 1000000000000000019884624838656,
51
+ "never_split": null,
52
+ "pad_to_multiple_of": null,
53
+ "pad_token": "[PAD]",
54
+ "pad_token_type_id": 0,
55
+ "padding_side": "right",
56
+ "sep_token": "[SEP]",
57
+ "stride": 0,
58
+ "strip_accents": null,
59
+ "tokenize_chinese_chars": true,
60
+ "tokenizer_class": "BertTokenizer",
61
+ "truncation_side": "right",
62
+ "truncation_strategy": "longest_first",
63
+ "unk_token": "[UNK]"
64
+ }
train_results.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "eval_COMMENT": {
4
+ "f1": 0.7388161975793072,
5
+ "number": 129716,
6
+ "precision": 0.694144754676064,
7
+ "recall": 0.7896327361312405
8
+ },
9
+ "eval_NAME": {
10
+ "f1": 0.8224766455255967,
11
+ "number": 167638,
12
+ "precision": 0.809525735315358,
13
+ "recall": 0.8358486739283456
14
+ },
15
+ "eval_QTY": {
16
+ "f1": 0.9868797185369786,
17
+ "number": 135780,
18
+ "precision": 0.9822001750802452,
19
+ "recall": 0.9916040653999116
20
+ },
21
+ "eval_RANGE_END": {
22
+ "f1": 0.7616517749335909,
23
+ "number": 1682,
24
+ "precision": 0.6413176087840585,
25
+ "recall": 0.9375743162901308
26
+ },
27
+ "eval_UNIT": {
28
+ "f1": 0.9564042026259744,
29
+ "number": 108832,
30
+ "precision": 0.926564721085505,
31
+ "recall": 0.9882295648338724
32
+ },
33
+ "eval_loss": 0.4124242663383484,
34
+ "eval_overall_accuracy": 0.855277993837768,
35
+ "eval_overall_f1": 0.868490442544095,
36
+ "eval_overall_precision": 0.8439132826504565,
37
+ "eval_overall_recall": 0.894542056624875,
38
+ "eval_runtime": 130.0825,
39
+ "eval_samples_per_second": 1242.311,
40
+ "eval_steps_per_second": 38.829
41
+ }
trainer_state.json ADDED
@@ -0,0 +1,2734 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.474032998085022,
3
+ "best_model_checkpoint": "nyt_ingredients-tagger-gte-small-L3-ingredient-v2/checkpoint-24000",
4
+ "epoch": 10.0,
5
+ "eval_steps": 1000,
6
+ "global_step": 50510,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.1,
13
+ "learning_rate": 4.9505048505246485e-05,
14
+ "loss": 1.1293,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 0.2,
19
+ "learning_rate": 4.9010097010492975e-05,
20
+ "loss": 0.6931,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 0.2,
25
+ "eval_COMMENT": {
26
+ "f1": 0.5770606987183658,
27
+ "number": 6901,
28
+ "precision": 0.5236127508854782,
29
+ "recall": 0.6426604839878278
30
+ },
31
+ "eval_NAME": {
32
+ "f1": 0.7875208913649026,
33
+ "number": 8857,
34
+ "precision": 0.7773012207192346,
35
+ "recall": 0.7980128711753416
36
+ },
37
+ "eval_QTY": {
38
+ "f1": 0.9780634343998882,
39
+ "number": 7189,
40
+ "precision": 0.9824561403508771,
41
+ "recall": 0.9737098344693281
42
+ },
43
+ "eval_RANGE_END": {
44
+ "f1": 0.0,
45
+ "number": 92,
46
+ "precision": 0.0,
47
+ "recall": 0.0
48
+ },
49
+ "eval_UNIT": {
50
+ "f1": 0.9434346865975879,
51
+ "number": 5732,
52
+ "precision": 0.9192320423700762,
53
+ "recall": 0.9689462665736218
54
+ },
55
+ "eval_loss": 0.6230219006538391,
56
+ "eval_overall_accuracy": 0.7985813450669499,
57
+ "eval_overall_f1": 0.8086250651249558,
58
+ "eval_overall_precision": 0.7828506345590628,
59
+ "eval_overall_recall": 0.8361544610892913,
60
+ "eval_runtime": 7.9128,
61
+ "eval_samples_per_second": 1074.967,
62
+ "eval_steps_per_second": 33.616,
63
+ "step": 1000
64
+ },
65
+ {
66
+ "epoch": 0.3,
67
+ "learning_rate": 4.851514551573946e-05,
68
+ "loss": 0.6087,
69
+ "step": 1500
70
+ },
71
+ {
72
+ "epoch": 0.4,
73
+ "learning_rate": 4.802019402098595e-05,
74
+ "loss": 0.5826,
75
+ "step": 2000
76
+ },
77
+ {
78
+ "epoch": 0.4,
79
+ "eval_COMMENT": {
80
+ "f1": 0.602454780361757,
81
+ "number": 6901,
82
+ "precision": 0.5435365427205968,
83
+ "recall": 0.6756991740327489
84
+ },
85
+ "eval_NAME": {
86
+ "f1": 0.7907440212577502,
87
+ "number": 8857,
88
+ "precision": 0.7757141305528402,
89
+ "recall": 0.8063678446426555
90
+ },
91
+ "eval_QTY": {
92
+ "f1": 0.9754149163280765,
93
+ "number": 7189,
94
+ "precision": 0.9659028914348063,
95
+ "recall": 0.9851161496731117
96
+ },
97
+ "eval_RANGE_END": {
98
+ "f1": 0.6567164179104478,
99
+ "number": 92,
100
+ "precision": 0.6055045871559633,
101
+ "recall": 0.717391304347826
102
+ },
103
+ "eval_UNIT": {
104
+ "f1": 0.9462474645030426,
105
+ "number": 5732,
106
+ "precision": 0.9177049180327869,
107
+ "recall": 0.9766224703419399
108
+ },
109
+ "eval_loss": 0.5530511736869812,
110
+ "eval_overall_accuracy": 0.8078557068618898,
111
+ "eval_overall_f1": 0.8170321807714068,
112
+ "eval_overall_precision": 0.7837009608325087,
113
+ "eval_overall_recall": 0.8533245281707275,
114
+ "eval_runtime": 6.3157,
115
+ "eval_samples_per_second": 1346.806,
116
+ "eval_steps_per_second": 42.117,
117
+ "step": 2000
118
+ },
119
+ {
120
+ "epoch": 0.49,
121
+ "learning_rate": 4.752524252623243e-05,
122
+ "loss": 0.5569,
123
+ "step": 2500
124
+ },
125
+ {
126
+ "epoch": 0.59,
127
+ "learning_rate": 4.703029103147892e-05,
128
+ "loss": 0.5435,
129
+ "step": 3000
130
+ },
131
+ {
132
+ "epoch": 0.59,
133
+ "eval_COMMENT": {
134
+ "f1": 0.6313494946826079,
135
+ "number": 6901,
136
+ "precision": 0.5801165331391115,
137
+ "recall": 0.6925083321257789
138
+ },
139
+ "eval_NAME": {
140
+ "f1": 0.7944305207463102,
141
+ "number": 8857,
142
+ "precision": 0.7839085513299626,
143
+ "recall": 0.8052387941740996
144
+ },
145
+ "eval_QTY": {
146
+ "f1": 0.9791782343142699,
147
+ "number": 7189,
148
+ "precision": 0.9771436487048067,
149
+ "recall": 0.9812213103352344
150
+ },
151
+ "eval_RANGE_END": {
152
+ "f1": 0.7109004739336493,
153
+ "number": 92,
154
+ "precision": 0.6302521008403361,
155
+ "recall": 0.8152173913043478
156
+ },
157
+ "eval_UNIT": {
158
+ "f1": 0.9472093999160722,
159
+ "number": 5732,
160
+ "precision": 0.9126637554585153,
161
+ "recall": 0.9844731332868109
162
+ },
163
+ "eval_loss": 0.5327398180961609,
164
+ "eval_overall_accuracy": 0.8150438114023442,
165
+ "eval_overall_f1": 0.827899644462333,
166
+ "eval_overall_precision": 0.7999157403506497,
167
+ "eval_overall_recall": 0.8579124813179938,
168
+ "eval_runtime": 8.1233,
169
+ "eval_samples_per_second": 1047.112,
170
+ "eval_steps_per_second": 32.745,
171
+ "step": 3000
172
+ },
173
+ {
174
+ "epoch": 0.69,
175
+ "learning_rate": 4.65353395367254e-05,
176
+ "loss": 0.5324,
177
+ "step": 3500
178
+ },
179
+ {
180
+ "epoch": 0.79,
181
+ "learning_rate": 4.6040388041971886e-05,
182
+ "loss": 0.5333,
183
+ "step": 4000
184
+ },
185
+ {
186
+ "epoch": 0.79,
187
+ "eval_COMMENT": {
188
+ "f1": 0.6446886446886447,
189
+ "number": 6901,
190
+ "precision": 0.5875760104924288,
191
+ "recall": 0.7140994058832053
192
+ },
193
+ "eval_NAME": {
194
+ "f1": 0.7953999888349244,
195
+ "number": 8857,
196
+ "precision": 0.786660777385159,
197
+ "recall": 0.8043355537992548
198
+ },
199
+ "eval_QTY": {
200
+ "f1": 0.9809583594894328,
201
+ "number": 7189,
202
+ "precision": 0.9837716843872412,
203
+ "recall": 0.9781610794269022
204
+ },
205
+ "eval_RANGE_END": {
206
+ "f1": 0.7555555555555556,
207
+ "number": 92,
208
+ "precision": 0.6390977443609023,
209
+ "recall": 0.9239130434782609
210
+ },
211
+ "eval_UNIT": {
212
+ "f1": 0.9506497918967128,
213
+ "number": 5732,
214
+ "precision": 0.9263366992219831,
215
+ "recall": 0.9762735519888346
216
+ },
217
+ "eval_loss": 0.5212323665618896,
218
+ "eval_overall_accuracy": 0.8183059591093578,
219
+ "eval_overall_f1": 0.831933619994625,
220
+ "eval_overall_precision": 0.8049731838127743,
221
+ "eval_overall_recall": 0.8607625734246289,
222
+ "eval_runtime": 8.6379,
223
+ "eval_samples_per_second": 984.732,
224
+ "eval_steps_per_second": 30.795,
225
+ "step": 4000
226
+ },
227
+ {
228
+ "epoch": 0.89,
229
+ "learning_rate": 4.5545436547218376e-05,
230
+ "loss": 0.5285,
231
+ "step": 4500
232
+ },
233
+ {
234
+ "epoch": 0.99,
235
+ "learning_rate": 4.505048505246486e-05,
236
+ "loss": 0.5199,
237
+ "step": 5000
238
+ },
239
+ {
240
+ "epoch": 0.99,
241
+ "eval_COMMENT": {
242
+ "f1": 0.6402057097646205,
243
+ "number": 6901,
244
+ "precision": 0.5873457536898137,
245
+ "recall": 0.7035212288074192
246
+ },
247
+ "eval_NAME": {
248
+ "f1": 0.8005563282336579,
249
+ "number": 8857,
250
+ "precision": 0.7890984865101996,
251
+ "recall": 0.812351812126002
252
+ },
253
+ "eval_QTY": {
254
+ "f1": 0.9803540437348144,
255
+ "number": 7189,
256
+ "precision": 0.978519955654102,
257
+ "recall": 0.9821950201697037
258
+ },
259
+ "eval_RANGE_END": {
260
+ "f1": 0.7747747747747747,
261
+ "number": 92,
262
+ "precision": 0.6615384615384615,
263
+ "recall": 0.9347826086956522
264
+ },
265
+ "eval_UNIT": {
266
+ "f1": 0.9499704716105627,
267
+ "number": 5732,
268
+ "precision": 0.9197843489625878,
269
+ "recall": 0.9822051639916259
270
+ },
271
+ "eval_loss": 0.5120549201965332,
272
+ "eval_overall_accuracy": 0.8185525167848879,
273
+ "eval_overall_f1": 0.8328133910301567,
274
+ "eval_overall_precision": 0.804738906356358,
275
+ "eval_overall_recall": 0.8629175211150116,
276
+ "eval_runtime": 6.4358,
277
+ "eval_samples_per_second": 1321.664,
278
+ "eval_steps_per_second": 41.331,
279
+ "step": 5000
280
+ },
281
+ {
282
+ "epoch": 1.09,
283
+ "learning_rate": 4.455553355771135e-05,
284
+ "loss": 0.5127,
285
+ "step": 5500
286
+ },
287
+ {
288
+ "epoch": 1.19,
289
+ "learning_rate": 4.406058206295783e-05,
290
+ "loss": 0.4983,
291
+ "step": 6000
292
+ },
293
+ {
294
+ "epoch": 1.19,
295
+ "eval_COMMENT": {
296
+ "f1": 0.6476600322754169,
297
+ "number": 6901,
298
+ "precision": 0.6041901894367081,
299
+ "recall": 0.6978698739313143
300
+ },
301
+ "eval_NAME": {
302
+ "f1": 0.7935644937586686,
303
+ "number": 8857,
304
+ "precision": 0.7801047120418848,
305
+ "recall": 0.8074968951112115
306
+ },
307
+ "eval_QTY": {
308
+ "f1": 0.9824293353705119,
309
+ "number": 7189,
310
+ "precision": 0.980998613037448,
311
+ "recall": 0.983864237028794
312
+ },
313
+ "eval_RANGE_END": {
314
+ "f1": 0.7601809954751132,
315
+ "number": 92,
316
+ "precision": 0.6511627906976745,
317
+ "recall": 0.9130434782608695
318
+ },
319
+ "eval_UNIT": {
320
+ "f1": 0.9500843170320405,
321
+ "number": 5732,
322
+ "precision": 0.9193864229765013,
323
+ "recall": 0.9829030006978368
324
+ },
325
+ "eval_loss": 0.5088106393814087,
326
+ "eval_overall_accuracy": 0.8192163259113151,
327
+ "eval_overall_f1": 0.8339592771611903,
328
+ "eval_overall_precision": 0.8089590276416389,
329
+ "eval_overall_recall": 0.8605540300997532,
330
+ "eval_runtime": 8.5928,
331
+ "eval_samples_per_second": 989.902,
332
+ "eval_steps_per_second": 30.956,
333
+ "step": 6000
334
+ },
335
+ {
336
+ "epoch": 1.29,
337
+ "learning_rate": 4.356563056820432e-05,
338
+ "loss": 0.5102,
339
+ "step": 6500
340
+ },
341
+ {
342
+ "epoch": 1.39,
343
+ "learning_rate": 4.3070679073450804e-05,
344
+ "loss": 0.5031,
345
+ "step": 7000
346
+ },
347
+ {
348
+ "epoch": 1.39,
349
+ "eval_COMMENT": {
350
+ "f1": 0.6483065113460373,
351
+ "number": 6901,
352
+ "precision": 0.6055345911949686,
353
+ "recall": 0.6975800608607449
354
+ },
355
+ "eval_NAME": {
356
+ "f1": 0.797360248447205,
357
+ "number": 8857,
358
+ "precision": 0.7835422343324251,
359
+ "recall": 0.8116743818448685
360
+ },
361
+ "eval_QTY": {
362
+ "f1": 0.9815493055075669,
363
+ "number": 7189,
364
+ "precision": 0.9752815160670145,
365
+ "recall": 0.9878981777715955
366
+ },
367
+ "eval_RANGE_END": {
368
+ "f1": 0.7706422018348623,
369
+ "number": 92,
370
+ "precision": 0.6666666666666666,
371
+ "recall": 0.9130434782608695
372
+ },
373
+ "eval_UNIT": {
374
+ "f1": 0.9498936622713738,
375
+ "number": 5732,
376
+ "precision": 0.9269467043001827,
377
+ "recall": 0.9740055826936497
378
+ },
379
+ "eval_loss": 0.5030972361564636,
380
+ "eval_overall_accuracy": 0.8199370329628646,
381
+ "eval_overall_f1": 0.8351003758828189,
382
+ "eval_overall_precision": 0.8107082078806126,
383
+ "eval_overall_recall": 0.8610058739703174,
384
+ "eval_runtime": 7.9063,
385
+ "eval_samples_per_second": 1075.848,
386
+ "eval_steps_per_second": 33.644,
387
+ "step": 7000
388
+ },
389
+ {
390
+ "epoch": 1.48,
391
+ "learning_rate": 4.257572757869729e-05,
392
+ "loss": 0.5027,
393
+ "step": 7500
394
+ },
395
+ {
396
+ "epoch": 1.58,
397
+ "learning_rate": 4.208077608394378e-05,
398
+ "loss": 0.492,
399
+ "step": 8000
400
+ },
401
+ {
402
+ "epoch": 1.58,
403
+ "eval_COMMENT": {
404
+ "f1": 0.6769068494956819,
405
+ "number": 6901,
406
+ "precision": 0.6209482341557814,
407
+ "recall": 0.743950152151862
408
+ },
409
+ "eval_NAME": {
410
+ "f1": 0.7926012072880323,
411
+ "number": 8857,
412
+ "precision": 0.7778260869565218,
413
+ "recall": 0.8079485152986339
414
+ },
415
+ "eval_QTY": {
416
+ "f1": 0.9821801475706529,
417
+ "number": 7189,
418
+ "precision": 0.983001254005852,
419
+ "recall": 0.9813604117401585
420
+ },
421
+ "eval_RANGE_END": {
422
+ "f1": 0.7685589519650656,
423
+ "number": 92,
424
+ "precision": 0.6423357664233577,
425
+ "recall": 0.9565217391304348
426
+ },
427
+ "eval_UNIT": {
428
+ "f1": 0.9496828752642706,
429
+ "number": 5732,
430
+ "precision": 0.9215493188905302,
431
+ "recall": 0.9795882763433357
432
+ },
433
+ "eval_loss": 0.5041355490684509,
434
+ "eval_overall_accuracy": 0.8246216287979365,
435
+ "eval_overall_f1": 0.8398886765248299,
436
+ "eval_overall_precision": 0.8112712550607287,
437
+ "eval_overall_recall": 0.8705988669146015,
438
+ "eval_runtime": 9.0062,
439
+ "eval_samples_per_second": 944.457,
440
+ "eval_steps_per_second": 29.535,
441
+ "step": 8000
442
+ },
443
+ {
444
+ "epoch": 1.68,
445
+ "learning_rate": 4.158582458919026e-05,
446
+ "loss": 0.4939,
447
+ "step": 8500
448
+ },
449
+ {
450
+ "epoch": 1.78,
451
+ "learning_rate": 4.109087309443675e-05,
452
+ "loss": 0.4817,
453
+ "step": 9000
454
+ },
455
+ {
456
+ "epoch": 1.78,
457
+ "eval_COMMENT": {
458
+ "f1": 0.6750676255195619,
459
+ "number": 6901,
460
+ "precision": 0.6196705426356589,
461
+ "recall": 0.7413418345167367
462
+ },
463
+ "eval_NAME": {
464
+ "f1": 0.8006897702620014,
465
+ "number": 8857,
466
+ "precision": 0.7891447368421053,
467
+ "recall": 0.8125776222197132
468
+ },
469
+ "eval_QTY": {
470
+ "f1": 0.9833679833679833,
471
+ "number": 7189,
472
+ "precision": 0.9798370390829996,
473
+ "recall": 0.9869244679371262
474
+ },
475
+ "eval_RANGE_END": {
476
+ "f1": 0.7792207792207793,
477
+ "number": 92,
478
+ "precision": 0.6474820143884892,
479
+ "recall": 0.9782608695652174
480
+ },
481
+ "eval_UNIT": {
482
+ "f1": 0.9505083606419629,
483
+ "number": 5732,
484
+ "precision": 0.9168422758956071,
485
+ "recall": 0.9867411025819958
486
+ },
487
+ "eval_loss": 0.4901449382305145,
488
+ "eval_overall_accuracy": 0.8292872586579676,
489
+ "eval_overall_f1": 0.8427365317609219,
490
+ "eval_overall_precision": 0.8133872271624899,
491
+ "eval_overall_recall": 0.8742831323207396,
492
+ "eval_runtime": 9.1291,
493
+ "eval_samples_per_second": 931.746,
494
+ "eval_steps_per_second": 29.138,
495
+ "step": 9000
496
+ },
497
+ {
498
+ "epoch": 1.88,
499
+ "learning_rate": 4.059592159968323e-05,
500
+ "loss": 0.4903,
501
+ "step": 9500
502
+ },
503
+ {
504
+ "epoch": 1.98,
505
+ "learning_rate": 4.010097010492972e-05,
506
+ "loss": 0.4905,
507
+ "step": 10000
508
+ },
509
+ {
510
+ "epoch": 1.98,
511
+ "eval_COMMENT": {
512
+ "f1": 0.6778359049069598,
513
+ "number": 6901,
514
+ "precision": 0.6241463414634146,
515
+ "recall": 0.7416316475873062
516
+ },
517
+ "eval_NAME": {
518
+ "f1": 0.8002232142857143,
519
+ "number": 8857,
520
+ "precision": 0.7911287653095002,
521
+ "recall": 0.8095291859546122
522
+ },
523
+ "eval_QTY": {
524
+ "f1": 0.9842749791260784,
525
+ "number": 7189,
526
+ "precision": 0.9846860643185299,
527
+ "recall": 0.983864237028794
528
+ },
529
+ "eval_RANGE_END": {
530
+ "f1": 0.789237668161435,
531
+ "number": 92,
532
+ "precision": 0.6717557251908397,
533
+ "recall": 0.9565217391304348
534
+ },
535
+ "eval_UNIT": {
536
+ "f1": 0.9502270052127123,
537
+ "number": 5732,
538
+ "precision": 0.9170723790976956,
539
+ "recall": 0.9858688066992324
540
+ },
541
+ "eval_loss": 0.4891791045665741,
542
+ "eval_overall_accuracy": 0.8287751773318667,
543
+ "eval_overall_f1": 0.8435557049235421,
544
+ "eval_overall_precision": 0.8165522625980025,
545
+ "eval_overall_recall": 0.8724062423968579,
546
+ "eval_runtime": 6.9634,
547
+ "eval_samples_per_second": 1221.536,
548
+ "eval_steps_per_second": 38.2,
549
+ "step": 10000
550
+ },
551
+ {
552
+ "epoch": 2.08,
553
+ "learning_rate": 3.9606018610176205e-05,
554
+ "loss": 0.4804,
555
+ "step": 10500
556
+ },
557
+ {
558
+ "epoch": 2.18,
559
+ "learning_rate": 3.911106711542269e-05,
560
+ "loss": 0.4757,
561
+ "step": 11000
562
+ },
563
+ {
564
+ "epoch": 2.18,
565
+ "eval_COMMENT": {
566
+ "f1": 0.6788539520042544,
567
+ "number": 6901,
568
+ "precision": 0.6271186440677966,
569
+ "recall": 0.7398927691638892
570
+ },
571
+ "eval_NAME": {
572
+ "f1": 0.802429240026744,
573
+ "number": 8857,
574
+ "precision": 0.7921020789792103,
575
+ "recall": 0.8130292424071356
576
+ },
577
+ "eval_QTY": {
578
+ "f1": 0.9835042971998891,
579
+ "number": 7189,
580
+ "precision": 0.9801077496891836,
581
+ "recall": 0.9869244679371262
582
+ },
583
+ "eval_RANGE_END": {
584
+ "f1": 0.7758620689655172,
585
+ "number": 92,
586
+ "precision": 0.6428571428571429,
587
+ "recall": 0.9782608695652174
588
+ },
589
+ "eval_UNIT": {
590
+ "f1": 0.9515842839036756,
591
+ "number": 5732,
592
+ "precision": 0.9226609864001311,
593
+ "recall": 0.9823796231681786
594
+ },
595
+ "eval_loss": 0.4953509271144867,
596
+ "eval_overall_accuracy": 0.8274285931039714,
597
+ "eval_overall_f1": 0.844669333960932,
598
+ "eval_overall_precision": 0.8179391176949373,
599
+ "eval_overall_recall": 0.8732056584755483,
600
+ "eval_runtime": 8.0512,
601
+ "eval_samples_per_second": 1056.487,
602
+ "eval_steps_per_second": 33.039,
603
+ "step": 11000
604
+ },
605
+ {
606
+ "epoch": 2.28,
607
+ "learning_rate": 3.861611562066917e-05,
608
+ "loss": 0.4856,
609
+ "step": 11500
610
+ },
611
+ {
612
+ "epoch": 2.38,
613
+ "learning_rate": 3.812116412591566e-05,
614
+ "loss": 0.4691,
615
+ "step": 12000
616
+ },
617
+ {
618
+ "epoch": 2.38,
619
+ "eval_COMMENT": {
620
+ "f1": 0.6842557693579316,
621
+ "number": 6901,
622
+ "precision": 0.6292872780345414,
623
+ "recall": 0.7497464135632517
624
+ },
625
+ "eval_NAME": {
626
+ "f1": 0.803944509443423,
627
+ "number": 8857,
628
+ "precision": 0.7935547734271887,
629
+ "recall": 0.8146099130631139
630
+ },
631
+ "eval_QTY": {
632
+ "f1": 0.984621778886118,
633
+ "number": 7189,
634
+ "precision": 0.9806816613771215,
635
+ "recall": 0.9885936847962165
636
+ },
637
+ "eval_RANGE_END": {
638
+ "f1": 0.780701754385965,
639
+ "number": 92,
640
+ "precision": 0.6544117647058824,
641
+ "recall": 0.967391304347826
642
+ },
643
+ "eval_UNIT": {
644
+ "f1": 0.9528556944913822,
645
+ "number": 5732,
646
+ "precision": 0.9238204456094364,
647
+ "recall": 0.9837752965806001
648
+ },
649
+ "eval_loss": 0.4902682304382324,
650
+ "eval_overall_accuracy": 0.8301407275348026,
651
+ "eval_overall_f1": 0.84684079769019,
652
+ "eval_overall_precision": 0.818934450180189,
653
+ "eval_overall_recall": 0.8767161377776233,
654
+ "eval_runtime": 8.9123,
655
+ "eval_samples_per_second": 954.413,
656
+ "eval_steps_per_second": 29.846,
657
+ "step": 12000
658
+ },
659
+ {
660
+ "epoch": 2.47,
661
+ "learning_rate": 3.762621263116215e-05,
662
+ "loss": 0.4806,
663
+ "step": 12500
664
+ },
665
+ {
666
+ "epoch": 2.57,
667
+ "learning_rate": 3.7131261136408633e-05,
668
+ "loss": 0.4765,
669
+ "step": 13000
670
+ },
671
+ {
672
+ "epoch": 2.57,
673
+ "eval_COMMENT": {
674
+ "f1": 0.6893633899649634,
675
+ "number": 6901,
676
+ "precision": 0.6338439095550693,
677
+ "recall": 0.7555426749746413
678
+ },
679
+ "eval_NAME": {
680
+ "f1": 0.805656475322788,
681
+ "number": 8857,
682
+ "precision": 0.7977640026566305,
683
+ "recall": 0.8137066726882691
684
+ },
685
+ "eval_QTY": {
686
+ "f1": 0.9841977027497391,
687
+ "number": 7189,
688
+ "precision": 0.9850891861761427,
689
+ "recall": 0.9833078314090973
690
+ },
691
+ "eval_RANGE_END": {
692
+ "f1": 0.7777777777777777,
693
+ "number": 92,
694
+ "precision": 0.6774193548387096,
695
+ "recall": 0.9130434782608695
696
+ },
697
+ "eval_UNIT": {
698
+ "f1": 0.9518021440027011,
699
+ "number": 5732,
700
+ "precision": 0.9219950940310712,
701
+ "recall": 0.9836008374040475
702
+ },
703
+ "eval_loss": 0.4845636188983917,
704
+ "eval_overall_accuracy": 0.8307097067860258,
705
+ "eval_overall_f1": 0.8482320088820106,
706
+ "eval_overall_precision": 0.8219070904645477,
707
+ "eval_overall_recall": 0.8762990511278718,
708
+ "eval_runtime": 6.7092,
709
+ "eval_samples_per_second": 1267.814,
710
+ "eval_steps_per_second": 39.647,
711
+ "step": 13000
712
+ },
713
+ {
714
+ "epoch": 2.67,
715
+ "learning_rate": 3.663630964165512e-05,
716
+ "loss": 0.4715,
717
+ "step": 13500
718
+ },
719
+ {
720
+ "epoch": 2.77,
721
+ "learning_rate": 3.6141358146901606e-05,
722
+ "loss": 0.4747,
723
+ "step": 14000
724
+ },
725
+ {
726
+ "epoch": 2.77,
727
+ "eval_COMMENT": {
728
+ "f1": 0.6842317515795134,
729
+ "number": 6901,
730
+ "precision": 0.6380844929171368,
731
+ "recall": 0.7375742645993334
732
+ },
733
+ "eval_NAME": {
734
+ "f1": 0.8026484170700496,
735
+ "number": 8857,
736
+ "precision": 0.791246160596753,
737
+ "recall": 0.8143841029694028
738
+ },
739
+ "eval_QTY": {
740
+ "f1": 0.9847090569431951,
741
+ "number": 7189,
742
+ "precision": 0.9796255506607929,
743
+ "recall": 0.9898455974405341
744
+ },
745
+ "eval_RANGE_END": {
746
+ "f1": 0.7878787878787878,
747
+ "number": 92,
748
+ "precision": 0.6546762589928058,
749
+ "recall": 0.9891304347826086
750
+ },
751
+ "eval_UNIT": {
752
+ "f1": 0.9519481612387444,
753
+ "number": 5732,
754
+ "precision": 0.9195252804422045,
755
+ "recall": 0.9867411025819958
756
+ },
757
+ "eval_loss": 0.4844052493572235,
758
+ "eval_overall_accuracy": 0.8314304138375754,
759
+ "eval_overall_f1": 0.8470833754081255,
760
+ "eval_overall_precision": 0.8211570463666917,
761
+ "eval_overall_recall": 0.8747002189704911,
762
+ "eval_runtime": 8.8562,
763
+ "eval_samples_per_second": 960.458,
764
+ "eval_steps_per_second": 30.035,
765
+ "step": 14000
766
+ },
767
+ {
768
+ "epoch": 2.87,
769
+ "learning_rate": 3.564640665214809e-05,
770
+ "loss": 0.4673,
771
+ "step": 14500
772
+ },
773
+ {
774
+ "epoch": 2.97,
775
+ "learning_rate": 3.515145515739457e-05,
776
+ "loss": 0.4654,
777
+ "step": 15000
778
+ },
779
+ {
780
+ "epoch": 2.97,
781
+ "eval_COMMENT": {
782
+ "f1": 0.6951928862739855,
783
+ "number": 6901,
784
+ "precision": 0.6453574975173784,
785
+ "recall": 0.7533690769453703
786
+ },
787
+ "eval_NAME": {
788
+ "f1": 0.8027195720017833,
789
+ "number": 8857,
790
+ "precision": 0.7925608011444921,
791
+ "recall": 0.8131421474539912
792
+ },
793
+ "eval_QTY": {
794
+ "f1": 0.9852237252861602,
795
+ "number": 7189,
796
+ "precision": 0.9827013562136728,
797
+ "recall": 0.9877590763666713
798
+ },
799
+ "eval_RANGE_END": {
800
+ "f1": 0.7802690582959643,
801
+ "number": 92,
802
+ "precision": 0.6641221374045801,
803
+ "recall": 0.9456521739130435
804
+ },
805
+ "eval_UNIT": {
806
+ "f1": 0.9533801506049582,
807
+ "number": 5732,
808
+ "precision": 0.9255791030064071,
809
+ "recall": 0.9829030006978368
810
+ },
811
+ "eval_loss": 0.48082008957862854,
812
+ "eval_overall_accuracy": 0.8331752835413269,
813
+ "eval_overall_f1": 0.8498601704909194,
814
+ "eval_overall_precision": 0.8246313793441659,
815
+ "eval_overall_recall": 0.8766813805568107,
816
+ "eval_runtime": 7.2911,
817
+ "eval_samples_per_second": 1166.621,
818
+ "eval_steps_per_second": 36.483,
819
+ "step": 15000
820
+ },
821
+ {
822
+ "epoch": 3.07,
823
+ "learning_rate": 3.465650366264107e-05,
824
+ "loss": 0.4573,
825
+ "step": 15500
826
+ },
827
+ {
828
+ "epoch": 3.17,
829
+ "learning_rate": 3.416155216788755e-05,
830
+ "loss": 0.4586,
831
+ "step": 16000
832
+ },
833
+ {
834
+ "epoch": 3.17,
835
+ "eval_COMMENT": {
836
+ "f1": 0.6976900801400768,
837
+ "number": 6901,
838
+ "precision": 0.6517362858580775,
839
+ "recall": 0.7506158527749601
840
+ },
841
+ "eval_NAME": {
842
+ "f1": 0.8010911317708622,
843
+ "number": 8857,
844
+ "precision": 0.7901383703052932,
845
+ "recall": 0.812351812126002
846
+ },
847
+ "eval_QTY": {
848
+ "f1": 0.9851262538913871,
849
+ "number": 7189,
850
+ "precision": 0.979906413432425,
851
+ "recall": 0.990402003060231
852
+ },
853
+ "eval_RANGE_END": {
854
+ "f1": 0.7802690582959643,
855
+ "number": 92,
856
+ "precision": 0.6641221374045801,
857
+ "recall": 0.9456521739130435
858
+ },
859
+ "eval_UNIT": {
860
+ "f1": 0.9516034003871727,
861
+ "number": 5732,
862
+ "precision": 0.9193364774760123,
863
+ "recall": 0.9862177250523377
864
+ },
865
+ "eval_loss": 0.48265689611434937,
866
+ "eval_overall_accuracy": 0.8316959374881463,
867
+ "eval_overall_f1": 0.8500783210658401,
868
+ "eval_overall_precision": 0.824673202614379,
869
+ "eval_overall_recall": 0.8770984672065621,
870
+ "eval_runtime": 9.1659,
871
+ "eval_samples_per_second": 928.008,
872
+ "eval_steps_per_second": 29.021,
873
+ "step": 16000
874
+ },
875
+ {
876
+ "epoch": 3.27,
877
+ "learning_rate": 3.3666600673134034e-05,
878
+ "loss": 0.4591,
879
+ "step": 16500
880
+ },
881
+ {
882
+ "epoch": 3.37,
883
+ "learning_rate": 3.317164917838052e-05,
884
+ "loss": 0.4612,
885
+ "step": 17000
886
+ },
887
+ {
888
+ "epoch": 3.37,
889
+ "eval_COMMENT": {
890
+ "f1": 0.6966127636920211,
891
+ "number": 6901,
892
+ "precision": 0.6441053408811224,
893
+ "recall": 0.7584408056803362
894
+ },
895
+ "eval_NAME": {
896
+ "f1": 0.7990913120567377,
897
+ "number": 8857,
898
+ "precision": 0.7845718637797846,
899
+ "recall": 0.8141582928756915
900
+ },
901
+ "eval_QTY": {
902
+ "f1": 0.9846325012168833,
903
+ "number": 7189,
904
+ "precision": 0.9844271412680756,
905
+ "recall": 0.9848379468632633
906
+ },
907
+ "eval_RANGE_END": {
908
+ "f1": 0.7802690582959643,
909
+ "number": 92,
910
+ "precision": 0.6641221374045801,
911
+ "recall": 0.9456521739130435
912
+ },
913
+ "eval_UNIT": {
914
+ "f1": 0.9502140878179833,
915
+ "number": 5732,
916
+ "precision": 0.9158439877002751,
917
+ "recall": 0.9872644801116539
918
+ },
919
+ "eval_loss": 0.4868798851966858,
920
+ "eval_overall_accuracy": 0.8307666047111482,
921
+ "eval_overall_f1": 0.8481624433629804,
922
+ "eval_overall_precision": 0.8199811804406373,
923
+ "eval_overall_recall": 0.8783497271558166,
924
+ "eval_runtime": 7.3722,
925
+ "eval_samples_per_second": 1153.794,
926
+ "eval_steps_per_second": 36.081,
927
+ "step": 17000
928
+ },
929
+ {
930
+ "epoch": 3.46,
931
+ "learning_rate": 3.267669768362701e-05,
932
+ "loss": 0.4592,
933
+ "step": 17500
934
+ },
935
+ {
936
+ "epoch": 3.56,
937
+ "learning_rate": 3.218174618887349e-05,
938
+ "loss": 0.4546,
939
+ "step": 18000
940
+ },
941
+ {
942
+ "epoch": 3.56,
943
+ "eval_COMMENT": {
944
+ "f1": 0.6903326332904275,
945
+ "number": 6901,
946
+ "precision": 0.6482188295165394,
947
+ "recall": 0.7382987972757571
948
+ },
949
+ "eval_NAME": {
950
+ "f1": 0.8029488387561666,
951
+ "number": 8857,
952
+ "precision": 0.788654181184669,
953
+ "recall": 0.8177712543750706
954
+ },
955
+ "eval_QTY": {
956
+ "f1": 0.9853083853083853,
957
+ "number": 7189,
958
+ "precision": 0.9817704736914791,
959
+ "recall": 0.9888718876060648
960
+ },
961
+ "eval_RANGE_END": {
962
+ "f1": 0.787037037037037,
963
+ "number": 92,
964
+ "precision": 0.6854838709677419,
965
+ "recall": 0.9239130434782609
966
+ },
967
+ "eval_UNIT": {
968
+ "f1": 0.9534019922336655,
969
+ "number": 5732,
970
+ "precision": 0.9236179260713118,
971
+ "recall": 0.9851709699930217
972
+ },
973
+ "eval_loss": 0.480613112449646,
974
+ "eval_overall_accuracy": 0.8314683457876569,
975
+ "eval_overall_f1": 0.8492933517725234,
976
+ "eval_overall_precision": 0.8249189136061331,
977
+ "eval_overall_recall": 0.8751520628410552,
978
+ "eval_runtime": 8.0402,
979
+ "eval_samples_per_second": 1057.931,
980
+ "eval_steps_per_second": 33.084,
981
+ "step": 18000
982
+ },
983
+ {
984
+ "epoch": 3.66,
985
+ "learning_rate": 3.168679469411997e-05,
986
+ "loss": 0.4609,
987
+ "step": 18500
988
+ },
989
+ {
990
+ "epoch": 3.76,
991
+ "learning_rate": 3.119184319936647e-05,
992
+ "loss": 0.4471,
993
+ "step": 19000
994
+ },
995
+ {
996
+ "epoch": 3.76,
997
+ "eval_COMMENT": {
998
+ "f1": 0.6993611924407772,
999
+ "number": 6901,
1000
+ "precision": 0.6466100652147164,
1001
+ "recall": 0.7614838429213158
1002
+ },
1003
+ "eval_NAME": {
1004
+ "f1": 0.8037861915367484,
1005
+ "number": 8857,
1006
+ "precision": 0.7929254092057564,
1007
+ "recall": 0.8149486282036807
1008
+ },
1009
+ "eval_QTY": {
1010
+ "f1": 0.9852052510939778,
1011
+ "number": 7189,
1012
+ "precision": 0.983906770255272,
1013
+ "recall": 0.9865071637223536
1014
+ },
1015
+ "eval_RANGE_END": {
1016
+ "f1": 0.7927927927927929,
1017
+ "number": 92,
1018
+ "precision": 0.676923076923077,
1019
+ "recall": 0.9565217391304348
1020
+ },
1021
+ "eval_UNIT": {
1022
+ "f1": 0.9520276536548351,
1023
+ "number": 5732,
1024
+ "precision": 0.9211943220753793,
1025
+ "recall": 0.984996510816469
1026
+ },
1027
+ "eval_loss": 0.4822600483894348,
1028
+ "eval_overall_accuracy": 0.8327769980654706,
1029
+ "eval_overall_f1": 0.8508441514764242,
1030
+ "eval_overall_precision": 0.8241521972831222,
1031
+ "eval_overall_recall": 0.87932292933857,
1032
+ "eval_runtime": 8.7949,
1033
+ "eval_samples_per_second": 967.151,
1034
+ "eval_steps_per_second": 30.245,
1035
+ "step": 19000
1036
+ },
1037
+ {
1038
+ "epoch": 3.86,
1039
+ "learning_rate": 3.069689170461295e-05,
1040
+ "loss": 0.4581,
1041
+ "step": 19500
1042
+ },
1043
+ {
1044
+ "epoch": 3.96,
1045
+ "learning_rate": 3.0201940209859435e-05,
1046
+ "loss": 0.4542,
1047
+ "step": 20000
1048
+ },
1049
+ {
1050
+ "epoch": 3.96,
1051
+ "eval_COMMENT": {
1052
+ "f1": 0.6950766529344229,
1053
+ "number": 6901,
1054
+ "precision": 0.6508980521123198,
1055
+ "recall": 0.7456890305752789
1056
+ },
1057
+ "eval_NAME": {
1058
+ "f1": 0.7992666259236624,
1059
+ "number": 8857,
1060
+ "precision": 0.7868081382629621,
1061
+ "recall": 0.8121260020322908
1062
+ },
1063
+ "eval_QTY": {
1064
+ "f1": 0.9853604384930272,
1065
+ "number": 7189,
1066
+ "precision": 0.9829734219269103,
1067
+ "recall": 0.9877590763666713
1068
+ },
1069
+ "eval_RANGE_END": {
1070
+ "f1": 0.7873303167420815,
1071
+ "number": 92,
1072
+ "precision": 0.6744186046511628,
1073
+ "recall": 0.9456521739130435
1074
+ },
1075
+ "eval_UNIT": {
1076
+ "f1": 0.9524210526315788,
1077
+ "number": 5732,
1078
+ "precision": 0.920559986977047,
1079
+ "recall": 0.9865666434054431
1080
+ },
1081
+ "eval_loss": 0.47578319907188416,
1082
+ "eval_overall_accuracy": 0.832568372340022,
1083
+ "eval_overall_f1": 0.8490938211245047,
1084
+ "eval_overall_precision": 0.8244499738082766,
1085
+ "eval_overall_recall": 0.875256334503493,
1086
+ "eval_runtime": 6.7831,
1087
+ "eval_samples_per_second": 1253.998,
1088
+ "eval_steps_per_second": 39.215,
1089
+ "step": 20000
1090
+ },
1091
+ {
1092
+ "epoch": 4.06,
1093
+ "learning_rate": 2.970698871510592e-05,
1094
+ "loss": 0.4454,
1095
+ "step": 20500
1096
+ },
1097
+ {
1098
+ "epoch": 4.16,
1099
+ "learning_rate": 2.9212037220352405e-05,
1100
+ "loss": 0.4452,
1101
+ "step": 21000
1102
+ },
1103
+ {
1104
+ "epoch": 4.16,
1105
+ "eval_COMMENT": {
1106
+ "f1": 0.6982899022801302,
1107
+ "number": 6901,
1108
+ "precision": 0.6566687938736439,
1109
+ "recall": 0.7455441240399941
1110
+ },
1111
+ "eval_NAME": {
1112
+ "f1": 0.7992468294844105,
1113
+ "number": 8857,
1114
+ "precision": 0.7843478260869565,
1115
+ "recall": 0.8147228181099695
1116
+ },
1117
+ "eval_QTY": {
1118
+ "f1": 0.9847455276660656,
1119
+ "number": 7189,
1120
+ "precision": 0.981750311074243,
1121
+ "recall": 0.9877590763666713
1122
+ },
1123
+ "eval_RANGE_END": {
1124
+ "f1": 0.787037037037037,
1125
+ "number": 92,
1126
+ "precision": 0.6854838709677419,
1127
+ "recall": 0.9239130434782609
1128
+ },
1129
+ "eval_UNIT": {
1130
+ "f1": 0.9537733457280487,
1131
+ "number": 5732,
1132
+ "precision": 0.9249303392886412,
1133
+ "recall": 0.9844731332868109
1134
+ },
1135
+ "eval_loss": 0.48325347900390625,
1136
+ "eval_overall_accuracy": 0.8338959905928763,
1137
+ "eval_overall_f1": 0.8500944924406048,
1138
+ "eval_overall_precision": 0.8260912340537172,
1139
+ "eval_overall_recall": 0.8755343922699941,
1140
+ "eval_runtime": 9.0461,
1141
+ "eval_samples_per_second": 940.291,
1142
+ "eval_steps_per_second": 29.405,
1143
+ "step": 21000
1144
+ },
1145
+ {
1146
+ "epoch": 4.26,
1147
+ "learning_rate": 2.871708572559889e-05,
1148
+ "loss": 0.4217,
1149
+ "step": 21500
1150
+ },
1151
+ {
1152
+ "epoch": 4.36,
1153
+ "learning_rate": 2.8222134230845377e-05,
1154
+ "loss": 0.4412,
1155
+ "step": 22000
1156
+ },
1157
+ {
1158
+ "epoch": 4.36,
1159
+ "eval_COMMENT": {
1160
+ "f1": 0.6974386700006758,
1161
+ "number": 6901,
1162
+ "precision": 0.6534954407294833,
1163
+ "recall": 0.7477177220692653
1164
+ },
1165
+ "eval_NAME": {
1166
+ "f1": 0.8008429926238145,
1167
+ "number": 8857,
1168
+ "precision": 0.7870067582297798,
1169
+ "recall": 0.8151744382973919
1170
+ },
1171
+ "eval_QTY": {
1172
+ "f1": 0.9858392336526447,
1173
+ "number": 7189,
1174
+ "precision": 0.9839268394069558,
1175
+ "recall": 0.9877590763666713
1176
+ },
1177
+ "eval_RANGE_END": {
1178
+ "f1": 0.789237668161435,
1179
+ "number": 92,
1180
+ "precision": 0.6717557251908397,
1181
+ "recall": 0.9565217391304348
1182
+ },
1183
+ "eval_UNIT": {
1184
+ "f1": 0.9540462916033113,
1185
+ "number": 5732,
1186
+ "precision": 0.9248280379954144,
1187
+ "recall": 0.9851709699930217
1188
+ },
1189
+ "eval_loss": 0.4888293445110321,
1190
+ "eval_overall_accuracy": 0.8325494063649812,
1191
+ "eval_overall_f1": 0.8505270258875117,
1192
+ "eval_overall_precision": 0.8261040492727034,
1193
+ "eval_overall_recall": 0.8764380800111223,
1194
+ "eval_runtime": 6.5585,
1195
+ "eval_samples_per_second": 1296.944,
1196
+ "eval_steps_per_second": 40.558,
1197
+ "step": 22000
1198
+ },
1199
+ {
1200
+ "epoch": 4.45,
1201
+ "learning_rate": 2.7727182736091867e-05,
1202
+ "loss": 0.4481,
1203
+ "step": 22500
1204
+ },
1205
+ {
1206
+ "epoch": 4.55,
1207
+ "learning_rate": 2.7232231241338353e-05,
1208
+ "loss": 0.4423,
1209
+ "step": 23000
1210
+ },
1211
+ {
1212
+ "epoch": 4.55,
1213
+ "eval_COMMENT": {
1214
+ "f1": 0.6981985021253626,
1215
+ "number": 6901,
1216
+ "precision": 0.6532828282828282,
1217
+ "recall": 0.7497464135632517
1218
+ },
1219
+ "eval_NAME": {
1220
+ "f1": 0.8019725177304966,
1221
+ "number": 8857,
1222
+ "precision": 0.7874007180937874,
1223
+ "recall": 0.817093824093937
1224
+ },
1225
+ "eval_QTY": {
1226
+ "f1": 0.9857043719639139,
1227
+ "number": 7189,
1228
+ "precision": 0.9835202880487467,
1229
+ "recall": 0.9878981777715955
1230
+ },
1231
+ "eval_RANGE_END": {
1232
+ "f1": 0.7999999999999999,
1233
+ "number": 92,
1234
+ "precision": 0.6766917293233082,
1235
+ "recall": 0.9782608695652174
1236
+ },
1237
+ "eval_UNIT": {
1238
+ "f1": 0.9548452562151193,
1239
+ "number": 5732,
1240
+ "precision": 0.9264850672792911,
1241
+ "recall": 0.984996510816469
1242
+ },
1243
+ "eval_loss": 0.4827423095703125,
1244
+ "eval_overall_accuracy": 0.8337821947426317,
1245
+ "eval_overall_f1": 0.8511377043654138,
1246
+ "eval_overall_precision": 0.8262377695605223,
1247
+ "eval_overall_recall": 0.8775850682979389,
1248
+ "eval_runtime": 8.9572,
1249
+ "eval_samples_per_second": 949.629,
1250
+ "eval_steps_per_second": 29.697,
1251
+ "step": 23000
1252
+ },
1253
+ {
1254
+ "epoch": 4.65,
1255
+ "learning_rate": 2.6737279746584836e-05,
1256
+ "loss": 0.4519,
1257
+ "step": 23500
1258
+ },
1259
+ {
1260
+ "epoch": 4.75,
1261
+ "learning_rate": 2.6242328251831323e-05,
1262
+ "loss": 0.4507,
1263
+ "step": 24000
1264
+ },
1265
+ {
1266
+ "epoch": 4.75,
1267
+ "eval_COMMENT": {
1268
+ "f1": 0.69833923223523,
1269
+ "number": 6901,
1270
+ "precision": 0.6584520600693108,
1271
+ "recall": 0.7433705260107231
1272
+ },
1273
+ "eval_NAME": {
1274
+ "f1": 0.8048291977300545,
1275
+ "number": 8857,
1276
+ "precision": 0.7933530766699572,
1277
+ "recall": 0.8166422039065147
1278
+ },
1279
+ "eval_QTY": {
1280
+ "f1": 0.9856135011758197,
1281
+ "number": 7189,
1282
+ "precision": 0.9801898472967395,
1283
+ "recall": 0.9910975100848518
1284
+ },
1285
+ "eval_RANGE_END": {
1286
+ "f1": 0.7837837837837838,
1287
+ "number": 92,
1288
+ "precision": 0.6692307692307692,
1289
+ "recall": 0.9456521739130435
1290
+ },
1291
+ "eval_UNIT": {
1292
+ "f1": 0.9537942664418213,
1293
+ "number": 5732,
1294
+ "precision": 0.922976501305483,
1295
+ "recall": 0.9867411025819958
1296
+ },
1297
+ "eval_loss": 0.474032998085022,
1298
+ "eval_overall_accuracy": 0.8347115275196297,
1299
+ "eval_overall_f1": 0.8523122656487518,
1300
+ "eval_overall_precision": 0.8290126499096435,
1301
+ "eval_overall_recall": 0.8769594383233117,
1302
+ "eval_runtime": 7.5421,
1303
+ "eval_samples_per_second": 1127.8,
1304
+ "eval_steps_per_second": 35.269,
1305
+ "step": 24000
1306
+ },
1307
+ {
1308
+ "epoch": 4.85,
1309
+ "learning_rate": 2.5747376757077806e-05,
1310
+ "loss": 0.4377,
1311
+ "step": 24500
1312
+ },
1313
+ {
1314
+ "epoch": 4.95,
1315
+ "learning_rate": 2.5252425262324292e-05,
1316
+ "loss": 0.4452,
1317
+ "step": 25000
1318
+ },
1319
+ {
1320
+ "epoch": 4.95,
1321
+ "eval_COMMENT": {
1322
+ "f1": 0.7040598290598291,
1323
+ "number": 6901,
1324
+ "precision": 0.6528792569659443,
1325
+ "recall": 0.7639472540211564
1326
+ },
1327
+ "eval_NAME": {
1328
+ "f1": 0.8012646292084975,
1329
+ "number": 8857,
1330
+ "precision": 0.7875054513737462,
1331
+ "recall": 0.8155131534379587
1332
+ },
1333
+ "eval_QTY": {
1334
+ "f1": 0.9855775897933713,
1335
+ "number": 7189,
1336
+ "precision": 0.9825798423890502,
1337
+ "recall": 0.9885936847962165
1338
+ },
1339
+ "eval_RANGE_END": {
1340
+ "f1": 0.7727272727272728,
1341
+ "number": 92,
1342
+ "precision": 0.6640625,
1343
+ "recall": 0.9239130434782609
1344
+ },
1345
+ "eval_UNIT": {
1346
+ "f1": 0.953449148254343,
1347
+ "number": 5732,
1348
+ "precision": 0.9227881162259223,
1349
+ "recall": 0.9862177250523377
1350
+ },
1351
+ "eval_loss": 0.4791179597377777,
1352
+ "eval_overall_accuracy": 0.8352236088457308,
1353
+ "eval_overall_f1": 0.8516931350306697,
1354
+ "eval_overall_precision": 0.8244940456823062,
1355
+ "eval_overall_recall": 0.8807479753918876,
1356
+ "eval_runtime": 6.5842,
1357
+ "eval_samples_per_second": 1291.88,
1358
+ "eval_steps_per_second": 40.4,
1359
+ "step": 25000
1360
+ },
1361
+ {
1362
+ "epoch": 5.05,
1363
+ "learning_rate": 2.4757473767570778e-05,
1364
+ "loss": 0.4442,
1365
+ "step": 25500
1366
+ },
1367
+ {
1368
+ "epoch": 5.15,
1369
+ "learning_rate": 2.4262522272817265e-05,
1370
+ "loss": 0.4274,
1371
+ "step": 26000
1372
+ },
1373
+ {
1374
+ "epoch": 5.15,
1375
+ "eval_COMMENT": {
1376
+ "f1": 0.7096947333109694,
1377
+ "number": 6901,
1378
+ "precision": 0.6607946026986506,
1379
+ "recall": 0.766410665120997
1380
+ },
1381
+ "eval_NAME": {
1382
+ "f1": 0.8056639536180176,
1383
+ "number": 8857,
1384
+ "precision": 0.795727342803656,
1385
+ "recall": 0.8158518685785254
1386
+ },
1387
+ "eval_QTY": {
1388
+ "f1": 0.9859017987360232,
1389
+ "number": 7189,
1390
+ "precision": 0.9844660194174757,
1391
+ "recall": 0.9873417721518988
1392
+ },
1393
+ "eval_RANGE_END": {
1394
+ "f1": 0.7962962962962964,
1395
+ "number": 92,
1396
+ "precision": 0.6935483870967742,
1397
+ "recall": 0.9347826086956522
1398
+ },
1399
+ "eval_UNIT": {
1400
+ "f1": 0.9532647207693606,
1401
+ "number": 5732,
1402
+ "precision": 0.9229010127409344,
1403
+ "recall": 0.9856943475226797
1404
+ },
1405
+ "eval_loss": 0.48070788383483887,
1406
+ "eval_overall_accuracy": 0.836058111747525,
1407
+ "eval_overall_f1": 0.854768006474238,
1408
+ "eval_overall_precision": 0.8299990177138928,
1409
+ "eval_overall_recall": 0.8810607903792013,
1410
+ "eval_runtime": 9.3326,
1411
+ "eval_samples_per_second": 911.433,
1412
+ "eval_steps_per_second": 28.502,
1413
+ "step": 26000
1414
+ },
1415
+ {
1416
+ "epoch": 5.25,
1417
+ "learning_rate": 2.376757077806375e-05,
1418
+ "loss": 0.432,
1419
+ "step": 26500
1420
+ },
1421
+ {
1422
+ "epoch": 5.35,
1423
+ "learning_rate": 2.3272619283310237e-05,
1424
+ "loss": 0.4312,
1425
+ "step": 27000
1426
+ },
1427
+ {
1428
+ "epoch": 5.35,
1429
+ "eval_COMMENT": {
1430
+ "f1": 0.7056545830829829,
1431
+ "number": 6901,
1432
+ "precision": 0.6542461005199307,
1433
+ "recall": 0.7658310389798579
1434
+ },
1435
+ "eval_NAME": {
1436
+ "f1": 0.8019135562107137,
1437
+ "number": 8857,
1438
+ "precision": 0.7903508771929825,
1439
+ "recall": 0.8138195777351248
1440
+ },
1441
+ "eval_QTY": {
1442
+ "f1": 0.9852421533984619,
1443
+ "number": 7189,
1444
+ "precision": 0.981501932633904,
1445
+ "recall": 0.989010989010989
1446
+ },
1447
+ "eval_RANGE_END": {
1448
+ "f1": 0.789237668161435,
1449
+ "number": 92,
1450
+ "precision": 0.6717557251908397,
1451
+ "recall": 0.9565217391304348
1452
+ },
1453
+ "eval_UNIT": {
1454
+ "f1": 0.9502391541495343,
1455
+ "number": 5732,
1456
+ "precision": 0.9154405820533549,
1457
+ "recall": 0.9877878576413119
1458
+ },
1459
+ "eval_loss": 0.48605257272720337,
1460
+ "eval_overall_accuracy": 0.83349770511702,
1461
+ "eval_overall_f1": 0.8517865242150884,
1462
+ "eval_overall_precision": 0.8242733597763183,
1463
+ "eval_overall_recall": 0.8811998192624517,
1464
+ "eval_runtime": 7.0035,
1465
+ "eval_samples_per_second": 1214.536,
1466
+ "eval_steps_per_second": 37.981,
1467
+ "step": 27000
1468
+ },
1469
+ {
1470
+ "epoch": 5.44,
1471
+ "learning_rate": 2.2777667788556724e-05,
1472
+ "loss": 0.4321,
1473
+ "step": 27500
1474
+ },
1475
+ {
1476
+ "epoch": 5.54,
1477
+ "learning_rate": 2.2282716293803206e-05,
1478
+ "loss": 0.4315,
1479
+ "step": 28000
1480
+ },
1481
+ {
1482
+ "epoch": 5.54,
1483
+ "eval_COMMENT": {
1484
+ "f1": 0.7045745469244761,
1485
+ "number": 6901,
1486
+ "precision": 0.6583983883152859,
1487
+ "recall": 0.7577162730039124
1488
+ },
1489
+ "eval_NAME": {
1490
+ "f1": 0.8038757099899767,
1491
+ "number": 8857,
1492
+ "precision": 0.7930996593780903,
1493
+ "recall": 0.8149486282036807
1494
+ },
1495
+ "eval_QTY": {
1496
+ "f1": 0.9861322978782415,
1497
+ "number": 7189,
1498
+ "precision": 0.9831328632655882,
1499
+ "recall": 0.9891500904159132
1500
+ },
1501
+ "eval_RANGE_END": {
1502
+ "f1": 0.7909090909090909,
1503
+ "number": 92,
1504
+ "precision": 0.6796875,
1505
+ "recall": 0.9456521739130435
1506
+ },
1507
+ "eval_UNIT": {
1508
+ "f1": 0.9528698872243729,
1509
+ "number": 5732,
1510
+ "precision": 0.9204878048780488,
1511
+ "recall": 0.9876133984647593
1512
+ },
1513
+ "eval_loss": 0.481955349445343,
1514
+ "eval_overall_accuracy": 0.8341235822933657,
1515
+ "eval_overall_f1": 0.8531310577328276,
1516
+ "eval_overall_precision": 0.8282385285069058,
1517
+ "eval_overall_recall": 0.8795662298842585,
1518
+ "eval_runtime": 8.4264,
1519
+ "eval_samples_per_second": 1009.444,
1520
+ "eval_steps_per_second": 31.567,
1521
+ "step": 28000
1522
+ },
1523
+ {
1524
+ "epoch": 5.64,
1525
+ "learning_rate": 2.1787764799049696e-05,
1526
+ "loss": 0.4328,
1527
+ "step": 28500
1528
+ },
1529
+ {
1530
+ "epoch": 5.74,
1531
+ "learning_rate": 2.129281330429618e-05,
1532
+ "loss": 0.4316,
1533
+ "step": 29000
1534
+ },
1535
+ {
1536
+ "epoch": 5.74,
1537
+ "eval_COMMENT": {
1538
+ "f1": 0.7066999527697188,
1539
+ "number": 6901,
1540
+ "precision": 0.6612373737373738,
1541
+ "recall": 0.7588755252861904
1542
+ },
1543
+ "eval_NAME": {
1544
+ "f1": 0.8088874039425326,
1545
+ "number": 8857,
1546
+ "precision": 0.7980441709702231,
1547
+ "recall": 0.8200293553121825
1548
+ },
1549
+ "eval_QTY": {
1550
+ "f1": 0.9862747816442535,
1551
+ "number": 7189,
1552
+ "precision": 0.9830040071852978,
1553
+ "recall": 0.9895673946306858
1554
+ },
1555
+ "eval_RANGE_END": {
1556
+ "f1": 0.7741935483870968,
1557
+ "number": 92,
1558
+ "precision": 0.672,
1559
+ "recall": 0.9130434782608695
1560
+ },
1561
+ "eval_UNIT": {
1562
+ "f1": 0.955117910573916,
1563
+ "number": 5732,
1564
+ "precision": 0.9263813739957371,
1565
+ "recall": 0.9856943475226797
1566
+ },
1567
+ "eval_loss": 0.4761992394924164,
1568
+ "eval_overall_accuracy": 0.836987444524523,
1569
+ "eval_overall_f1": 0.8555853712048336,
1570
+ "eval_overall_precision": 0.8315727314480678,
1571
+ "eval_overall_recall": 0.8810260331583887,
1572
+ "eval_runtime": 8.3244,
1573
+ "eval_samples_per_second": 1021.82,
1574
+ "eval_steps_per_second": 31.954,
1575
+ "step": 29000
1576
+ },
1577
+ {
1578
+ "epoch": 5.84,
1579
+ "learning_rate": 2.0797861809542665e-05,
1580
+ "loss": 0.4429,
1581
+ "step": 29500
1582
+ },
1583
+ {
1584
+ "epoch": 5.94,
1585
+ "learning_rate": 2.0302910314789152e-05,
1586
+ "loss": 0.4278,
1587
+ "step": 30000
1588
+ },
1589
+ {
1590
+ "epoch": 5.94,
1591
+ "eval_COMMENT": {
1592
+ "f1": 0.7081487447979596,
1593
+ "number": 6901,
1594
+ "precision": 0.6596223583843942,
1595
+ "recall": 0.7643819736270105
1596
+ },
1597
+ "eval_NAME": {
1598
+ "f1": 0.8039357385068653,
1599
+ "number": 8857,
1600
+ "precision": 0.7918309242225142,
1601
+ "recall": 0.8164163938128034
1602
+ },
1603
+ "eval_QTY": {
1604
+ "f1": 0.9861265260821309,
1605
+ "number": 7189,
1606
+ "precision": 0.9835339698353397,
1607
+ "recall": 0.9887327862011406
1608
+ },
1609
+ "eval_RANGE_END": {
1610
+ "f1": 0.783410138248848,
1611
+ "number": 92,
1612
+ "precision": 0.68,
1613
+ "recall": 0.9239130434782609
1614
+ },
1615
+ "eval_UNIT": {
1616
+ "f1": 0.9540695710908478,
1617
+ "number": 5732,
1618
+ "precision": 0.9244109947643979,
1619
+ "recall": 0.9856943475226797
1620
+ },
1621
+ "eval_loss": 0.4822809398174286,
1622
+ "eval_overall_accuracy": 0.8347684254447522,
1623
+ "eval_overall_f1": 0.8540192709386161,
1624
+ "eval_overall_precision": 0.8285882391396725,
1625
+ "eval_overall_recall": 0.8810607903792013,
1626
+ "eval_runtime": 6.5281,
1627
+ "eval_samples_per_second": 1302.987,
1628
+ "eval_steps_per_second": 40.747,
1629
+ "step": 30000
1630
+ },
1631
+ {
1632
+ "epoch": 6.04,
1633
+ "learning_rate": 1.9807958820035638e-05,
1634
+ "loss": 0.4251,
1635
+ "step": 30500
1636
+ },
1637
+ {
1638
+ "epoch": 6.14,
1639
+ "learning_rate": 1.9313007325282124e-05,
1640
+ "loss": 0.4211,
1641
+ "step": 31000
1642
+ },
1643
+ {
1644
+ "epoch": 6.14,
1645
+ "eval_COMMENT": {
1646
+ "f1": 0.705458989679522,
1647
+ "number": 6901,
1648
+ "precision": 0.6637281206081512,
1649
+ "recall": 0.7527894508042313
1650
+ },
1651
+ "eval_NAME": {
1652
+ "f1": 0.7998453978245265,
1653
+ "number": 8857,
1654
+ "precision": 0.7826885671061162,
1655
+ "recall": 0.8177712543750706
1656
+ },
1657
+ "eval_QTY": {
1658
+ "f1": 0.9858901646147462,
1659
+ "number": 7189,
1660
+ "precision": 0.9804649883065071,
1661
+ "recall": 0.9913757128947003
1662
+ },
1663
+ "eval_RANGE_END": {
1664
+ "f1": 0.787037037037037,
1665
+ "number": 92,
1666
+ "precision": 0.6854838709677419,
1667
+ "recall": 0.9239130434782609
1668
+ },
1669
+ "eval_UNIT": {
1670
+ "f1": 0.9548103724976772,
1671
+ "number": 5732,
1672
+ "precision": 0.925495333224169,
1673
+ "recall": 0.9860432658757851
1674
+ },
1675
+ "eval_loss": 0.47935572266578674,
1676
+ "eval_overall_accuracy": 0.8356218943215871,
1677
+ "eval_overall_f1": 0.8526081682167409,
1678
+ "eval_overall_precision": 0.8273764755894183,
1679
+ "eval_overall_recall": 0.8794272010010079,
1680
+ "eval_runtime": 9.2091,
1681
+ "eval_samples_per_second": 923.653,
1682
+ "eval_steps_per_second": 28.885,
1683
+ "step": 31000
1684
+ },
1685
+ {
1686
+ "epoch": 6.24,
1687
+ "learning_rate": 1.8818055830528607e-05,
1688
+ "loss": 0.4113,
1689
+ "step": 31500
1690
+ },
1691
+ {
1692
+ "epoch": 6.34,
1693
+ "learning_rate": 1.8323104335775097e-05,
1694
+ "loss": 0.4231,
1695
+ "step": 32000
1696
+ },
1697
+ {
1698
+ "epoch": 6.34,
1699
+ "eval_COMMENT": {
1700
+ "f1": 0.7081927385612093,
1701
+ "number": 6901,
1702
+ "precision": 0.6627510420613869,
1703
+ "recall": 0.7603245906390378
1704
+ },
1705
+ "eval_NAME": {
1706
+ "f1": 0.8008871638480732,
1707
+ "number": 8857,
1708
+ "precision": 0.7868816735672259,
1709
+ "recall": 0.815400248391103
1710
+ },
1711
+ "eval_QTY": {
1712
+ "f1": 0.9866055937261433,
1713
+ "number": 7189,
1714
+ "precision": 0.9844875346260388,
1715
+ "recall": 0.9887327862011406
1716
+ },
1717
+ "eval_RANGE_END": {
1718
+ "f1": 0.8018433179723502,
1719
+ "number": 92,
1720
+ "precision": 0.696,
1721
+ "recall": 0.9456521739130435
1722
+ },
1723
+ "eval_UNIT": {
1724
+ "f1": 0.9542042675212956,
1725
+ "number": 5732,
1726
+ "precision": 0.9235918367346939,
1727
+ "recall": 0.9869155617585486
1728
+ },
1729
+ "eval_loss": 0.4756552577018738,
1730
+ "eval_overall_accuracy": 0.8364374312483405,
1731
+ "eval_overall_f1": 0.8534784953485236,
1732
+ "eval_overall_precision": 0.8284312121707835,
1733
+ "eval_overall_recall": 0.8800875881964478,
1734
+ "eval_runtime": 6.7948,
1735
+ "eval_samples_per_second": 1251.831,
1736
+ "eval_steps_per_second": 39.147,
1737
+ "step": 32000
1738
+ },
1739
+ {
1740
+ "epoch": 6.43,
1741
+ "learning_rate": 1.782815284102158e-05,
1742
+ "loss": 0.4209,
1743
+ "step": 32500
1744
+ },
1745
+ {
1746
+ "epoch": 6.53,
1747
+ "learning_rate": 1.7333201346268066e-05,
1748
+ "loss": 0.4302,
1749
+ "step": 33000
1750
+ },
1751
+ {
1752
+ "epoch": 6.53,
1753
+ "eval_COMMENT": {
1754
+ "f1": 0.706057529610829,
1755
+ "number": 6901,
1756
+ "precision": 0.6624333248666497,
1757
+ "recall": 0.7558324880452109
1758
+ },
1759
+ "eval_NAME": {
1760
+ "f1": 0.8062360801781736,
1761
+ "number": 8857,
1762
+ "precision": 0.7953421948808085,
1763
+ "recall": 0.8174325392345038
1764
+ },
1765
+ "eval_QTY": {
1766
+ "f1": 0.986130374479889,
1767
+ "number": 7189,
1768
+ "precision": 0.9832664914949523,
1769
+ "recall": 0.989010989010989
1770
+ },
1771
+ "eval_RANGE_END": {
1772
+ "f1": 0.7766990291262136,
1773
+ "number": 92,
1774
+ "precision": 0.7017543859649122,
1775
+ "recall": 0.8695652173913043
1776
+ },
1777
+ "eval_UNIT": {
1778
+ "f1": 0.9544303797468354,
1779
+ "number": 5732,
1780
+ "precision": 0.9243216737495914,
1781
+ "recall": 0.9865666434054431
1782
+ },
1783
+ "eval_loss": 0.4785662591457367,
1784
+ "eval_overall_accuracy": 0.8354891324963016,
1785
+ "eval_overall_f1": 0.8546047187178056,
1786
+ "eval_overall_precision": 0.8311760840998685,
1787
+ "eval_overall_recall": 0.8793924437801953,
1788
+ "eval_runtime": 8.3624,
1789
+ "eval_samples_per_second": 1017.166,
1790
+ "eval_steps_per_second": 31.809,
1791
+ "step": 33000
1792
+ },
1793
+ {
1794
+ "epoch": 6.63,
1795
+ "learning_rate": 1.6838249851514553e-05,
1796
+ "loss": 0.4309,
1797
+ "step": 33500
1798
+ },
1799
+ {
1800
+ "epoch": 6.73,
1801
+ "learning_rate": 1.634329835676104e-05,
1802
+ "loss": 0.4223,
1803
+ "step": 34000
1804
+ },
1805
+ {
1806
+ "epoch": 6.73,
1807
+ "eval_COMMENT": {
1808
+ "f1": 0.703981612925032,
1809
+ "number": 6901,
1810
+ "precision": 0.6597820577800304,
1811
+ "recall": 0.7545283292276481
1812
+ },
1813
+ "eval_NAME": {
1814
+ "f1": 0.8044022011005503,
1815
+ "number": 8857,
1816
+ "precision": 0.7922049485439019,
1817
+ "recall": 0.8169809190470814
1818
+ },
1819
+ "eval_QTY": {
1820
+ "f1": 0.986130374479889,
1821
+ "number": 7189,
1822
+ "precision": 0.9832664914949523,
1823
+ "recall": 0.989010989010989
1824
+ },
1825
+ "eval_RANGE_END": {
1826
+ "f1": 0.7981651376146789,
1827
+ "number": 92,
1828
+ "precision": 0.6904761904761905,
1829
+ "recall": 0.9456521739130435
1830
+ },
1831
+ "eval_UNIT": {
1832
+ "f1": 0.9541965415436525,
1833
+ "number": 5732,
1834
+ "precision": 0.923730197615548,
1835
+ "recall": 0.9867411025819958
1836
+ },
1837
+ "eval_loss": 0.4795403480529785,
1838
+ "eval_overall_accuracy": 0.836304669423055,
1839
+ "eval_overall_f1": 0.8534844880813807,
1840
+ "eval_overall_precision": 0.8292139251294828,
1841
+ "eval_overall_recall": 0.8792186576761322,
1842
+ "eval_runtime": 8.6534,
1843
+ "eval_samples_per_second": 982.967,
1844
+ "eval_steps_per_second": 30.739,
1845
+ "step": 34000
1846
+ },
1847
+ {
1848
+ "epoch": 6.83,
1849
+ "learning_rate": 1.5848346862007525e-05,
1850
+ "loss": 0.4119,
1851
+ "step": 34500
1852
+ },
1853
+ {
1854
+ "epoch": 6.93,
1855
+ "learning_rate": 1.535339536725401e-05,
1856
+ "loss": 0.4184,
1857
+ "step": 35000
1858
+ },
1859
+ {
1860
+ "epoch": 6.93,
1861
+ "eval_COMMENT": {
1862
+ "f1": 0.7059539095762654,
1863
+ "number": 6901,
1864
+ "precision": 0.6614741641337386,
1865
+ "recall": 0.7568468337922041
1866
+ },
1867
+ "eval_NAME": {
1868
+ "f1": 0.8020405899966729,
1869
+ "number": 8857,
1870
+ "precision": 0.788057099269914,
1871
+ "recall": 0.8165292988596591
1872
+ },
1873
+ "eval_QTY": {
1874
+ "f1": 0.9865650969529086,
1875
+ "number": 7189,
1876
+ "precision": 0.9823472624465591,
1877
+ "recall": 0.9908193072750034
1878
+ },
1879
+ "eval_RANGE_END": {
1880
+ "f1": 0.7963800904977375,
1881
+ "number": 92,
1882
+ "precision": 0.6821705426356589,
1883
+ "recall": 0.9565217391304348
1884
+ },
1885
+ "eval_UNIT": {
1886
+ "f1": 0.9530710253601821,
1887
+ "number": 5732,
1888
+ "precision": 0.9216229428059313,
1889
+ "recall": 0.9867411025819958
1890
+ },
1891
+ "eval_loss": 0.4803193211555481,
1892
+ "eval_overall_accuracy": 0.8355839623715056,
1893
+ "eval_overall_f1": 0.8531527433837031,
1894
+ "eval_overall_precision": 0.8277868584504741,
1895
+ "eval_overall_recall": 0.8801223454172604,
1896
+ "eval_runtime": 7.0311,
1897
+ "eval_samples_per_second": 1209.766,
1898
+ "eval_steps_per_second": 37.832,
1899
+ "step": 35000
1900
+ },
1901
+ {
1902
+ "epoch": 7.03,
1903
+ "learning_rate": 1.4858443872500496e-05,
1904
+ "loss": 0.4189,
1905
+ "step": 35500
1906
+ },
1907
+ {
1908
+ "epoch": 7.13,
1909
+ "learning_rate": 1.4363492377746981e-05,
1910
+ "loss": 0.4071,
1911
+ "step": 36000
1912
+ },
1913
+ {
1914
+ "epoch": 7.13,
1915
+ "eval_COMMENT": {
1916
+ "f1": 0.7068977142471848,
1917
+ "number": 6901,
1918
+ "precision": 0.6610340479192938,
1919
+ "recall": 0.7596000579626141
1920
+ },
1921
+ "eval_NAME": {
1922
+ "f1": 0.8058371393561323,
1923
+ "number": 8857,
1924
+ "precision": 0.7952072111685171,
1925
+ "recall": 0.8167551089533702
1926
+ },
1927
+ "eval_QTY": {
1928
+ "f1": 0.9864247125640672,
1929
+ "number": 7189,
1930
+ "precision": 0.9823423920540765,
1931
+ "recall": 0.9905411044651551
1932
+ },
1933
+ "eval_RANGE_END": {
1934
+ "f1": 0.7981651376146789,
1935
+ "number": 92,
1936
+ "precision": 0.6904761904761905,
1937
+ "recall": 0.9456521739130435
1938
+ },
1939
+ "eval_UNIT": {
1940
+ "f1": 0.9542881284326151,
1941
+ "number": 5732,
1942
+ "precision": 0.9252826478780928,
1943
+ "recall": 0.9851709699930217
1944
+ },
1945
+ "eval_loss": 0.48823681473731995,
1946
+ "eval_overall_accuracy": 0.8358115540719948,
1947
+ "eval_overall_f1": 0.8546798029556651,
1948
+ "eval_overall_precision": 0.8303884609080479,
1949
+ "eval_overall_recall": 0.880435160404574,
1950
+ "eval_runtime": 9.3911,
1951
+ "eval_samples_per_second": 905.75,
1952
+ "eval_steps_per_second": 28.325,
1953
+ "step": 36000
1954
+ },
1955
+ {
1956
+ "epoch": 7.23,
1957
+ "learning_rate": 1.3868540882993467e-05,
1958
+ "loss": 0.4066,
1959
+ "step": 36500
1960
+ },
1961
+ {
1962
+ "epoch": 7.33,
1963
+ "learning_rate": 1.3373589388239954e-05,
1964
+ "loss": 0.4093,
1965
+ "step": 37000
1966
+ },
1967
+ {
1968
+ "epoch": 7.33,
1969
+ "eval_COMMENT": {
1970
+ "f1": 0.7065691471515801,
1971
+ "number": 6901,
1972
+ "precision": 0.6579605098725319,
1973
+ "recall": 0.7629329082741632
1974
+ },
1975
+ "eval_NAME": {
1976
+ "f1": 0.8055648302726766,
1977
+ "number": 8857,
1978
+ "precision": 0.794249972566663,
1979
+ "recall": 0.8172067291407926
1980
+ },
1981
+ "eval_QTY": {
1982
+ "f1": 0.9863412604867227,
1983
+ "number": 7189,
1984
+ "precision": 0.9832734310201825,
1985
+ "recall": 0.9894282932257615
1986
+ },
1987
+ "eval_RANGE_END": {
1988
+ "f1": 0.7924528301886793,
1989
+ "number": 92,
1990
+ "precision": 0.7,
1991
+ "recall": 0.9130434782608695
1992
+ },
1993
+ "eval_UNIT": {
1994
+ "f1": 0.9535530641490347,
1995
+ "number": 5732,
1996
+ "precision": 0.9225248735932148,
1997
+ "recall": 0.9867411025819958
1998
+ },
1999
+ "eval_loss": 0.48563364148139954,
2000
+ "eval_overall_accuracy": 0.8367219208739521,
2001
+ "eval_overall_f1": 0.8541543851375251,
2002
+ "eval_overall_precision": 0.8286274509803921,
2003
+ "eval_overall_recall": 0.8813040909248896,
2004
+ "eval_runtime": 6.6204,
2005
+ "eval_samples_per_second": 1284.823,
2006
+ "eval_steps_per_second": 40.179,
2007
+ "step": 37000
2008
+ },
2009
+ {
2010
+ "epoch": 7.42,
2011
+ "learning_rate": 1.287863789348644e-05,
2012
+ "loss": 0.4197,
2013
+ "step": 37500
2014
+ },
2015
+ {
2016
+ "epoch": 7.52,
2017
+ "learning_rate": 1.2383686398732925e-05,
2018
+ "loss": 0.4124,
2019
+ "step": 38000
2020
+ },
2021
+ {
2022
+ "epoch": 7.52,
2023
+ "eval_COMMENT": {
2024
+ "f1": 0.7066407036862955,
2025
+ "number": 6901,
2026
+ "precision": 0.6584084084084084,
2027
+ "recall": 0.762498188668309
2028
+ },
2029
+ "eval_NAME": {
2030
+ "f1": 0.8056977520587582,
2031
+ "number": 8857,
2032
+ "precision": 0.7942951179374658,
2033
+ "recall": 0.8174325392345038
2034
+ },
2035
+ "eval_QTY": {
2036
+ "f1": 0.9862728785357736,
2037
+ "number": 7189,
2038
+ "precision": 0.9831375259156876,
2039
+ "recall": 0.9894282932257615
2040
+ },
2041
+ "eval_RANGE_END": {
2042
+ "f1": 0.7963800904977375,
2043
+ "number": 92,
2044
+ "precision": 0.6821705426356589,
2045
+ "recall": 0.9565217391304348
2046
+ },
2047
+ "eval_UNIT": {
2048
+ "f1": 0.9536647009267059,
2049
+ "number": 5732,
2050
+ "precision": 0.9221244705115673,
2051
+ "recall": 0.9874389392882066
2052
+ },
2053
+ "eval_loss": 0.4802015423774719,
2054
+ "eval_overall_accuracy": 0.8361908735728104,
2055
+ "eval_overall_f1": 0.8542606938363086,
2056
+ "eval_overall_precision": 0.8286124995916234,
2057
+ "eval_overall_recall": 0.881547391470578,
2058
+ "eval_runtime": 9.142,
2059
+ "eval_samples_per_second": 930.428,
2060
+ "eval_steps_per_second": 29.096,
2061
+ "step": 38000
2062
+ },
2063
+ {
2064
+ "epoch": 7.62,
2065
+ "learning_rate": 1.1888734903979411e-05,
2066
+ "loss": 0.4071,
2067
+ "step": 38500
2068
+ },
2069
+ {
2070
+ "epoch": 7.72,
2071
+ "learning_rate": 1.1393783409225896e-05,
2072
+ "loss": 0.414,
2073
+ "step": 39000
2074
+ },
2075
+ {
2076
+ "epoch": 7.72,
2077
+ "eval_COMMENT": {
2078
+ "f1": 0.7048144163528779,
2079
+ "number": 6901,
2080
+ "precision": 0.6575084681972149,
2081
+ "recall": 0.7594551514273293
2082
+ },
2083
+ "eval_NAME": {
2084
+ "f1": 0.8015089315433264,
2085
+ "number": 8857,
2086
+ "precision": 0.7878721779910568,
2087
+ "recall": 0.8156260584848143
2088
+ },
2089
+ "eval_QTY": {
2090
+ "f1": 0.9858686616791354,
2091
+ "number": 7189,
2092
+ "precision": 0.9819235545743066,
2093
+ "recall": 0.9898455974405341
2094
+ },
2095
+ "eval_RANGE_END": {
2096
+ "f1": 0.7945205479452054,
2097
+ "number": 92,
2098
+ "precision": 0.6850393700787402,
2099
+ "recall": 0.9456521739130435
2100
+ },
2101
+ "eval_UNIT": {
2102
+ "f1": 0.9549138804457953,
2103
+ "number": 5732,
2104
+ "precision": 0.925229057591623,
2105
+ "recall": 0.9865666434054431
2106
+ },
2107
+ "eval_loss": 0.483047753572464,
2108
+ "eval_overall_accuracy": 0.8365701930736259,
2109
+ "eval_overall_f1": 0.8526693267336735,
2110
+ "eval_overall_precision": 0.8268464703193366,
2111
+ "eval_overall_recall": 0.880157102638073,
2112
+ "eval_runtime": 7.5994,
2113
+ "eval_samples_per_second": 1119.299,
2114
+ "eval_steps_per_second": 35.003,
2115
+ "step": 39000
2116
+ },
2117
+ {
2118
+ "epoch": 7.82,
2119
+ "learning_rate": 1.0898831914472382e-05,
2120
+ "loss": 0.4196,
2121
+ "step": 39500
2122
+ },
2123
+ {
2124
+ "epoch": 7.92,
2125
+ "learning_rate": 1.0403880419718868e-05,
2126
+ "loss": 0.4212,
2127
+ "step": 40000
2128
+ },
2129
+ {
2130
+ "epoch": 7.92,
2131
+ "eval_COMMENT": {
2132
+ "f1": 0.7108280254777071,
2133
+ "number": 6901,
2134
+ "precision": 0.6614674319940105,
2135
+ "recall": 0.7681495435444139
2136
+ },
2137
+ "eval_NAME": {
2138
+ "f1": 0.8036936084997496,
2139
+ "number": 8857,
2140
+ "precision": 0.7921052631578948,
2141
+ "recall": 0.8156260584848143
2142
+ },
2143
+ "eval_QTY": {
2144
+ "f1": 0.9861815151725575,
2145
+ "number": 7189,
2146
+ "precision": 0.9846089850249584,
2147
+ "recall": 0.9877590763666713
2148
+ },
2149
+ "eval_RANGE_END": {
2150
+ "f1": 0.787037037037037,
2151
+ "number": 92,
2152
+ "precision": 0.6854838709677419,
2153
+ "recall": 0.9239130434782609
2154
+ },
2155
+ "eval_UNIT": {
2156
+ "f1": 0.9544457567065969,
2157
+ "number": 5732,
2158
+ "precision": 0.9240444299248611,
2159
+ "recall": 0.9869155617585486
2160
+ },
2161
+ "eval_loss": 0.4802730679512024,
2162
+ "eval_overall_accuracy": 0.8373477980502978,
2163
+ "eval_overall_f1": 0.8546737867021544,
2164
+ "eval_overall_precision": 0.8292364016736402,
2165
+ "eval_overall_recall": 0.8817211775746411,
2166
+ "eval_runtime": 8.1983,
2167
+ "eval_samples_per_second": 1037.537,
2168
+ "eval_steps_per_second": 32.446,
2169
+ "step": 40000
2170
+ },
2171
+ {
2172
+ "epoch": 8.02,
2173
+ "learning_rate": 9.908928924965353e-06,
2174
+ "loss": 0.4135,
2175
+ "step": 40500
2176
+ },
2177
+ {
2178
+ "epoch": 8.12,
2179
+ "learning_rate": 9.41397743021184e-06,
2180
+ "loss": 0.3994,
2181
+ "step": 41000
2182
+ },
2183
+ {
2184
+ "epoch": 8.12,
2185
+ "eval_COMMENT": {
2186
+ "f1": 0.7058981774161006,
2187
+ "number": 6901,
2188
+ "precision": 0.6586345381526104,
2189
+ "recall": 0.7604694971743226
2190
+ },
2191
+ "eval_NAME": {
2192
+ "f1": 0.8033988670443185,
2193
+ "number": 8857,
2194
+ "precision": 0.7905782052683353,
2195
+ "recall": 0.8166422039065147
2196
+ },
2197
+ "eval_QTY": {
2198
+ "f1": 0.9862045060658579,
2199
+ "number": 7189,
2200
+ "precision": 0.9830016583747927,
2201
+ "recall": 0.9894282932257615
2202
+ },
2203
+ "eval_RANGE_END": {
2204
+ "f1": 0.7963800904977375,
2205
+ "number": 92,
2206
+ "precision": 0.6821705426356589,
2207
+ "recall": 0.9565217391304348
2208
+ },
2209
+ "eval_UNIT": {
2210
+ "f1": 0.9540433426089888,
2211
+ "number": 5732,
2212
+ "precision": 0.9232903541700669,
2213
+ "recall": 0.9869155617585486
2214
+ },
2215
+ "eval_loss": 0.4922930598258972,
2216
+ "eval_overall_accuracy": 0.8354701665212608,
2217
+ "eval_overall_f1": 0.8534523408555069,
2218
+ "eval_overall_precision": 0.8278284164788134,
2219
+ "eval_overall_recall": 0.8807132181710751,
2220
+ "eval_runtime": 7.4213,
2221
+ "eval_samples_per_second": 1146.156,
2222
+ "eval_steps_per_second": 35.843,
2223
+ "step": 41000
2224
+ },
2225
+ {
2226
+ "epoch": 8.22,
2227
+ "learning_rate": 8.919025935458326e-06,
2228
+ "loss": 0.4167,
2229
+ "step": 41500
2230
+ },
2231
+ {
2232
+ "epoch": 8.32,
2233
+ "learning_rate": 8.424074440704812e-06,
2234
+ "loss": 0.4052,
2235
+ "step": 42000
2236
+ },
2237
+ {
2238
+ "epoch": 8.32,
2239
+ "eval_COMMENT": {
2240
+ "f1": 0.7033915447373744,
2241
+ "number": 6901,
2242
+ "precision": 0.6577553593947036,
2243
+ "recall": 0.7558324880452109
2244
+ },
2245
+ "eval_NAME": {
2246
+ "f1": 0.8042463317029791,
2247
+ "number": 8857,
2248
+ "precision": 0.7920087575259989,
2249
+ "recall": 0.8168680140002258
2250
+ },
2251
+ "eval_QTY": {
2252
+ "f1": 0.9861438270749618,
2253
+ "number": 7189,
2254
+ "precision": 0.9823326432022084,
2255
+ "recall": 0.9899846988454584
2256
+ },
2257
+ "eval_RANGE_END": {
2258
+ "f1": 0.8018018018018018,
2259
+ "number": 92,
2260
+ "precision": 0.6846153846153846,
2261
+ "recall": 0.967391304347826
2262
+ },
2263
+ "eval_UNIT": {
2264
+ "f1": 0.9546567592670776,
2265
+ "number": 5732,
2266
+ "precision": 0.9250531827851416,
2267
+ "recall": 0.9862177250523377
2268
+ },
2269
+ "eval_loss": 0.4865518808364868,
2270
+ "eval_overall_accuracy": 0.8359822478473619,
2271
+ "eval_overall_f1": 0.8533090590337481,
2272
+ "eval_overall_precision": 0.8284507872082747,
2273
+ "eval_overall_recall": 0.8797052587675089,
2274
+ "eval_runtime": 7.4797,
2275
+ "eval_samples_per_second": 1137.217,
2276
+ "eval_steps_per_second": 35.563,
2277
+ "step": 42000
2278
+ },
2279
+ {
2280
+ "epoch": 8.41,
2281
+ "learning_rate": 7.929122945951298e-06,
2282
+ "loss": 0.4042,
2283
+ "step": 42500
2284
+ },
2285
+ {
2286
+ "epoch": 8.51,
2287
+ "learning_rate": 7.434171451197783e-06,
2288
+ "loss": 0.4042,
2289
+ "step": 43000
2290
+ },
2291
+ {
2292
+ "epoch": 8.51,
2293
+ "eval_COMMENT": {
2294
+ "f1": 0.7073401950162513,
2295
+ "number": 6901,
2296
+ "precision": 0.663912546078556,
2297
+ "recall": 0.7568468337922041
2298
+ },
2299
+ "eval_NAME": {
2300
+ "f1": 0.8030025020850708,
2301
+ "number": 8857,
2302
+ "precision": 0.7910823838737949,
2303
+ "recall": 0.8152873433442475
2304
+ },
2305
+ "eval_QTY": {
2306
+ "f1": 0.9858200179843675,
2307
+ "number": 7189,
2308
+ "precision": 0.980462300495322,
2309
+ "recall": 0.991236611489776
2310
+ },
2311
+ "eval_RANGE_END": {
2312
+ "f1": 0.7909090909090909,
2313
+ "number": 92,
2314
+ "precision": 0.6796875,
2315
+ "recall": 0.9456521739130435
2316
+ },
2317
+ "eval_UNIT": {
2318
+ "f1": 0.9534962089300758,
2319
+ "number": 5732,
2320
+ "precision": 0.921961550993809,
2321
+ "recall": 0.9872644801116539
2322
+ },
2323
+ "eval_loss": 0.48657840490341187,
2324
+ "eval_overall_accuracy": 0.8364563972233813,
2325
+ "eval_overall_f1": 0.8538279932546375,
2326
+ "eval_overall_precision": 0.8292443250679682,
2327
+ "eval_overall_recall": 0.8799138020923847,
2328
+ "eval_runtime": 9.0804,
2329
+ "eval_samples_per_second": 936.741,
2330
+ "eval_steps_per_second": 29.294,
2331
+ "step": 43000
2332
+ },
2333
+ {
2334
+ "epoch": 8.61,
2335
+ "learning_rate": 6.939219956444269e-06,
2336
+ "loss": 0.4036,
2337
+ "step": 43500
2338
+ },
2339
+ {
2340
+ "epoch": 8.71,
2341
+ "learning_rate": 6.444268461690754e-06,
2342
+ "loss": 0.4135,
2343
+ "step": 44000
2344
+ },
2345
+ {
2346
+ "epoch": 8.71,
2347
+ "eval_COMMENT": {
2348
+ "f1": 0.7091805715057758,
2349
+ "number": 6901,
2350
+ "precision": 0.664262212098203,
2351
+ "recall": 0.7606144037096073
2352
+ },
2353
+ "eval_NAME": {
2354
+ "f1": 0.802937576499388,
2355
+ "number": 8857,
2356
+ "precision": 0.7914884282110344,
2357
+ "recall": 0.8147228181099695
2358
+ },
2359
+ "eval_QTY": {
2360
+ "f1": 0.985878443859892,
2361
+ "number": 7189,
2362
+ "precision": 0.9812594736116853,
2363
+ "recall": 0.9905411044651551
2364
+ },
2365
+ "eval_RANGE_END": {
2366
+ "f1": 0.7813953488372093,
2367
+ "number": 92,
2368
+ "precision": 0.6829268292682927,
2369
+ "recall": 0.9130434782608695
2370
+ },
2371
+ "eval_UNIT": {
2372
+ "f1": 0.9540588384051252,
2373
+ "number": 5732,
2374
+ "precision": 0.9230141901810471,
2375
+ "recall": 0.9872644801116539
2376
+ },
2377
+ "eval_loss": 0.48304322361946106,
2378
+ "eval_overall_accuracy": 0.8367977847741153,
2379
+ "eval_overall_f1": 0.8542520362219861,
2380
+ "eval_overall_precision": 0.8296429741238126,
2381
+ "eval_overall_recall": 0.8803656459629488,
2382
+ "eval_runtime": 6.5688,
2383
+ "eval_samples_per_second": 1294.905,
2384
+ "eval_steps_per_second": 40.494,
2385
+ "step": 44000
2386
+ },
2387
+ {
2388
+ "epoch": 8.81,
2389
+ "learning_rate": 5.949316966937241e-06,
2390
+ "loss": 0.4078,
2391
+ "step": 44500
2392
+ },
2393
+ {
2394
+ "epoch": 8.91,
2395
+ "learning_rate": 5.4543654721837265e-06,
2396
+ "loss": 0.3958,
2397
+ "step": 45000
2398
+ },
2399
+ {
2400
+ "epoch": 8.91,
2401
+ "eval_COMMENT": {
2402
+ "f1": 0.7085999057175567,
2403
+ "number": 6901,
2404
+ "precision": 0.6619275289380976,
2405
+ "recall": 0.7623532821330242
2406
+ },
2407
+ "eval_NAME": {
2408
+ "f1": 0.8035773802910788,
2409
+ "number": 8857,
2410
+ "precision": 0.7909240021869874,
2411
+ "recall": 0.8166422039065147
2412
+ },
2413
+ "eval_QTY": {
2414
+ "f1": 0.9864836764400082,
2415
+ "number": 7189,
2416
+ "precision": 0.9831445150594087,
2417
+ "recall": 0.9898455974405341
2418
+ },
2419
+ "eval_RANGE_END": {
2420
+ "f1": 0.7906976744186046,
2421
+ "number": 92,
2422
+ "precision": 0.6910569105691057,
2423
+ "recall": 0.9239130434782609
2424
+ },
2425
+ "eval_UNIT": {
2426
+ "f1": 0.9539395984477813,
2427
+ "number": 5732,
2428
+ "precision": 0.9235543939888925,
2429
+ "recall": 0.9863921842288904
2430
+ },
2431
+ "eval_loss": 0.4859357178211212,
2432
+ "eval_overall_accuracy": 0.8370822743997269,
2433
+ "eval_overall_f1": 0.8542639055049118,
2434
+ "eval_overall_precision": 0.829048927263213,
2435
+ "eval_overall_recall": 0.8810607903792013,
2436
+ "eval_runtime": 9.1351,
2437
+ "eval_samples_per_second": 931.131,
2438
+ "eval_steps_per_second": 29.118,
2439
+ "step": 45000
2440
+ },
2441
+ {
2442
+ "epoch": 9.01,
2443
+ "learning_rate": 4.959413977430212e-06,
2444
+ "loss": 0.4071,
2445
+ "step": 45500
2446
+ },
2447
+ {
2448
+ "epoch": 9.11,
2449
+ "learning_rate": 4.4644624826766974e-06,
2450
+ "loss": 0.3985,
2451
+ "step": 46000
2452
+ },
2453
+ {
2454
+ "epoch": 9.11,
2455
+ "eval_COMMENT": {
2456
+ "f1": 0.7050125483280201,
2457
+ "number": 6901,
2458
+ "precision": 0.6627135934710533,
2459
+ "recall": 0.7530792638748007
2460
+ },
2461
+ "eval_NAME": {
2462
+ "f1": 0.8021064301552105,
2463
+ "number": 8857,
2464
+ "precision": 0.7878688881629097,
2465
+ "recall": 0.8168680140002258
2466
+ },
2467
+ "eval_QTY": {
2468
+ "f1": 0.9866093110386457,
2469
+ "number": 7189,
2470
+ "precision": 0.9842192691029901,
2471
+ "recall": 0.989010989010989
2472
+ },
2473
+ "eval_RANGE_END": {
2474
+ "f1": 0.7853881278538813,
2475
+ "number": 92,
2476
+ "precision": 0.6771653543307087,
2477
+ "recall": 0.9347826086956522
2478
+ },
2479
+ "eval_UNIT": {
2480
+ "f1": 0.9550875412331895,
2481
+ "number": 5732,
2482
+ "precision": 0.9269413889344935,
2483
+ "recall": 0.984996510816469
2484
+ },
2485
+ "eval_loss": 0.4896639585494995,
2486
+ "eval_overall_accuracy": 0.8351856768956492,
2487
+ "eval_overall_f1": 0.8533036226746344,
2488
+ "eval_overall_precision": 0.8295532871631601,
2489
+ "eval_overall_recall": 0.8784539988182545,
2490
+ "eval_runtime": 6.8177,
2491
+ "eval_samples_per_second": 1247.642,
2492
+ "eval_steps_per_second": 39.016,
2493
+ "step": 46000
2494
+ },
2495
+ {
2496
+ "epoch": 9.21,
2497
+ "learning_rate": 3.969510987923184e-06,
2498
+ "loss": 0.3989,
2499
+ "step": 46500
2500
+ },
2501
+ {
2502
+ "epoch": 9.31,
2503
+ "learning_rate": 3.4745594931696697e-06,
2504
+ "loss": 0.3944,
2505
+ "step": 47000
2506
+ },
2507
+ {
2508
+ "epoch": 9.31,
2509
+ "eval_COMMENT": {
2510
+ "f1": 0.709349593495935,
2511
+ "number": 6901,
2512
+ "precision": 0.6661152818424736,
2513
+ "recall": 0.7585857122156209
2514
+ },
2515
+ "eval_NAME": {
2516
+ "f1": 0.8033533200088829,
2517
+ "number": 8857,
2518
+ "precision": 0.7902785363189514,
2519
+ "recall": 0.8168680140002258
2520
+ },
2521
+ "eval_QTY": {
2522
+ "f1": 0.9866833125260092,
2523
+ "number": 7189,
2524
+ "precision": 0.9839535205422604,
2525
+ "recall": 0.9894282932257615
2526
+ },
2527
+ "eval_RANGE_END": {
2528
+ "f1": 0.787037037037037,
2529
+ "number": 92,
2530
+ "precision": 0.6854838709677419,
2531
+ "recall": 0.9239130434782609
2532
+ },
2533
+ "eval_UNIT": {
2534
+ "f1": 0.954649100582721,
2535
+ "number": 5732,
2536
+ "precision": 0.9251923391717138,
2537
+ "recall": 0.9860432658757851
2538
+ },
2539
+ "eval_loss": 0.48901429772377014,
2540
+ "eval_overall_accuracy": 0.8369495125744415,
2541
+ "eval_overall_f1": 0.8547268216112208,
2542
+ "eval_overall_precision": 0.8308176926105788,
2543
+ "eval_overall_recall": 0.8800528309756351,
2544
+ "eval_runtime": 9.5285,
2545
+ "eval_samples_per_second": 892.692,
2546
+ "eval_steps_per_second": 27.916,
2547
+ "step": 47000
2548
+ },
2549
+ {
2550
+ "epoch": 9.4,
2551
+ "learning_rate": 2.979607998416155e-06,
2552
+ "loss": 0.397,
2553
+ "step": 47500
2554
+ },
2555
+ {
2556
+ "epoch": 9.5,
2557
+ "learning_rate": 2.484656503662641e-06,
2558
+ "loss": 0.3959,
2559
+ "step": 48000
2560
+ },
2561
+ {
2562
+ "epoch": 9.5,
2563
+ "eval_COMMENT": {
2564
+ "f1": 0.7106236964273699,
2565
+ "number": 6901,
2566
+ "precision": 0.6632755589047978,
2567
+ "recall": 0.765251412838719
2568
+ },
2569
+ "eval_NAME": {
2570
+ "f1": 0.8044214853080043,
2571
+ "number": 8857,
2572
+ "precision": 0.7917122239230264,
2573
+ "recall": 0.8175454442813593
2574
+ },
2575
+ "eval_QTY": {
2576
+ "f1": 0.9865483289418943,
2577
+ "number": 7189,
2578
+ "precision": 0.9835476289229919,
2579
+ "recall": 0.9895673946306858
2580
+ },
2581
+ "eval_RANGE_END": {
2582
+ "f1": 0.7926267281105991,
2583
+ "number": 92,
2584
+ "precision": 0.688,
2585
+ "recall": 0.9347826086956522
2586
+ },
2587
+ "eval_UNIT": {
2588
+ "f1": 0.9542693216334796,
2589
+ "number": 5732,
2590
+ "precision": 0.9240196078431373,
2591
+ "recall": 0.9865666434054431
2592
+ },
2593
+ "eval_loss": 0.4869215190410614,
2594
+ "eval_overall_accuracy": 0.8368736486742784,
2595
+ "eval_overall_f1": 0.8550634297555469,
2596
+ "eval_overall_precision": 0.829693323742889,
2597
+ "eval_overall_recall": 0.8820339925619547,
2598
+ "eval_runtime": 6.6612,
2599
+ "eval_samples_per_second": 1276.945,
2600
+ "eval_steps_per_second": 39.933,
2601
+ "step": 48000
2602
+ },
2603
+ {
2604
+ "epoch": 9.6,
2605
+ "learning_rate": 1.989705008909127e-06,
2606
+ "loss": 0.3916,
2607
+ "step": 48500
2608
+ },
2609
+ {
2610
+ "epoch": 9.7,
2611
+ "learning_rate": 1.4947535141556129e-06,
2612
+ "loss": 0.3979,
2613
+ "step": 49000
2614
+ },
2615
+ {
2616
+ "epoch": 9.7,
2617
+ "eval_COMMENT": {
2618
+ "f1": 0.7113812901046943,
2619
+ "number": 6901,
2620
+ "precision": 0.666244939271255,
2621
+ "recall": 0.7630778148094479
2622
+ },
2623
+ "eval_NAME": {
2624
+ "f1": 0.8035317636605953,
2625
+ "number": 8857,
2626
+ "precision": 0.7906239755218009,
2627
+ "recall": 0.8168680140002258
2628
+ },
2629
+ "eval_QTY": {
2630
+ "f1": 0.9864780528396089,
2631
+ "number": 7189,
2632
+ "precision": 0.9835453539823009,
2633
+ "recall": 0.9894282932257615
2634
+ },
2635
+ "eval_RANGE_END": {
2636
+ "f1": 0.7813953488372093,
2637
+ "number": 92,
2638
+ "precision": 0.6829268292682927,
2639
+ "recall": 0.9130434782608695
2640
+ },
2641
+ "eval_UNIT": {
2642
+ "f1": 0.9541810817652518,
2643
+ "number": 5732,
2644
+ "precision": 0.9240071907174375,
2645
+ "recall": 0.9863921842288904
2646
+ },
2647
+ "eval_loss": 0.48777857422828674,
2648
+ "eval_overall_accuracy": 0.8369115806243599,
2649
+ "eval_overall_f1": 0.8550421585160202,
2650
+ "eval_overall_precision": 0.8304235317239346,
2651
+ "eval_overall_recall": 0.8811650620416391,
2652
+ "eval_runtime": 8.6569,
2653
+ "eval_samples_per_second": 982.572,
2654
+ "eval_steps_per_second": 30.727,
2655
+ "step": 49000
2656
+ },
2657
+ {
2658
+ "epoch": 9.8,
2659
+ "learning_rate": 9.998020194020988e-07,
2660
+ "loss": 0.4088,
2661
+ "step": 49500
2662
+ },
2663
+ {
2664
+ "epoch": 9.9,
2665
+ "learning_rate": 5.048505246485845e-07,
2666
+ "loss": 0.4095,
2667
+ "step": 50000
2668
+ },
2669
+ {
2670
+ "epoch": 9.9,
2671
+ "eval_COMMENT": {
2672
+ "f1": 0.7118095366561004,
2673
+ "number": 6901,
2674
+ "precision": 0.665783497350492,
2675
+ "recall": 0.7646717866975801
2676
+ },
2677
+ "eval_NAME": {
2678
+ "f1": 0.80368950380619,
2679
+ "number": 8857,
2680
+ "precision": 0.7912472647702407,
2681
+ "recall": 0.8165292988596591
2682
+ },
2683
+ "eval_QTY": {
2684
+ "f1": 0.9863412604867227,
2685
+ "number": 7189,
2686
+ "precision": 0.9832734310201825,
2687
+ "recall": 0.9894282932257615
2688
+ },
2689
+ "eval_RANGE_END": {
2690
+ "f1": 0.7813953488372093,
2691
+ "number": 92,
2692
+ "precision": 0.6829268292682927,
2693
+ "recall": 0.9130434782608695
2694
+ },
2695
+ "eval_UNIT": {
2696
+ "f1": 0.9544226873733964,
2697
+ "number": 5732,
2698
+ "precision": 0.9244604316546763,
2699
+ "recall": 0.9863921842288904
2700
+ },
2701
+ "eval_loss": 0.48620378971099854,
2702
+ "eval_overall_accuracy": 0.8372719341501347,
2703
+ "eval_overall_f1": 0.855167762603271,
2704
+ "eval_overall_precision": 0.8304135695340384,
2705
+ "eval_overall_recall": 0.8814431198081402,
2706
+ "eval_runtime": 8.2871,
2707
+ "eval_samples_per_second": 1026.42,
2708
+ "eval_steps_per_second": 32.098,
2709
+ "step": 50000
2710
+ },
2711
+ {
2712
+ "epoch": 10.0,
2713
+ "learning_rate": 9.899029895070283e-09,
2714
+ "loss": 0.3994,
2715
+ "step": 50500
2716
+ },
2717
+ {
2718
+ "epoch": 10.0,
2719
+ "step": 50510,
2720
+ "total_flos": 1555191327435270.0,
2721
+ "train_loss": 0.45639907907811844,
2722
+ "train_runtime": 1954.9419,
2723
+ "train_samples_per_second": 826.638,
2724
+ "train_steps_per_second": 25.837
2725
+ }
2726
+ ],
2727
+ "logging_steps": 500,
2728
+ "max_steps": 50510,
2729
+ "num_train_epochs": 10,
2730
+ "save_steps": 1000,
2731
+ "total_flos": 1555191327435270.0,
2732
+ "trial_name": null,
2733
+ "trial_params": null
2734
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c5410c47250eb6dc78a5b7266e040300f9e0d9b784546b7746f4dfdda92fce2
3
+ size 4600
validation_results.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 10.0,
3
+ "eval_COMMENT": {
4
+ "f1": 0.69833923223523,
5
+ "number": 6901,
6
+ "precision": 0.6584520600693108,
7
+ "recall": 0.7433705260107231
8
+ },
9
+ "eval_NAME": {
10
+ "f1": 0.8048291977300545,
11
+ "number": 8857,
12
+ "precision": 0.7933530766699572,
13
+ "recall": 0.8166422039065147
14
+ },
15
+ "eval_QTY": {
16
+ "f1": 0.9856135011758197,
17
+ "number": 7189,
18
+ "precision": 0.9801898472967395,
19
+ "recall": 0.9910975100848518
20
+ },
21
+ "eval_RANGE_END": {
22
+ "f1": 0.7837837837837838,
23
+ "number": 92,
24
+ "precision": 0.6692307692307692,
25
+ "recall": 0.9456521739130435
26
+ },
27
+ "eval_UNIT": {
28
+ "f1": 0.9537942664418213,
29
+ "number": 5732,
30
+ "precision": 0.922976501305483,
31
+ "recall": 0.9867411025819958
32
+ },
33
+ "eval_loss": 0.47403302788734436,
34
+ "eval_overall_accuracy": 0.8347115275196297,
35
+ "eval_overall_f1": 0.8523122656487518,
36
+ "eval_overall_precision": 0.8290126499096435,
37
+ "eval_overall_recall": 0.8769594383233117,
38
+ "eval_runtime": 9.862,
39
+ "eval_samples_per_second": 862.507,
40
+ "eval_steps_per_second": 26.972
41
+ }
vocab.txt ADDED
The diff for this file is too large to render. See raw diff