nielsr HF staff committed on
Commit
fa7d4a2
1 Parent(s): e13cfdd

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.9384550084889643,
4
+ "eval_f1": 0.9269016697588126,
5
+ "eval_loss": 0.30563604831695557,
6
+ "eval_precision": 0.9190581309786607,
7
+ "eval_recall": 0.9348802395209581,
8
+ "eval_runtime": 8.103,
9
+ "eval_samples": 100,
10
+ "eval_samples_per_second": 12.341,
11
+ "eval_steps_per_second": 0.864,
12
+ "train_loss": 0.7290411071777344,
13
+ "train_runtime": 1777.9741,
14
+ "train_samples": 800,
15
+ "train_samples_per_second": 8.999,
16
+ "train_steps_per_second": 0.562
17
+ }
eval_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.9384550084889643,
4
+ "eval_f1": 0.9269016697588126,
5
+ "eval_loss": 0.30563604831695557,
6
+ "eval_precision": 0.9190581309786607,
7
+ "eval_recall": 0.9348802395209581,
8
+ "eval_runtime": 8.103,
9
+ "eval_samples": 100,
10
+ "eval_samples_per_second": 12.341,
11
+ "eval_steps_per_second": 0.864
12
+ }
runs/May02_17-47-48_brutasse/events.out.tfevents.1651516292.brutasse.19888.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de232cdbaea82115cd76733b0d0fcd778eea43446f40a50892537f4d5504d02
3
+ size 512
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "train_loss": 0.7290411071777344,
4
+ "train_runtime": 1777.9741,
5
+ "train_samples": 800,
6
+ "train_samples_per_second": 8.999,
7
+ "train_steps_per_second": 0.562
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,157 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9269016697588126,
3
+ "best_model_checkpoint": "layoutlmv3-test-cord/checkpoint-1000",
4
+ "epoch": 20.0,
5
+ "global_step": 1000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 2.0,
12
+ "eval_accuracy": 0.6366723259762309,
13
+ "eval_f1": 0.5626932325661285,
14
+ "eval_loss": 1.6054191589355469,
15
+ "eval_precision": 0.52,
16
+ "eval_recall": 0.6130239520958084,
17
+ "eval_runtime": 8.1419,
18
+ "eval_samples_per_second": 12.282,
19
+ "eval_steps_per_second": 0.86,
20
+ "step": 100
21
+ },
22
+ {
23
+ "epoch": 4.0,
24
+ "eval_accuracy": 0.8314940577249575,
25
+ "eval_f1": 0.8096632503660322,
26
+ "eval_loss": 0.9171701669692993,
27
+ "eval_precision": 0.7922636103151862,
28
+ "eval_recall": 0.8278443113772455,
29
+ "eval_runtime": 8.1716,
30
+ "eval_samples_per_second": 12.238,
31
+ "eval_steps_per_second": 0.857,
32
+ "step": 200
33
+ },
34
+ {
35
+ "epoch": 6.0,
36
+ "eval_accuracy": 0.866723259762309,
37
+ "eval_f1": 0.8496683861459101,
38
+ "eval_loss": 0.6381942629814148,
39
+ "eval_precision": 0.8367198838896952,
40
+ "eval_recall": 0.8630239520958084,
41
+ "eval_runtime": 8.0786,
42
+ "eval_samples_per_second": 12.378,
43
+ "eval_steps_per_second": 0.866,
44
+ "step": 300
45
+ },
46
+ {
47
+ "epoch": 8.0,
48
+ "eval_accuracy": 0.8960101867572157,
49
+ "eval_f1": 0.8775811209439529,
50
+ "eval_loss": 0.4974280595779419,
51
+ "eval_precision": 0.8648255813953488,
52
+ "eval_recall": 0.8907185628742516,
53
+ "eval_runtime": 8.0768,
54
+ "eval_samples_per_second": 12.381,
55
+ "eval_steps_per_second": 0.867,
56
+ "step": 400
57
+ },
58
+ {
59
+ "epoch": 10.0,
60
+ "learning_rate": 5e-06,
61
+ "loss": 1.1589,
62
+ "step": 500
63
+ },
64
+ {
65
+ "epoch": 10.0,
66
+ "eval_accuracy": 0.916383701188455,
67
+ "eval_f1": 0.8914243651085757,
68
+ "eval_loss": 0.41238266229629517,
69
+ "eval_precision": 0.8769007965242578,
70
+ "eval_recall": 0.906437125748503,
71
+ "eval_runtime": 8.1158,
72
+ "eval_samples_per_second": 12.322,
73
+ "eval_steps_per_second": 0.863,
74
+ "step": 500
75
+ },
76
+ {
77
+ "epoch": 12.0,
78
+ "eval_accuracy": 0.9235993208828522,
79
+ "eval_f1": 0.9064002959674436,
80
+ "eval_loss": 0.37666961550712585,
81
+ "eval_precision": 0.8961228968544257,
82
+ "eval_recall": 0.9169161676646707,
83
+ "eval_runtime": 8.1123,
84
+ "eval_samples_per_second": 12.327,
85
+ "eval_steps_per_second": 0.863,
86
+ "step": 600
87
+ },
88
+ {
89
+ "epoch": 14.0,
90
+ "eval_accuracy": 0.933786078098472,
91
+ "eval_f1": 0.9210818821785848,
92
+ "eval_loss": 0.3387647271156311,
93
+ "eval_precision": 0.9119589141599413,
94
+ "eval_recall": 0.9303892215568862,
95
+ "eval_runtime": 8.0833,
96
+ "eval_samples_per_second": 12.371,
97
+ "eval_steps_per_second": 0.866,
98
+ "step": 700
99
+ },
100
+ {
101
+ "epoch": 16.0,
102
+ "eval_accuracy": 0.9393039049235993,
103
+ "eval_f1": 0.927643784786642,
104
+ "eval_loss": 0.3137519955635071,
105
+ "eval_precision": 0.919793966151582,
106
+ "eval_recall": 0.9356287425149701,
107
+ "eval_runtime": 7.8384,
108
+ "eval_samples_per_second": 12.758,
109
+ "eval_steps_per_second": 0.893,
110
+ "step": 800
111
+ },
112
+ {
113
+ "epoch": 18.0,
114
+ "eval_accuracy": 0.9376061120543294,
115
+ "eval_f1": 0.9254174397031539,
116
+ "eval_loss": 0.30727389454841614,
117
+ "eval_precision": 0.9175864606328182,
118
+ "eval_recall": 0.9333832335329342,
119
+ "eval_runtime": 7.8694,
120
+ "eval_samples_per_second": 12.708,
121
+ "eval_steps_per_second": 0.89,
122
+ "step": 900
123
+ },
124
+ {
125
+ "epoch": 20.0,
126
+ "learning_rate": 0.0,
127
+ "loss": 0.2992,
128
+ "step": 1000
129
+ },
130
+ {
131
+ "epoch": 20.0,
132
+ "eval_accuracy": 0.9384550084889643,
133
+ "eval_f1": 0.9269016697588126,
134
+ "eval_loss": 0.30563604831695557,
135
+ "eval_precision": 0.9190581309786607,
136
+ "eval_recall": 0.9348802395209581,
137
+ "eval_runtime": 7.9092,
138
+ "eval_samples_per_second": 12.644,
139
+ "eval_steps_per_second": 0.885,
140
+ "step": 1000
141
+ },
142
+ {
143
+ "epoch": 20.0,
144
+ "step": 1000,
145
+ "total_flos": 4248755355648000.0,
146
+ "train_loss": 0.7290411071777344,
147
+ "train_runtime": 1777.9741,
148
+ "train_samples_per_second": 8.999,
149
+ "train_steps_per_second": 0.562
150
+ }
151
+ ],
152
+ "max_steps": 1000,
153
+ "num_train_epochs": 20,
154
+ "total_flos": 4248755355648000.0,
155
+ "trial_name": null,
156
+ "trial_params": null
157
+ }