nielsr HF staff committed on
Commit
dba26d1
1 Parent(s): e68ba5f

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 100.0,
3
+ "eval_accuracy": 0.8330271015158475,
4
+ "eval_f1": 0.9077802634849614,
5
+ "eval_loss": 1.1164220571517944,
6
+ "eval_precision": 0.9026198714780029,
7
+ "eval_recall": 0.913,
8
+ "eval_runtime": 4.5243,
9
+ "eval_samples": 54,
10
+ "eval_samples_per_second": 11.936,
11
+ "eval_steps_per_second": 0.884,
12
+ "train_loss": 0.12633917331695557,
13
+ "train_runtime": 1653.606,
14
+ "train_samples": 150,
15
+ "train_samples_per_second": 9.676,
16
+ "train_steps_per_second": 0.605
17
+ }
eval_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 100.0,
3
+ "eval_accuracy": 0.8330271015158475,
4
+ "eval_f1": 0.9077802634849614,
5
+ "eval_loss": 1.1164220571517944,
6
+ "eval_precision": 0.9026198714780029,
7
+ "eval_recall": 0.913,
8
+ "eval_runtime": 4.5243,
9
+ "eval_samples": 54,
10
+ "eval_samples_per_second": 11.936,
11
+ "eval_steps_per_second": 0.884
12
+ }
runs/May02_16-26-18_brutasse/events.out.tfevents.1651510649.brutasse.9557.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb2ed9c23e5973706e0aaa2a59ef0f1cfcfedaa1baa2552e05455bc0bebe9eaf
3
+ size 512
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 100.0,
3
+ "train_loss": 0.12633917331695557,
4
+ "train_runtime": 1653.606,
5
+ "train_samples": 150,
6
+ "train_samples_per_second": 9.676,
7
+ "train_steps_per_second": 0.605
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,157 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9077802634849614,
3
+ "best_model_checkpoint": "layoutlmv3-test/checkpoint-1000",
4
+ "epoch": 100.0,
5
+ "global_step": 1000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 10.0,
12
+ "eval_accuracy": 0.8409508497932935,
13
+ "eval_f1": 0.8606119475473532,
14
+ "eval_loss": 0.5238379240036011,
15
+ "eval_precision": 0.8366383380547686,
16
+ "eval_recall": 0.886,
17
+ "eval_runtime": 4.4875,
18
+ "eval_samples_per_second": 12.033,
19
+ "eval_steps_per_second": 0.891,
20
+ "step": 100
21
+ },
22
+ {
23
+ "epoch": 20.0,
24
+ "eval_accuracy": 0.8322232429949472,
25
+ "eval_f1": 0.8856507779698691,
26
+ "eval_loss": 0.6930040717124939,
27
+ "eval_precision": 0.8750610053684724,
28
+ "eval_recall": 0.8965,
29
+ "eval_runtime": 4.6295,
30
+ "eval_samples_per_second": 11.664,
31
+ "eval_steps_per_second": 0.864,
32
+ "step": 200
33
+ },
34
+ {
35
+ "epoch": 30.0,
36
+ "eval_accuracy": 0.8414101975195223,
37
+ "eval_f1": 0.899009900990099,
38
+ "eval_loss": 0.7784350514411926,
39
+ "eval_precision": 0.8901960784313725,
40
+ "eval_recall": 0.908,
41
+ "eval_runtime": 4.5256,
42
+ "eval_samples_per_second": 11.932,
43
+ "eval_steps_per_second": 0.884,
44
+ "step": 300
45
+ },
46
+ {
47
+ "epoch": 40.0,
48
+ "eval_accuracy": 0.836357372531006,
49
+ "eval_f1": 0.8982630272952853,
50
+ "eval_loss": 0.9056066870689392,
51
+ "eval_precision": 0.8916256157635468,
52
+ "eval_recall": 0.905,
53
+ "eval_runtime": 4.5498,
54
+ "eval_samples_per_second": 11.869,
55
+ "eval_steps_per_second": 0.879,
56
+ "step": 400
57
+ },
58
+ {
59
+ "epoch": 50.0,
60
+ "learning_rate": 5e-06,
61
+ "loss": 0.2429,
62
+ "step": 500
63
+ },
64
+ {
65
+ "epoch": 50.0,
66
+ "eval_accuracy": 0.8298116674322462,
67
+ "eval_f1": 0.9014154457412467,
68
+ "eval_loss": 1.001568078994751,
69
+ "eval_precision": 0.895411938825851,
70
+ "eval_recall": 0.9075,
71
+ "eval_runtime": 4.6434,
72
+ "eval_samples_per_second": 11.629,
73
+ "eval_steps_per_second": 0.861,
74
+ "step": 500
75
+ },
76
+ {
77
+ "epoch": 60.0,
78
+ "eval_accuracy": 0.8293523197060174,
79
+ "eval_f1": 0.8934262948207171,
80
+ "eval_loss": 1.009719967842102,
81
+ "eval_precision": 0.8898809523809523,
82
+ "eval_recall": 0.897,
83
+ "eval_runtime": 4.6541,
84
+ "eval_samples_per_second": 11.603,
85
+ "eval_steps_per_second": 0.859,
86
+ "step": 600
87
+ },
88
+ {
89
+ "epoch": 70.0,
90
+ "eval_accuracy": 0.8315342214056041,
91
+ "eval_f1": 0.906008476689105,
92
+ "eval_loss": 1.072226643562317,
93
+ "eval_precision": 0.9035305818000995,
94
+ "eval_recall": 0.9085,
95
+ "eval_runtime": 4.5145,
96
+ "eval_samples_per_second": 11.961,
97
+ "eval_steps_per_second": 0.886,
98
+ "step": 700
99
+ },
100
+ {
101
+ "epoch": 80.0,
102
+ "eval_accuracy": 0.8269407441433165,
103
+ "eval_f1": 0.9003708281829418,
104
+ "eval_loss": 1.088362693786621,
105
+ "eval_precision": 0.8904645476772616,
106
+ "eval_recall": 0.9105,
107
+ "eval_runtime": 4.4141,
108
+ "eval_samples_per_second": 12.233,
109
+ "eval_steps_per_second": 0.906,
110
+ "step": 800
111
+ },
112
+ {
113
+ "epoch": 90.0,
114
+ "eval_accuracy": 0.827859439595774,
115
+ "eval_f1": 0.9013386217154189,
116
+ "eval_loss": 1.129175066947937,
117
+ "eval_precision": 0.8938053097345132,
118
+ "eval_recall": 0.909,
119
+ "eval_runtime": 4.4449,
120
+ "eval_samples_per_second": 12.149,
121
+ "eval_steps_per_second": 0.9,
122
+ "step": 900
123
+ },
124
+ {
125
+ "epoch": 100.0,
126
+ "learning_rate": 0.0,
127
+ "loss": 0.0098,
128
+ "step": 1000
129
+ },
130
+ {
131
+ "epoch": 100.0,
132
+ "eval_accuracy": 0.8330271015158475,
133
+ "eval_f1": 0.9077802634849614,
134
+ "eval_loss": 1.1164220571517944,
135
+ "eval_precision": 0.9026198714780029,
136
+ "eval_recall": 0.913,
137
+ "eval_runtime": 4.533,
138
+ "eval_samples_per_second": 11.913,
139
+ "eval_steps_per_second": 0.882,
140
+ "step": 1000
141
+ },
142
+ {
143
+ "epoch": 100.0,
144
+ "step": 1000,
145
+ "total_flos": 3954080148480000.0,
146
+ "train_loss": 0.12633917331695557,
147
+ "train_runtime": 1653.606,
148
+ "train_samples_per_second": 9.676,
149
+ "train_steps_per_second": 0.605
150
+ }
151
+ ],
152
+ "max_steps": 1000,
153
+ "num_train_epochs": 100,
154
+ "total_flos": 3954080148480000.0,
155
+ "trial_name": null,
156
+ "trial_params": null
157
+ }