Franman committed on
Commit
95cb9ca
1 Parent(s): 6a7ace6

End of training

Browse files
Files changed (5) hide show
  1. README.md +1 -1
  2. all_results.json +10 -10
  3. eval_results.json +6 -6
  4. train_results.json +5 -5
  5. trainer_state.json +128 -92
README.md CHANGED
@@ -17,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [microsoft/beit-base-patch16-224](https://huggingface.co/microsoft/beit-base-patch16-224) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.0675
21
  - Accuracy: 0.9843
22
 
23
  ## Model description
 
17
 
18
  This model is a fine-tuned version of [microsoft/beit-base-patch16-224](https://huggingface.co/microsoft/beit-base-patch16-224) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.0739
21
  - Accuracy: 0.9843
22
 
23
  ## Model description
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 7.47,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.015091076493263245,
5
- "eval_runtime": 12.3295,
6
- "eval_samples_per_second": 8.516,
7
- "eval_steps_per_second": 0.324,
8
- "train_loss": 0.4356716935123716,
9
- "train_runtime": 2360.1881,
10
- "train_samples_per_second": 3.183,
11
- "train_steps_per_second": 0.024
12
  }
 
1
  {
2
+ "epoch": 7.7,
3
+ "eval_accuracy": 0.9842931937172775,
4
+ "eval_loss": 0.07386188954114914,
5
+ "eval_runtime": 26.1219,
6
+ "eval_samples_per_second": 7.312,
7
+ "eval_steps_per_second": 0.23,
8
+ "train_loss": 0.5548124955250666,
9
+ "train_runtime": 4572.4853,
10
+ "train_samples_per_second": 3.004,
11
+ "train_steps_per_second": 0.023
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 7.47,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.015091076493263245,
5
- "eval_runtime": 12.3295,
6
- "eval_samples_per_second": 8.516,
7
- "eval_steps_per_second": 0.324
8
  }
 
1
  {
2
+ "epoch": 7.7,
3
+ "eval_accuracy": 0.9842931937172775,
4
+ "eval_loss": 0.07386188954114914,
5
+ "eval_runtime": 26.1219,
6
+ "eval_samples_per_second": 7.312,
7
+ "eval_steps_per_second": 0.23
8
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 7.47,
3
- "train_loss": 0.4356716935123716,
4
- "train_runtime": 2360.1881,
5
- "train_samples_per_second": 3.183,
6
- "train_steps_per_second": 0.024
7
  }
 
1
  {
2
+ "epoch": 7.7,
3
+ "train_loss": 0.5548124955250666,
4
+ "train_runtime": 4572.4853,
5
+ "train_samples_per_second": 3.004,
6
+ "train_steps_per_second": 0.023
7
  }
trainer_state.json CHANGED
@@ -1,142 +1,178 @@
1
  {
2
- "best_metric": 1.0,
3
- "best_model_checkpoint": "model/checkpoint-30",
4
- "epoch": 7.466666666666667,
5
  "eval_steps": 500,
6
- "global_step": 56,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.93,
13
- "eval_accuracy": 0.6190476190476191,
14
- "eval_loss": 0.5468170046806335,
15
- "eval_runtime": 12.9206,
16
- "eval_samples_per_second": 8.127,
17
- "eval_steps_per_second": 0.31,
18
- "step": 7
19
  },
20
  {
21
- "epoch": 1.07,
22
- "learning_rate": 0.00048,
23
- "loss": 1.0237,
24
- "step": 8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  },
26
  {
27
  "epoch": 2.0,
28
- "eval_accuracy": 0.9619047619047619,
29
- "eval_loss": 0.11131703853607178,
30
- "eval_runtime": 12.3741,
31
- "eval_samples_per_second": 8.485,
32
- "eval_steps_per_second": 0.323,
33
- "step": 15
34
  },
35
  {
36
- "epoch": 2.13,
37
- "learning_rate": 0.0004,
38
- "loss": 0.5329,
39
- "step": 16
40
  },
41
  {
42
- "epoch": 2.93,
43
- "eval_accuracy": 0.9714285714285714,
44
- "eval_loss": 0.046230871230363846,
45
- "eval_runtime": 12.3758,
46
- "eval_samples_per_second": 8.484,
47
- "eval_steps_per_second": 0.323,
48
- "step": 22
49
  },
50
  {
51
- "epoch": 3.2,
52
- "learning_rate": 0.00032,
53
- "loss": 0.335,
54
- "step": 24
 
 
 
 
 
 
 
 
 
55
  },
56
  {
57
  "epoch": 4.0,
58
- "eval_accuracy": 1.0,
59
- "eval_loss": 0.015091076493263245,
60
- "eval_runtime": 12.4003,
61
- "eval_samples_per_second": 8.468,
62
- "eval_steps_per_second": 0.323,
63
- "step": 30
64
  },
65
  {
66
- "epoch": 4.27,
67
- "learning_rate": 0.00024,
68
- "loss": 0.3359,
69
- "step": 32
70
  },
71
  {
72
- "epoch": 4.93,
73
- "eval_accuracy": 0.9428571428571428,
74
- "eval_loss": 0.1429169476032257,
75
- "eval_runtime": 12.3608,
76
- "eval_samples_per_second": 8.495,
77
- "eval_steps_per_second": 0.324,
78
- "step": 37
 
 
 
 
 
 
79
  },
80
  {
81
  "epoch": 5.33,
82
- "learning_rate": 0.00016,
83
- "loss": 0.2794,
84
- "step": 40
 
 
 
 
 
 
85
  },
86
  {
87
  "epoch": 6.0,
88
- "eval_accuracy": 0.9619047619047619,
89
- "eval_loss": 0.060580089688301086,
90
- "eval_runtime": 12.4196,
91
- "eval_samples_per_second": 8.454,
92
- "eval_steps_per_second": 0.322,
93
- "step": 45
94
  },
95
  {
96
- "epoch": 6.4,
97
- "learning_rate": 8e-05,
98
- "loss": 0.2937,
99
- "step": 48
100
  },
101
  {
102
- "epoch": 6.93,
103
- "eval_accuracy": 0.9904761904761905,
104
- "eval_loss": 0.01593722589313984,
105
- "eval_runtime": 12.3709,
106
- "eval_samples_per_second": 8.488,
107
- "eval_steps_per_second": 0.323,
108
- "step": 52
109
  },
110
  {
111
- "epoch": 7.47,
 
 
 
 
 
 
112
  "learning_rate": 0.0,
113
- "loss": 0.249,
114
- "step": 56
115
  },
116
  {
117
- "epoch": 7.47,
118
- "eval_accuracy": 0.9904761904761905,
119
- "eval_loss": 0.01840730383992195,
120
- "eval_runtime": 12.4229,
121
- "eval_samples_per_second": 8.452,
122
- "eval_steps_per_second": 0.322,
123
- "step": 56
124
  },
125
  {
126
- "epoch": 7.47,
127
- "step": 56,
128
- "total_flos": 5.438387167052636e+17,
129
- "train_loss": 0.4356716935123716,
130
- "train_runtime": 2360.1881,
131
- "train_samples_per_second": 3.183,
132
- "train_steps_per_second": 0.024
133
  }
134
  ],
135
  "logging_steps": 8,
136
- "max_steps": 56,
137
  "num_train_epochs": 8,
138
  "save_steps": 500,
139
- "total_flos": 5.438387167052636e+17,
140
  "trial_name": null,
141
  "trial_params": null
142
  }
 
1
  {
2
+ "best_metric": 0.9842931937172775,
3
+ "best_model_checkpoint": "model/checkpoint-94",
4
+ "epoch": 7.703703703703704,
5
  "eval_steps": 500,
6
+ "global_step": 104,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.59,
13
+ "learning_rate": 0.00036363636363636367,
14
+ "loss": 1.0999,
15
+ "step": 8
 
 
 
16
  },
17
  {
18
+ "epoch": 0.96,
19
+ "eval_accuracy": 0.643979057591623,
20
+ "eval_loss": 0.7986512780189514,
21
+ "eval_runtime": 28.581,
22
+ "eval_samples_per_second": 6.683,
23
+ "eval_steps_per_second": 0.21,
24
+ "step": 13
25
+ },
26
+ {
27
+ "epoch": 1.19,
28
+ "learning_rate": 0.0004731182795698925,
29
+ "loss": 1.0029,
30
+ "step": 16
31
+ },
32
+ {
33
+ "epoch": 1.78,
34
+ "learning_rate": 0.00043010752688172043,
35
+ "loss": 0.6342,
36
+ "step": 24
37
  },
38
  {
39
  "epoch": 2.0,
40
+ "eval_accuracy": 0.9424083769633508,
41
+ "eval_loss": 0.24137574434280396,
42
+ "eval_runtime": 26.3088,
43
+ "eval_samples_per_second": 7.26,
44
+ "eval_steps_per_second": 0.228,
45
+ "step": 27
46
  },
47
  {
48
+ "epoch": 2.37,
49
+ "learning_rate": 0.0003870967741935484,
50
+ "loss": 0.5732,
51
+ "step": 32
52
  },
53
  {
54
+ "epoch": 2.96,
55
+ "learning_rate": 0.0003440860215053764,
56
+ "loss": 0.4882,
57
+ "step": 40
 
 
 
58
  },
59
  {
60
+ "epoch": 2.96,
61
+ "eval_accuracy": 0.9633507853403142,
62
+ "eval_loss": 0.16461053490638733,
63
+ "eval_runtime": 26.318,
64
+ "eval_samples_per_second": 7.257,
65
+ "eval_steps_per_second": 0.228,
66
+ "step": 40
67
+ },
68
+ {
69
+ "epoch": 3.56,
70
+ "learning_rate": 0.0003010752688172043,
71
+ "loss": 0.463,
72
+ "step": 48
73
  },
74
  {
75
  "epoch": 4.0,
76
+ "eval_accuracy": 0.9424083769633508,
77
+ "eval_loss": 0.25284695625305176,
78
+ "eval_runtime": 26.2832,
79
+ "eval_samples_per_second": 7.267,
80
+ "eval_steps_per_second": 0.228,
81
+ "step": 54
82
  },
83
  {
84
+ "epoch": 4.15,
85
+ "learning_rate": 0.00025806451612903227,
86
+ "loss": 0.4286,
87
+ "step": 56
88
  },
89
  {
90
+ "epoch": 4.74,
91
+ "learning_rate": 0.00021505376344086021,
92
+ "loss": 0.4609,
93
+ "step": 64
94
+ },
95
+ {
96
+ "epoch": 4.96,
97
+ "eval_accuracy": 0.9790575916230366,
98
+ "eval_loss": 0.11301162838935852,
99
+ "eval_runtime": 26.3727,
100
+ "eval_samples_per_second": 7.242,
101
+ "eval_steps_per_second": 0.228,
102
+ "step": 67
103
  },
104
  {
105
  "epoch": 5.33,
106
+ "learning_rate": 0.0001720430107526882,
107
+ "loss": 0.4636,
108
+ "step": 72
109
+ },
110
+ {
111
+ "epoch": 5.93,
112
+ "learning_rate": 0.00012903225806451613,
113
+ "loss": 0.4251,
114
+ "step": 80
115
  },
116
  {
117
  "epoch": 6.0,
118
+ "eval_accuracy": 0.9633507853403142,
119
+ "eval_loss": 0.13039104640483856,
120
+ "eval_runtime": 26.3002,
121
+ "eval_samples_per_second": 7.262,
122
+ "eval_steps_per_second": 0.228,
123
+ "step": 81
124
  },
125
  {
126
+ "epoch": 6.52,
127
+ "learning_rate": 8.60215053763441e-05,
128
+ "loss": 0.3802,
129
+ "step": 88
130
  },
131
  {
132
+ "epoch": 6.96,
133
+ "eval_accuracy": 0.9842931937172775,
134
+ "eval_loss": 0.07386188954114914,
135
+ "eval_runtime": 26.267,
136
+ "eval_samples_per_second": 7.271,
137
+ "eval_steps_per_second": 0.228,
138
+ "step": 94
139
  },
140
  {
141
+ "epoch": 7.11,
142
+ "learning_rate": 4.301075268817205e-05,
143
+ "loss": 0.378,
144
+ "step": 96
145
+ },
146
+ {
147
+ "epoch": 7.7,
148
  "learning_rate": 0.0,
149
+ "loss": 0.4147,
150
+ "step": 104
151
  },
152
  {
153
+ "epoch": 7.7,
154
+ "eval_accuracy": 0.9842931937172775,
155
+ "eval_loss": 0.06754852086305618,
156
+ "eval_runtime": 26.3749,
157
+ "eval_samples_per_second": 7.242,
158
+ "eval_steps_per_second": 0.227,
159
+ "step": 104
160
  },
161
  {
162
+ "epoch": 7.7,
163
+ "step": 104,
164
+ "total_flos": 1.0251773186064077e+18,
165
+ "train_loss": 0.5548124955250666,
166
+ "train_runtime": 4572.4853,
167
+ "train_samples_per_second": 3.004,
168
+ "train_steps_per_second": 0.023
169
  }
170
  ],
171
  "logging_steps": 8,
172
+ "max_steps": 104,
173
  "num_train_epochs": 8,
174
  "save_steps": 500,
175
+ "total_flos": 1.0251773186064077e+18,
176
  "trial_name": null,
177
  "trial_params": null
178
  }