RohanK447 committed on
Commit
fcf861f
1 Parent(s): 3fbb56e

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 10.0,
3
  "eval_accuracy": 1.0,
4
  "eval_loss": 0.5404492020606995,
5
  "eval_runtime": 0.0787,
6
  "eval_samples_per_second": 50.832,
7
  "eval_steps_per_second": 12.708,
8
- "total_flos": 8699596145049600.0,
9
- "train_loss": 0.20386319160461425,
10
- "train_runtime": 41.2868,
11
- "train_samples_per_second": 8.477,
12
- "train_steps_per_second": 0.242
13
  }
 
1
  {
2
+ "epoch": 20.0,
3
  "eval_accuracy": 1.0,
4
  "eval_loss": 0.5404492020606995,
5
  "eval_runtime": 0.0787,
6
  "eval_samples_per_second": 50.832,
7
  "eval_steps_per_second": 12.708,
8
+ "total_flos": 1.73991922900992e+16,
9
+ "train_loss": 0.15340265035629272,
10
+ "train_runtime": 48.7906,
11
+ "train_samples_per_second": 14.347,
12
+ "train_steps_per_second": 0.41
13
  }
runs/Sep06_02-49-21_8a3aa9d02c1c/1662432936.4683797/events.out.tfevents.1662432936.8a3aa9d02c1c.69.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5165775fa9b52edd356ac81b99b9edbbc5a5d992f56842535f9287a290c719c
3
+ size 5494
runs/Sep06_02-49-21_8a3aa9d02c1c/events.out.tfevents.1662432936.8a3aa9d02c1c.69.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c39f49f7b23d1e894bff63ace3a6f02330eef95725f434cea471aeb41ea81cd9
3
+ size 4317
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "total_flos": 8699596145049600.0,
4
- "train_loss": 0.20386319160461425,
5
- "train_runtime": 41.2868,
6
- "train_samples_per_second": 8.477,
7
- "train_steps_per_second": 0.242
8
  }
 
1
  {
2
+ "epoch": 20.0,
3
+ "total_flos": 1.73991922900992e+16,
4
+ "train_loss": 0.15340265035629272,
5
+ "train_runtime": 48.7906,
6
+ "train_samples_per_second": 14.347,
7
+ "train_steps_per_second": 0.41
8
  }
trainer_state.json CHANGED
@@ -1,121 +1,217 @@
1
  {
2
- "best_metric": 1.0,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-vosap/checkpoint-1",
4
- "epoch": 10.0,
5
- "global_step": 10,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 1.0,
13
- "eval_loss": 0.5404492020606995,
14
- "eval_runtime": 0.0625,
15
- "eval_samples_per_second": 64.034,
16
- "eval_steps_per_second": 16.008,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 2.0,
21
- "eval_accuracy": 1.0,
22
- "eval_loss": 0.4876060485839844,
23
- "eval_runtime": 0.0737,
24
- "eval_samples_per_second": 54.286,
25
- "eval_steps_per_second": 13.571,
26
  "step": 2
27
  },
28
  {
29
  "epoch": 3.0,
30
- "eval_accuracy": 1.0,
31
- "eval_loss": 0.44556379318237305,
32
- "eval_runtime": 0.0672,
33
- "eval_samples_per_second": 59.503,
34
- "eval_steps_per_second": 14.876,
35
  "step": 3
36
  },
37
  {
38
  "epoch": 4.0,
39
- "eval_accuracy": 1.0,
40
- "eval_loss": 0.41716501116752625,
41
- "eval_runtime": 0.0654,
42
- "eval_samples_per_second": 61.169,
43
- "eval_steps_per_second": 15.292,
44
  "step": 4
45
  },
46
  {
47
  "epoch": 5.0,
48
- "eval_accuracy": 1.0,
49
- "eval_loss": 0.3770451843738556,
50
- "eval_runtime": 0.0686,
51
- "eval_samples_per_second": 58.32,
52
- "eval_steps_per_second": 14.58,
53
  "step": 5
54
  },
55
  {
56
  "epoch": 6.0,
57
- "eval_accuracy": 1.0,
58
- "eval_loss": 0.3442598283290863,
59
- "eval_runtime": 0.0676,
60
- "eval_samples_per_second": 59.13,
61
- "eval_steps_per_second": 14.783,
62
  "step": 6
63
  },
64
  {
65
  "epoch": 7.0,
66
- "eval_accuracy": 1.0,
67
- "eval_loss": 0.32264935970306396,
68
- "eval_runtime": 0.0634,
69
- "eval_samples_per_second": 63.066,
70
- "eval_steps_per_second": 15.767,
71
  "step": 7
72
  },
73
  {
74
  "epoch": 8.0,
75
- "eval_accuracy": 1.0,
76
- "eval_loss": 0.3132918179035187,
77
- "eval_runtime": 0.0661,
78
- "eval_samples_per_second": 60.478,
79
- "eval_steps_per_second": 15.12,
80
  "step": 8
81
  },
82
  {
83
  "epoch": 9.0,
84
- "eval_accuracy": 1.0,
85
- "eval_loss": 0.30815836787223816,
86
- "eval_runtime": 0.0661,
87
- "eval_samples_per_second": 60.509,
88
- "eval_steps_per_second": 15.127,
89
  "step": 9
90
  },
91
  {
92
  "epoch": 10.0,
93
- "learning_rate": 0.0,
94
- "loss": 0.2039,
95
  "step": 10
96
  },
97
  {
98
  "epoch": 10.0,
99
- "eval_accuracy": 1.0,
100
- "eval_loss": 0.30541735887527466,
101
- "eval_runtime": 0.0689,
102
- "eval_samples_per_second": 58.029,
103
- "eval_steps_per_second": 14.507,
104
  "step": 10
105
  },
106
  {
107
- "epoch": 10.0,
108
- "step": 10,
109
- "total_flos": 8699596145049600.0,
110
- "train_loss": 0.20386319160461425,
111
- "train_runtime": 41.2868,
112
- "train_samples_per_second": 8.477,
113
- "train_steps_per_second": 0.242
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
114
  }
115
  ],
116
- "max_steps": 10,
117
- "num_train_epochs": 10,
118
- "total_flos": 8699596145049600.0,
119
  "trial_name": null,
120
  "trial_params": null
121
  }
 
1
  {
2
+ "best_metric": 0.75,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-vosap/checkpoint-11",
4
+ "epoch": 20.0,
5
+ "global_step": 20,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.5,
13
+ "eval_loss": 0.6076761484146118,
14
+ "eval_runtime": 0.0775,
15
+ "eval_samples_per_second": 51.64,
16
+ "eval_steps_per_second": 12.91,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 2.0,
21
+ "eval_accuracy": 0.5,
22
+ "eval_loss": 0.5957173705101013,
23
+ "eval_runtime": 0.0821,
24
+ "eval_samples_per_second": 48.732,
25
+ "eval_steps_per_second": 12.183,
26
  "step": 2
27
  },
28
  {
29
  "epoch": 3.0,
30
+ "eval_accuracy": 0.5,
31
+ "eval_loss": 0.6553595662117004,
32
+ "eval_runtime": 0.0814,
33
+ "eval_samples_per_second": 49.141,
34
+ "eval_steps_per_second": 12.285,
35
  "step": 3
36
  },
37
  {
38
  "epoch": 4.0,
39
+ "eval_accuracy": 0.25,
40
+ "eval_loss": 0.7486120462417603,
41
+ "eval_runtime": 0.092,
42
+ "eval_samples_per_second": 43.462,
43
+ "eval_steps_per_second": 10.866,
44
  "step": 4
45
  },
46
  {
47
  "epoch": 5.0,
48
+ "eval_accuracy": 0.25,
49
+ "eval_loss": 0.8207159042358398,
50
+ "eval_runtime": 0.0849,
51
+ "eval_samples_per_second": 47.103,
52
+ "eval_steps_per_second": 11.776,
53
  "step": 5
54
  },
55
  {
56
  "epoch": 6.0,
57
+ "eval_accuracy": 0.25,
58
+ "eval_loss": 0.8213469386100769,
59
+ "eval_runtime": 0.0786,
60
+ "eval_samples_per_second": 50.921,
61
+ "eval_steps_per_second": 12.73,
62
  "step": 6
63
  },
64
  {
65
  "epoch": 7.0,
66
+ "eval_accuracy": 0.5,
67
+ "eval_loss": 0.7957496643066406,
68
+ "eval_runtime": 0.1037,
69
+ "eval_samples_per_second": 38.557,
70
+ "eval_steps_per_second": 9.639,
71
  "step": 7
72
  },
73
  {
74
  "epoch": 8.0,
75
+ "eval_accuracy": 0.5,
76
+ "eval_loss": 0.7098022699356079,
77
+ "eval_runtime": 0.0873,
78
+ "eval_samples_per_second": 45.794,
79
+ "eval_steps_per_second": 11.449,
80
  "step": 8
81
  },
82
  {
83
  "epoch": 9.0,
84
+ "eval_accuracy": 0.5,
85
+ "eval_loss": 0.6372093558311462,
86
+ "eval_runtime": 0.0953,
87
+ "eval_samples_per_second": 41.99,
88
+ "eval_steps_per_second": 10.497,
89
  "step": 9
90
  },
91
  {
92
  "epoch": 10.0,
93
+ "learning_rate": 2.777777777777778e-05,
94
+ "loss": 0.2113,
95
  "step": 10
96
  },
97
  {
98
  "epoch": 10.0,
99
+ "eval_accuracy": 0.5,
100
+ "eval_loss": 0.5358340740203857,
101
+ "eval_runtime": 0.085,
102
+ "eval_samples_per_second": 47.079,
103
+ "eval_steps_per_second": 11.77,
104
  "step": 10
105
  },
106
  {
107
+ "epoch": 11.0,
108
+ "eval_accuracy": 0.75,
109
+ "eval_loss": 0.48944157361984253,
110
+ "eval_runtime": 0.0964,
111
+ "eval_samples_per_second": 41.48,
112
+ "eval_steps_per_second": 10.37,
113
+ "step": 11
114
+ },
115
+ {
116
+ "epoch": 12.0,
117
+ "eval_accuracy": 0.75,
118
+ "eval_loss": 0.4506962299346924,
119
+ "eval_runtime": 0.111,
120
+ "eval_samples_per_second": 36.02,
121
+ "eval_steps_per_second": 9.005,
122
+ "step": 12
123
+ },
124
+ {
125
+ "epoch": 13.0,
126
+ "eval_accuracy": 0.75,
127
+ "eval_loss": 0.43113046884536743,
128
+ "eval_runtime": 0.0817,
129
+ "eval_samples_per_second": 48.933,
130
+ "eval_steps_per_second": 12.233,
131
+ "step": 13
132
+ },
133
+ {
134
+ "epoch": 14.0,
135
+ "eval_accuracy": 0.75,
136
+ "eval_loss": 0.4339416027069092,
137
+ "eval_runtime": 0.1033,
138
+ "eval_samples_per_second": 38.72,
139
+ "eval_steps_per_second": 9.68,
140
+ "step": 14
141
+ },
142
+ {
143
+ "epoch": 15.0,
144
+ "eval_accuracy": 0.75,
145
+ "eval_loss": 0.46003320813179016,
146
+ "eval_runtime": 0.0837,
147
+ "eval_samples_per_second": 47.81,
148
+ "eval_steps_per_second": 11.952,
149
+ "step": 15
150
+ },
151
+ {
152
+ "epoch": 16.0,
153
+ "eval_accuracy": 0.5,
154
+ "eval_loss": 0.49817201495170593,
155
+ "eval_runtime": 0.1026,
156
+ "eval_samples_per_second": 38.983,
157
+ "eval_steps_per_second": 9.746,
158
+ "step": 16
159
+ },
160
+ {
161
+ "epoch": 17.0,
162
+ "eval_accuracy": 0.5,
163
+ "eval_loss": 0.5298565626144409,
164
+ "eval_runtime": 0.0879,
165
+ "eval_samples_per_second": 45.53,
166
+ "eval_steps_per_second": 11.383,
167
+ "step": 17
168
+ },
169
+ {
170
+ "epoch": 18.0,
171
+ "eval_accuracy": 0.5,
172
+ "eval_loss": 0.5602237582206726,
173
+ "eval_runtime": 0.0988,
174
+ "eval_samples_per_second": 40.497,
175
+ "eval_steps_per_second": 10.124,
176
+ "step": 18
177
+ },
178
+ {
179
+ "epoch": 19.0,
180
+ "eval_accuracy": 0.5,
181
+ "eval_loss": 0.5776747465133667,
182
+ "eval_runtime": 0.0845,
183
+ "eval_samples_per_second": 47.319,
184
+ "eval_steps_per_second": 11.83,
185
+ "step": 19
186
+ },
187
+ {
188
+ "epoch": 20.0,
189
+ "learning_rate": 0.0,
190
+ "loss": 0.0955,
191
+ "step": 20
192
+ },
193
+ {
194
+ "epoch": 20.0,
195
+ "eval_accuracy": 0.5,
196
+ "eval_loss": 0.5813302993774414,
197
+ "eval_runtime": 0.101,
198
+ "eval_samples_per_second": 39.589,
199
+ "eval_steps_per_second": 9.897,
200
+ "step": 20
201
+ },
202
+ {
203
+ "epoch": 20.0,
204
+ "step": 20,
205
+ "total_flos": 1.73991922900992e+16,
206
+ "train_loss": 0.15340265035629272,
207
+ "train_runtime": 48.7906,
208
+ "train_samples_per_second": 14.347,
209
+ "train_steps_per_second": 0.41
210
  }
211
  ],
212
+ "max_steps": 20,
213
+ "num_train_epochs": 20,
214
+ "total_flos": 1.73991922900992e+16,
215
  "trial_name": null,
216
  "trial_params": null
217
  }