usamaaleem99tech commited on
Commit
214102c
1 Parent(s): 2b584c3

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 13.33,
3
- "total_flos": 8.7520382681131e+16,
4
- "train_loss": 0.4070509672164917,
5
- "train_runtime": 340.2477,
6
- "train_samples_per_second": 15.342,
7
- "train_steps_per_second": 0.059
8
  }
 
1
  {
2
+ "epoch": 8.89,
3
+ "total_flos": 5.786635923932774e+16,
4
+ "train_loss": 0.14985284606615704,
5
+ "train_runtime": 220.5615,
6
+ "train_samples_per_second": 11.833,
7
+ "train_steps_per_second": 0.272
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37f20549ae026562cafe99e6acb0d4f97265b244202f65647251001be890fc79
3
  size 110397937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4563d6972195df7e6376768904924263a6abee86a55392b526b72c4e46457d08
3
  size 110397937
runs/Jul23_10-21-56_00db9bc3da89/events.out.tfevents.1690108534.00db9bc3da89.10544.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aad00be1ecdf42cd008410747f842a33b4a7a7c6fe55a1aef7c86417e9d2f0cd
3
+ size 551
runs/Jul23_10-21-56_00db9bc3da89/events.out.tfevents.1690109486.00db9bc3da89.10544.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79441b3af117fc3be0399cd3b7b1feb061d83a94dd24dc8d9c5e78564c652000
3
+ size 5084
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 13.33,
3
- "total_flos": 8.7520382681131e+16,
4
- "train_loss": 0.4070509672164917,
5
- "train_runtime": 340.2477,
6
- "train_samples_per_second": 15.342,
7
- "train_steps_per_second": 0.059
8
  }
 
1
  {
2
+ "epoch": 8.89,
3
+ "total_flos": 5.786635923932774e+16,
4
+ "train_loss": 0.14985284606615704,
5
+ "train_runtime": 220.5615,
6
+ "train_samples_per_second": 11.833,
7
+ "train_steps_per_second": 0.272
8
  }
trainer_state.json CHANGED
@@ -1,163 +1,169 @@
1
  {
2
- "best_metric": 0.896551724137931,
3
- "best_model_checkpoint": "segformer-class-classWeights-augmentation/checkpoint-13",
4
- "epoch": 13.333333333333334,
5
- "global_step": 20,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 1.0,
12
- "eval_accuracy": 0.27586206896551724,
13
- "eval_loss": 1.1699918508529663,
14
- "eval_runtime": 1.1929,
15
- "eval_samples_per_second": 24.31,
16
- "eval_steps_per_second": 0.838,
17
- "step": 1
18
- },
19
- {
20
- "epoch": 2.0,
21
- "eval_accuracy": 0.3793103448275862,
22
- "eval_loss": 1.0350514650344849,
23
- "eval_runtime": 0.7976,
24
- "eval_samples_per_second": 36.36,
25
- "eval_steps_per_second": 1.254,
26
- "step": 3
27
- },
28
- {
29
- "epoch": 3.0,
30
- "eval_accuracy": 0.5172413793103449,
31
- "eval_loss": 0.9730662107467651,
32
- "eval_runtime": 0.8014,
33
- "eval_samples_per_second": 36.186,
34
- "eval_steps_per_second": 1.248,
35
- "step": 5
36
- },
37
- {
38
- "epoch": 4.0,
39
- "eval_accuracy": 0.5172413793103449,
40
- "eval_loss": 0.9361577033996582,
41
- "eval_runtime": 1.0363,
42
- "eval_samples_per_second": 27.984,
43
- "eval_steps_per_second": 0.965,
44
  "step": 6
45
  },
46
  {
47
- "epoch": 5.0,
48
- "eval_accuracy": 0.5517241379310345,
49
- "eval_loss": 0.8889826536178589,
50
- "eval_runtime": 0.7918,
51
- "eval_samples_per_second": 36.624,
52
- "eval_steps_per_second": 1.263,
53
- "step": 7
54
- },
55
- {
56
- "epoch": 6.0,
57
- "eval_accuracy": 0.7586206896551724,
58
- "eval_loss": 0.7596346735954285,
59
- "eval_runtime": 0.8269,
60
- "eval_samples_per_second": 35.071,
61
- "eval_steps_per_second": 1.209,
62
- "step": 9
63
- },
64
- {
65
- "epoch": 6.67,
66
- "learning_rate": 2.777777777777778e-05,
67
- "loss": 0.5024,
68
  "step": 10
69
  },
70
  {
71
- "epoch": 7.0,
72
- "eval_accuracy": 0.8620689655172413,
73
- "eval_loss": 0.6531320810317993,
74
- "eval_runtime": 0.7953,
75
- "eval_samples_per_second": 36.466,
76
- "eval_steps_per_second": 1.257,
77
- "step": 11
78
- },
79
- {
80
- "epoch": 8.0,
81
- "eval_accuracy": 0.8620689655172413,
82
- "eval_loss": 0.6170477271080017,
83
- "eval_runtime": 1.0429,
84
- "eval_samples_per_second": 27.806,
85
- "eval_steps_per_second": 0.959,
86
- "step": 12
87
- },
88
- {
89
- "epoch": 9.0,
90
- "eval_accuracy": 0.896551724137931,
91
- "eval_loss": 0.5878463387489319,
92
- "eval_runtime": 0.7888,
93
- "eval_samples_per_second": 36.767,
94
- "eval_steps_per_second": 1.268,
95
  "step": 13
96
  },
97
  {
98
- "epoch": 10.0,
99
- "eval_accuracy": 0.8620689655172413,
100
- "eval_loss": 0.5418170094490051,
101
- "eval_runtime": 0.8158,
102
- "eval_samples_per_second": 35.546,
103
- "eval_steps_per_second": 1.226,
104
- "step": 15
105
- },
106
- {
107
- "epoch": 11.0,
108
- "eval_accuracy": 0.8620689655172413,
109
- "eval_loss": 0.5121886730194092,
110
- "eval_runtime": 0.8148,
111
- "eval_samples_per_second": 35.592,
112
- "eval_steps_per_second": 1.227,
113
- "step": 17
114
- },
115
- {
116
- "epoch": 12.0,
117
- "eval_accuracy": 0.8620689655172413,
118
- "eval_loss": 0.5020919442176819,
119
- "eval_runtime": 1.0894,
120
- "eval_samples_per_second": 26.62,
121
- "eval_steps_per_second": 0.918,
122
- "step": 18
123
- },
124
- {
125
- "epoch": 13.0,
126
- "eval_accuracy": 0.8620689655172413,
127
- "eval_loss": 0.4927540421485901,
128
- "eval_runtime": 0.8053,
129
- "eval_samples_per_second": 36.014,
130
- "eval_steps_per_second": 1.242,
131
- "step": 19
132
  },
133
  {
134
- "epoch": 13.33,
135
- "learning_rate": 0.0,
136
- "loss": 0.3117,
 
 
 
 
 
 
137
  "step": 20
138
  },
139
  {
140
- "epoch": 13.33,
141
- "eval_accuracy": 0.8620689655172413,
142
- "eval_loss": 0.4871620237827301,
143
- "eval_runtime": 0.7941,
144
- "eval_samples_per_second": 36.521,
145
- "eval_steps_per_second": 1.259,
146
- "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
147
  },
148
  {
149
- "epoch": 13.33,
150
- "step": 20,
151
- "total_flos": 8.7520382681131e+16,
152
- "train_loss": 0.4070509672164917,
153
- "train_runtime": 340.2477,
154
- "train_samples_per_second": 15.342,
155
- "train_steps_per_second": 0.059
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
156
  }
157
  ],
158
- "max_steps": 20,
159
- "num_train_epochs": 20,
160
- "total_flos": 8.7520382681131e+16,
161
  "trial_name": null,
162
  "trial_params": null
163
  }
 
1
  {
2
+ "best_metric": 1.0,
3
+ "best_model_checkpoint": "segformer-class-classWeights-augmentation/checkpoint-6",
4
+ "epoch": 8.88888888888889,
5
+ "global_step": 60,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.89,
12
+ "eval_accuracy": 1.0,
13
+ "eval_f1": 1.0,
14
+ "eval_loss": 0.04543434828519821,
15
+ "eval_precision": 1.0,
16
+ "eval_recall": 1.0,
17
+ "eval_runtime": 0.9849,
18
+ "eval_samples_per_second": 29.446,
19
+ "eval_steps_per_second": 3.046,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20
  "step": 6
21
  },
22
  {
23
+ "epoch": 1.48,
24
+ "learning_rate": 1.992337164750958e-05,
25
+ "loss": 0.1558,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  "step": 10
27
  },
28
  {
29
+ "epoch": 1.93,
30
+ "eval_accuracy": 0.9655172413793104,
31
+ "eval_f1": 0.964683592269799,
32
+ "eval_loss": 0.08155026286840439,
33
+ "eval_precision": 0.9674329501915708,
34
+ "eval_recall": 0.9655172413793104,
35
+ "eval_runtime": 0.7233,
36
+ "eval_samples_per_second": 40.093,
37
+ "eval_steps_per_second": 4.148,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  "step": 13
39
  },
40
  {
41
+ "epoch": 2.96,
42
+ "learning_rate": 1.9846743295019158e-05,
43
+ "loss": 0.1727,
44
+ "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
45
  },
46
  {
47
+ "epoch": 2.96,
48
+ "eval_accuracy": 0.9655172413793104,
49
+ "eval_f1": 0.964683592269799,
50
+ "eval_loss": 0.07752516865730286,
51
+ "eval_precision": 0.9674329501915708,
52
+ "eval_recall": 0.9655172413793104,
53
+ "eval_runtime": 0.9304,
54
+ "eval_samples_per_second": 31.17,
55
+ "eval_steps_per_second": 3.225,
56
  "step": 20
57
  },
58
  {
59
+ "epoch": 4.0,
60
+ "eval_accuracy": 0.9655172413793104,
61
+ "eval_f1": 0.964683592269799,
62
+ "eval_loss": 0.04428544268012047,
63
+ "eval_precision": 0.9674329501915708,
64
+ "eval_recall": 0.9655172413793104,
65
+ "eval_runtime": 0.7055,
66
+ "eval_samples_per_second": 41.107,
67
+ "eval_steps_per_second": 4.252,
68
+ "step": 27
69
+ },
70
+ {
71
+ "epoch": 4.44,
72
+ "learning_rate": 1.9770114942528737e-05,
73
+ "loss": 0.1299,
74
+ "step": 30
75
+ },
76
+ {
77
+ "epoch": 4.89,
78
+ "eval_accuracy": 0.9655172413793104,
79
+ "eval_f1": 0.964683592269799,
80
+ "eval_loss": 0.053459376096725464,
81
+ "eval_precision": 0.9674329501915708,
82
+ "eval_recall": 0.9655172413793104,
83
+ "eval_runtime": 0.7107,
84
+ "eval_samples_per_second": 40.805,
85
+ "eval_steps_per_second": 4.221,
86
+ "step": 33
87
+ },
88
+ {
89
+ "epoch": 5.93,
90
+ "learning_rate": 1.9693486590038315e-05,
91
+ "loss": 0.1808,
92
+ "step": 40
93
+ },
94
+ {
95
+ "epoch": 5.93,
96
+ "eval_accuracy": 0.9655172413793104,
97
+ "eval_f1": 0.964683592269799,
98
+ "eval_loss": 0.029818205162882805,
99
+ "eval_precision": 0.9674329501915708,
100
+ "eval_recall": 0.9655172413793104,
101
+ "eval_runtime": 0.932,
102
+ "eval_samples_per_second": 31.115,
103
+ "eval_steps_per_second": 3.219,
104
+ "step": 40
105
+ },
106
+ {
107
+ "epoch": 6.96,
108
+ "eval_accuracy": 1.0,
109
+ "eval_f1": 1.0,
110
+ "eval_loss": 0.019522428512573242,
111
+ "eval_precision": 1.0,
112
+ "eval_recall": 1.0,
113
+ "eval_runtime": 0.699,
114
+ "eval_samples_per_second": 41.486,
115
+ "eval_steps_per_second": 4.292,
116
+ "step": 47
117
+ },
118
+ {
119
+ "epoch": 7.41,
120
+ "learning_rate": 1.9616858237547893e-05,
121
+ "loss": 0.1406,
122
+ "step": 50
123
  },
124
  {
125
+ "epoch": 8.0,
126
+ "eval_accuracy": 0.9655172413793104,
127
+ "eval_f1": 0.964683592269799,
128
+ "eval_loss": 0.05264897271990776,
129
+ "eval_precision": 0.9674329501915708,
130
+ "eval_recall": 0.9655172413793104,
131
+ "eval_runtime": 0.6927,
132
+ "eval_samples_per_second": 41.863,
133
+ "eval_steps_per_second": 4.331,
134
+ "step": 54
135
+ },
136
+ {
137
+ "epoch": 8.89,
138
+ "learning_rate": 1.9540229885057475e-05,
139
+ "loss": 0.1193,
140
+ "step": 60
141
+ },
142
+ {
143
+ "epoch": 8.89,
144
+ "eval_accuracy": 0.9655172413793104,
145
+ "eval_f1": 0.964683592269799,
146
+ "eval_loss": 0.14525191485881805,
147
+ "eval_precision": 0.9674329501915708,
148
+ "eval_recall": 0.9655172413793104,
149
+ "eval_runtime": 0.9816,
150
+ "eval_samples_per_second": 29.543,
151
+ "eval_steps_per_second": 3.056,
152
+ "step": 60
153
+ },
154
+ {
155
+ "epoch": 8.89,
156
+ "step": 60,
157
+ "total_flos": 5.786635923932774e+16,
158
+ "train_loss": 0.14985284606615704,
159
+ "train_runtime": 220.5615,
160
+ "train_samples_per_second": 11.833,
161
+ "train_steps_per_second": 0.272
162
  }
163
  ],
164
+ "max_steps": 60,
165
+ "num_train_epochs": 10,
166
+ "total_flos": 5.786635923932774e+16,
167
  "trial_name": null,
168
  "trial_params": null
169
  }