jayanthspratap commited on
Commit
bdea67f
1 Parent(s): 8d2f41e

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -6,8 +6,8 @@
6
  "eval_samples_per_second": 86.013,
7
  "eval_steps_per_second": 21.503,
8
  "total_flos": 1.583041221586944e+16,
9
- "train_loss": 0.4837726652622223,
10
- "train_runtime": 41.4007,
11
- "train_samples_per_second": 15.217,
12
- "train_steps_per_second": 0.966
13
  }
 
6
  "eval_samples_per_second": 86.013,
7
  "eval_steps_per_second": 21.503,
8
  "total_flos": 1.583041221586944e+16,
9
+ "train_loss": 0.6278304576873779,
10
+ "train_runtime": 51.4123,
11
+ "train_samples_per_second": 12.254,
12
+ "train_steps_per_second": 0.778
13
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76aac07035d0bf55a59bc86f0420629de8ae74dc673ea5ea8e907d1ed9d7fc31
3
  size 111349029
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:727d603ceea024febde4faa0e6f92c89f481fbe52fa4402e540dc402c70a5baf
3
  size 111349029
runs/May27_21-05-28_0922109e5cf6/1685221531.0906715/events.out.tfevents.1685221531.0922109e5cf6.8213.25 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a36c00322078dda0181539359e2e4372e180f9004ea74d928274fc0a74d5dfe7
3
+ size 5949
runs/May27_21-05-28_0922109e5cf6/events.out.tfevents.1685221531.0922109e5cf6.8213.24 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48d016292dd9e2c7916bc06dd1c00bb224c4381a5d804f3d62344be44208a527
3
+ size 4531
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
  "total_flos": 1.583041221586944e+16,
4
- "train_loss": 0.4837726652622223,
5
- "train_runtime": 41.4007,
6
- "train_samples_per_second": 15.217,
7
- "train_steps_per_second": 0.966
8
  }
 
1
  {
2
  "epoch": 10.0,
3
  "total_flos": 1.583041221586944e+16,
4
+ "train_loss": 0.6278304576873779,
5
+ "train_runtime": 51.4123,
6
+ "train_samples_per_second": 12.254,
7
+ "train_steps_per_second": 0.778
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.875,
3
- "best_model_checkpoint": "convnext-tiny-224-drfx-surgery-classifier/checkpoint-8",
4
  "epoch": 10.0,
5
  "global_step": 40,
6
  "is_hyper_param_search": false,
@@ -9,126 +9,126 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 0.6875,
13
- "eval_loss": 0.6467709541320801,
14
- "eval_runtime": 0.1396,
15
- "eval_samples_per_second": 114.574,
16
- "eval_steps_per_second": 28.643,
17
  "step": 4
18
  },
19
  {
20
  "epoch": 2.0,
21
- "eval_accuracy": 0.875,
22
- "eval_loss": 0.4960244596004486,
23
- "eval_runtime": 0.2812,
24
- "eval_samples_per_second": 56.9,
25
- "eval_steps_per_second": 14.225,
26
  "step": 8
27
  },
28
  {
29
  "epoch": 2.5,
30
- "learning_rate": 4.166666666666667e-05,
31
- "loss": 0.6461,
32
  "step": 10
33
  },
34
  {
35
  "epoch": 3.0,
36
- "eval_accuracy": 0.875,
37
- "eval_loss": 0.4355894923210144,
38
- "eval_runtime": 0.2068,
39
- "eval_samples_per_second": 77.351,
40
- "eval_steps_per_second": 19.338,
41
  "step": 12
42
  },
43
  {
44
  "epoch": 4.0,
45
- "eval_accuracy": 0.875,
46
- "eval_loss": 0.3915722072124481,
47
- "eval_runtime": 0.1349,
48
- "eval_samples_per_second": 118.579,
49
- "eval_steps_per_second": 29.645,
50
  "step": 16
51
  },
52
  {
53
  "epoch": 5.0,
54
- "learning_rate": 2.777777777777778e-05,
55
- "loss": 0.4586,
56
  "step": 20
57
  },
58
  {
59
  "epoch": 5.0,
60
- "eval_accuracy": 0.875,
61
- "eval_loss": 0.3885435461997986,
62
- "eval_runtime": 0.1295,
63
- "eval_samples_per_second": 123.544,
64
- "eval_steps_per_second": 30.886,
65
  "step": 20
66
  },
67
  {
68
  "epoch": 6.0,
69
- "eval_accuracy": 0.875,
70
- "eval_loss": 0.38064631819725037,
71
- "eval_runtime": 0.1351,
72
- "eval_samples_per_second": 118.447,
73
- "eval_steps_per_second": 29.612,
74
  "step": 24
75
  },
76
  {
77
  "epoch": 7.0,
78
- "eval_accuracy": 0.875,
79
- "eval_loss": 0.3729676604270935,
80
- "eval_runtime": 0.1372,
81
- "eval_samples_per_second": 116.595,
82
- "eval_steps_per_second": 29.149,
83
  "step": 28
84
  },
85
  {
86
  "epoch": 7.5,
87
- "learning_rate": 1.388888888888889e-05,
88
- "loss": 0.3969,
89
  "step": 30
90
  },
91
  {
92
  "epoch": 8.0,
93
- "eval_accuracy": 0.875,
94
- "eval_loss": 0.3685373067855835,
95
- "eval_runtime": 0.1332,
96
- "eval_samples_per_second": 120.143,
97
- "eval_steps_per_second": 30.036,
98
  "step": 32
99
  },
100
  {
101
  "epoch": 9.0,
102
- "eval_accuracy": 0.875,
103
- "eval_loss": 0.3655328154563904,
104
- "eval_runtime": 0.169,
105
- "eval_samples_per_second": 94.697,
106
- "eval_steps_per_second": 23.674,
107
  "step": 36
108
  },
109
  {
110
  "epoch": 10.0,
111
  "learning_rate": 0.0,
112
- "loss": 0.4335,
113
  "step": 40
114
  },
115
  {
116
  "epoch": 10.0,
117
- "eval_accuracy": 0.875,
118
- "eval_loss": 0.36532726883888245,
119
- "eval_runtime": 0.1343,
120
- "eval_samples_per_second": 119.146,
121
- "eval_steps_per_second": 29.786,
122
  "step": 40
123
  },
124
  {
125
  "epoch": 10.0,
126
  "step": 40,
127
  "total_flos": 1.583041221586944e+16,
128
- "train_loss": 0.4837726652622223,
129
- "train_runtime": 41.4007,
130
- "train_samples_per_second": 15.217,
131
- "train_steps_per_second": 0.966
132
  }
133
  ],
134
  "max_steps": 40,
 
1
  {
2
+ "best_metric": 0.625,
3
+ "best_model_checkpoint": "convnext-tiny-224-drfx-surgery-classifier/checkpoint-16",
4
  "epoch": 10.0,
5
  "global_step": 40,
6
  "is_hyper_param_search": false,
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.5625,
13
+ "eval_loss": 0.6742807626724243,
14
+ "eval_runtime": 0.1742,
15
+ "eval_samples_per_second": 91.859,
16
+ "eval_steps_per_second": 22.965,
17
  "step": 4
18
  },
19
  {
20
  "epoch": 2.0,
21
+ "eval_accuracy": 0.5625,
22
+ "eval_loss": 0.6683036088943481,
23
+ "eval_runtime": 0.2648,
24
+ "eval_samples_per_second": 60.432,
25
+ "eval_steps_per_second": 15.108,
26
  "step": 8
27
  },
28
  {
29
  "epoch": 2.5,
30
+ "learning_rate": 8.333333333333333e-07,
31
+ "loss": 0.649,
32
  "step": 10
33
  },
34
  {
35
  "epoch": 3.0,
36
+ "eval_accuracy": 0.5625,
37
+ "eval_loss": 0.6634215116500854,
38
+ "eval_runtime": 0.1434,
39
+ "eval_samples_per_second": 111.587,
40
+ "eval_steps_per_second": 27.897,
41
  "step": 12
42
  },
43
  {
44
  "epoch": 4.0,
45
+ "eval_accuracy": 0.625,
46
+ "eval_loss": 0.6593766808509827,
47
+ "eval_runtime": 0.1368,
48
+ "eval_samples_per_second": 116.941,
49
+ "eval_steps_per_second": 29.235,
50
  "step": 16
51
  },
52
  {
53
  "epoch": 5.0,
54
+ "learning_rate": 5.555555555555555e-07,
55
+ "loss": 0.6178,
56
  "step": 20
57
  },
58
  {
59
  "epoch": 5.0,
60
+ "eval_accuracy": 0.625,
61
+ "eval_loss": 0.656198263168335,
62
+ "eval_runtime": 0.2701,
63
+ "eval_samples_per_second": 59.234,
64
+ "eval_steps_per_second": 14.808,
65
  "step": 20
66
  },
67
  {
68
  "epoch": 6.0,
69
+ "eval_accuracy": 0.625,
70
+ "eval_loss": 0.6535187363624573,
71
+ "eval_runtime": 0.1357,
72
+ "eval_samples_per_second": 117.874,
73
+ "eval_steps_per_second": 29.468,
74
  "step": 24
75
  },
76
  {
77
  "epoch": 7.0,
78
+ "eval_accuracy": 0.5625,
79
+ "eval_loss": 0.6514049768447876,
80
+ "eval_runtime": 0.1802,
81
+ "eval_samples_per_second": 88.8,
82
+ "eval_steps_per_second": 22.2,
83
  "step": 28
84
  },
85
  {
86
  "epoch": 7.5,
87
+ "learning_rate": 2.7777777777777776e-07,
88
+ "loss": 0.6236,
89
  "step": 30
90
  },
91
  {
92
  "epoch": 8.0,
93
+ "eval_accuracy": 0.5625,
94
+ "eval_loss": 0.649865448474884,
95
+ "eval_runtime": 0.1601,
96
+ "eval_samples_per_second": 99.945,
97
+ "eval_steps_per_second": 24.986,
98
  "step": 32
99
  },
100
  {
101
  "epoch": 9.0,
102
+ "eval_accuracy": 0.5625,
103
+ "eval_loss": 0.648896336555481,
104
+ "eval_runtime": 0.2183,
105
+ "eval_samples_per_second": 73.288,
106
+ "eval_steps_per_second": 18.322,
107
  "step": 36
108
  },
109
  {
110
  "epoch": 10.0,
111
  "learning_rate": 0.0,
112
+ "loss": 0.621,
113
  "step": 40
114
  },
115
  {
116
  "epoch": 10.0,
117
+ "eval_accuracy": 0.5625,
118
+ "eval_loss": 0.6485264897346497,
119
+ "eval_runtime": 0.1395,
120
+ "eval_samples_per_second": 114.686,
121
+ "eval_steps_per_second": 28.672,
122
  "step": 40
123
  },
124
  {
125
  "epoch": 10.0,
126
  "step": 40,
127
  "total_flos": 1.583041221586944e+16,
128
+ "train_loss": 0.6278304576873779,
129
+ "train_runtime": 51.4123,
130
+ "train_samples_per_second": 12.254,
131
+ "train_steps_per_second": 0.778
132
  }
133
  ],
134
  "max_steps": 40,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95a73c2826fec298fed7b5f439180d56cf54d9ed76f341d9b98001a39889bed6
3
  size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af67709ce9988745a26b4af07d220b26aed77bc68e74c8007253fca9ee38f462
3
  size 3643