jayanthspratap committed on
Commit
c394681
1 Parent(s): a698090

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.875,
4
- "eval_loss": 0.4960244596004486,
5
- "eval_runtime": 0.186,
6
- "eval_samples_per_second": 86.013,
7
- "eval_steps_per_second": 21.503,
8
  "total_flos": 1.583041221586944e+16,
9
- "train_loss": 0.6278304576873779,
10
- "train_runtime": 51.4123,
11
- "train_samples_per_second": 12.254,
12
- "train_steps_per_second": 0.778
13
  }
 
1
  {
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.875,
4
+ "eval_loss": 0.6159822940826416,
5
+ "eval_runtime": 0.1862,
6
+ "eval_samples_per_second": 85.94,
7
+ "eval_steps_per_second": 21.485,
8
  "total_flos": 1.583041221586944e+16,
9
+ "train_loss": 0.6517677068710327,
10
+ "train_runtime": 52.1182,
11
+ "train_samples_per_second": 12.088,
12
+ "train_steps_per_second": 0.767
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.875,
4
- "eval_loss": 0.4960244596004486,
5
- "eval_runtime": 0.186,
6
- "eval_samples_per_second": 86.013,
7
- "eval_steps_per_second": 21.503
8
  }
 
1
  {
2
  "epoch": 10.0,
3
  "eval_accuracy": 0.875,
4
+ "eval_loss": 0.6159822940826416,
5
+ "eval_runtime": 0.1862,
6
+ "eval_samples_per_second": 85.94,
7
+ "eval_steps_per_second": 21.485
8
  }
runs/May27_21-05-28_0922109e5cf6/events.out.tfevents.1685221613.0922109e5cf6.8213.26 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7e0f98f4622ab933de81d619471a51423cd30564f75ef0467ce5c633c2927ac
3
+ size 405
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
  "total_flos": 1.583041221586944e+16,
4
- "train_loss": 0.6278304576873779,
5
- "train_runtime": 51.4123,
6
- "train_samples_per_second": 12.254,
7
- "train_steps_per_second": 0.778
8
  }
 
1
  {
2
  "epoch": 10.0,
3
  "total_flos": 1.583041221586944e+16,
4
+ "train_loss": 0.6517677068710327,
5
+ "train_runtime": 52.1182,
6
+ "train_samples_per_second": 12.088,
7
+ "train_steps_per_second": 0.767
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.625,
3
- "best_model_checkpoint": "convnext-tiny-224-drfx-surgery-classifier/checkpoint-16",
4
  "epoch": 10.0,
5
  "global_step": 40,
6
  "is_hyper_param_search": false,
@@ -9,126 +9,126 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 0.5625,
13
- "eval_loss": 0.6742807626724243,
14
- "eval_runtime": 0.1742,
15
- "eval_samples_per_second": 91.859,
16
- "eval_steps_per_second": 22.965,
17
  "step": 4
18
  },
19
  {
20
  "epoch": 2.0,
21
- "eval_accuracy": 0.5625,
22
- "eval_loss": 0.6683036088943481,
23
- "eval_runtime": 0.2648,
24
- "eval_samples_per_second": 60.432,
25
- "eval_steps_per_second": 15.108,
26
  "step": 8
27
  },
28
  {
29
  "epoch": 2.5,
30
- "learning_rate": 8.333333333333333e-07,
31
- "loss": 0.649,
32
  "step": 10
33
  },
34
  {
35
  "epoch": 3.0,
36
- "eval_accuracy": 0.5625,
37
- "eval_loss": 0.6634215116500854,
38
- "eval_runtime": 0.1434,
39
- "eval_samples_per_second": 111.587,
40
- "eval_steps_per_second": 27.897,
41
  "step": 12
42
  },
43
  {
44
  "epoch": 4.0,
45
- "eval_accuracy": 0.625,
46
- "eval_loss": 0.6593766808509827,
47
- "eval_runtime": 0.1368,
48
- "eval_samples_per_second": 116.941,
49
- "eval_steps_per_second": 29.235,
50
  "step": 16
51
  },
52
  {
53
  "epoch": 5.0,
54
- "learning_rate": 5.555555555555555e-07,
55
- "loss": 0.6178,
56
  "step": 20
57
  },
58
  {
59
  "epoch": 5.0,
60
- "eval_accuracy": 0.625,
61
- "eval_loss": 0.656198263168335,
62
- "eval_runtime": 0.2701,
63
- "eval_samples_per_second": 59.234,
64
- "eval_steps_per_second": 14.808,
65
  "step": 20
66
  },
67
  {
68
  "epoch": 6.0,
69
- "eval_accuracy": 0.625,
70
- "eval_loss": 0.6535187363624573,
71
- "eval_runtime": 0.1357,
72
- "eval_samples_per_second": 117.874,
73
- "eval_steps_per_second": 29.468,
74
  "step": 24
75
  },
76
  {
77
  "epoch": 7.0,
78
- "eval_accuracy": 0.5625,
79
- "eval_loss": 0.6514049768447876,
80
- "eval_runtime": 0.1802,
81
- "eval_samples_per_second": 88.8,
82
- "eval_steps_per_second": 22.2,
83
  "step": 28
84
  },
85
  {
86
  "epoch": 7.5,
87
- "learning_rate": 2.7777777777777776e-07,
88
- "loss": 0.6236,
89
  "step": 30
90
  },
91
  {
92
  "epoch": 8.0,
93
- "eval_accuracy": 0.5625,
94
- "eval_loss": 0.649865448474884,
95
- "eval_runtime": 0.1601,
96
- "eval_samples_per_second": 99.945,
97
- "eval_steps_per_second": 24.986,
98
  "step": 32
99
  },
100
  {
101
  "epoch": 9.0,
102
- "eval_accuracy": 0.5625,
103
- "eval_loss": 0.648896336555481,
104
- "eval_runtime": 0.2183,
105
- "eval_samples_per_second": 73.288,
106
- "eval_steps_per_second": 18.322,
107
  "step": 36
108
  },
109
  {
110
  "epoch": 10.0,
111
  "learning_rate": 0.0,
112
- "loss": 0.621,
113
  "step": 40
114
  },
115
  {
116
  "epoch": 10.0,
117
- "eval_accuracy": 0.5625,
118
- "eval_loss": 0.6485264897346497,
119
- "eval_runtime": 0.1395,
120
- "eval_samples_per_second": 114.686,
121
- "eval_steps_per_second": 28.672,
122
  "step": 40
123
  },
124
  {
125
  "epoch": 10.0,
126
  "step": 40,
127
  "total_flos": 1.583041221586944e+16,
128
- "train_loss": 0.6278304576873779,
129
- "train_runtime": 51.4123,
130
- "train_samples_per_second": 12.254,
131
- "train_steps_per_second": 0.778
132
  }
133
  ],
134
  "max_steps": 40,
 
1
  {
2
+ "best_metric": 0.875,
3
+ "best_model_checkpoint": "convnext-tiny-224-drfx-surgery-classifier/checkpoint-28",
4
  "epoch": 10.0,
5
  "global_step": 40,
6
  "is_hyper_param_search": false,
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.375,
13
+ "eval_loss": 0.7140131592750549,
14
+ "eval_runtime": 0.1678,
15
+ "eval_samples_per_second": 95.342,
16
+ "eval_steps_per_second": 23.836,
17
  "step": 4
18
  },
19
  {
20
  "epoch": 2.0,
21
+ "eval_accuracy": 0.5,
22
+ "eval_loss": 0.6876102685928345,
23
+ "eval_runtime": 0.2806,
24
+ "eval_samples_per_second": 57.029,
25
+ "eval_steps_per_second": 14.257,
26
  "step": 8
27
  },
28
  {
29
  "epoch": 2.5,
30
+ "learning_rate": 4.166666666666667e-06,
31
+ "loss": 0.7104,
32
  "step": 10
33
  },
34
  {
35
  "epoch": 3.0,
36
+ "eval_accuracy": 0.625,
37
+ "eval_loss": 0.6665950417518616,
38
+ "eval_runtime": 0.1311,
39
+ "eval_samples_per_second": 122.003,
40
+ "eval_steps_per_second": 30.501,
41
  "step": 12
42
  },
43
  {
44
  "epoch": 4.0,
45
+ "eval_accuracy": 0.6875,
46
+ "eval_loss": 0.6494508981704712,
47
+ "eval_runtime": 0.1354,
48
+ "eval_samples_per_second": 118.202,
49
+ "eval_steps_per_second": 29.55,
50
  "step": 16
51
  },
52
  {
53
  "epoch": 5.0,
54
+ "learning_rate": 2.7777777777777783e-06,
55
+ "loss": 0.6567,
56
  "step": 20
57
  },
58
  {
59
  "epoch": 5.0,
60
+ "eval_accuracy": 0.75,
61
+ "eval_loss": 0.6359503865242004,
62
+ "eval_runtime": 0.1374,
63
+ "eval_samples_per_second": 116.463,
64
+ "eval_steps_per_second": 29.116,
65
  "step": 20
66
  },
67
  {
68
  "epoch": 6.0,
69
+ "eval_accuracy": 0.8125,
70
+ "eval_loss": 0.6247015595436096,
71
+ "eval_runtime": 0.139,
72
+ "eval_samples_per_second": 115.068,
73
+ "eval_steps_per_second": 28.767,
74
  "step": 24
75
  },
76
  {
77
  "epoch": 7.0,
78
+ "eval_accuracy": 0.875,
79
+ "eval_loss": 0.6159822940826416,
80
+ "eval_runtime": 0.1357,
81
+ "eval_samples_per_second": 117.933,
82
+ "eval_steps_per_second": 29.483,
83
  "step": 28
84
  },
85
  {
86
  "epoch": 7.5,
87
+ "learning_rate": 1.3888888888888892e-06,
88
+ "loss": 0.6277,
89
  "step": 30
90
  },
91
  {
92
  "epoch": 8.0,
93
+ "eval_accuracy": 0.875,
94
+ "eval_loss": 0.6097759008407593,
95
+ "eval_runtime": 0.1545,
96
+ "eval_samples_per_second": 103.542,
97
+ "eval_steps_per_second": 25.886,
98
  "step": 32
99
  },
100
  {
101
  "epoch": 9.0,
102
+ "eval_accuracy": 0.875,
103
+ "eval_loss": 0.6058341264724731,
104
+ "eval_runtime": 0.1381,
105
+ "eval_samples_per_second": 115.852,
106
+ "eval_steps_per_second": 28.963,
107
  "step": 36
108
  },
109
  {
110
  "epoch": 10.0,
111
  "learning_rate": 0.0,
112
+ "loss": 0.6122,
113
  "step": 40
114
  },
115
  {
116
  "epoch": 10.0,
117
+ "eval_accuracy": 0.875,
118
+ "eval_loss": 0.6043429374694824,
119
+ "eval_runtime": 0.1712,
120
+ "eval_samples_per_second": 93.452,
121
+ "eval_steps_per_second": 23.363,
122
  "step": 40
123
  },
124
  {
125
  "epoch": 10.0,
126
  "step": 40,
127
  "total_flos": 1.583041221586944e+16,
128
+ "train_loss": 0.6517677068710327,
129
+ "train_runtime": 52.1182,
130
+ "train_samples_per_second": 12.088,
131
+ "train_steps_per_second": 0.767
132
  }
133
  ],
134
  "max_steps": 40,