Metal079 committed on
Commit
6f10643
1 Parent(s): fd1f89d

Upload 4 files

Browse files
Files changed (3) hide show
  1. config.json +1 -1
  2. pytorch_model.bin +1 -1
  3. trainer_state.json +149 -48
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "facebook/convnext-base-384",
3
  "architectures": [
4
  "ConvNextForImageClassification"
5
  ],
 
1
  {
2
+ "_name_or_path": "facebook/convnext-base-384-22k-1k",
3
  "architectures": [
4
  "ConvNextForImageClassification"
5
  ],
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9242be7ffa69645eee2593b9c9fe787512b0801740430c8e0a4c11049c4b3586
3
  size 350446061
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd4d6897c65fc76cc210003c9552b14442dd4d5786bab4e5b323c52bafa2e877
3
  size 350446061
trainer_state.json CHANGED
@@ -1,76 +1,177 @@
1
  {
2
- "best_metric": 0.13731054961681366,
3
- "best_model_checkpoint": "./SonicCharacterClassifier\\checkpoint-158",
4
- "epoch": 2.0,
5
- "global_step": 158,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.25,
12
- "learning_rate": 0.0001949367088607595,
13
- "loss": 0.3933,
14
- "step": 20
15
  },
16
  {
17
- "epoch": 0.51,
18
- "learning_rate": 0.00018987341772151899,
19
- "loss": 0.3066,
20
- "step": 40
21
  },
22
  {
23
- "epoch": 0.76,
24
- "learning_rate": 0.0001848101265822785,
25
- "loss": 0.2891,
26
- "step": 60
 
 
 
 
 
27
  },
28
  {
29
- "epoch": 1.0,
30
- "eval_accuracy": 0.5269461077844312,
31
- "eval_loss": 0.24304752051830292,
32
- "eval_runtime": 34.0361,
33
- "eval_samples_per_second": 9.813,
34
- "eval_steps_per_second": 1.234,
35
- "step": 79
36
  },
37
  {
38
- "epoch": 1.01,
39
- "learning_rate": 0.000179746835443038,
40
- "loss": 0.2675,
41
- "step": 80
42
  },
43
  {
44
- "epoch": 1.27,
45
- "learning_rate": 0.00017468354430379748,
46
- "loss": 0.2181,
47
- "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
48
  },
49
  {
50
- "epoch": 1.52,
51
- "learning_rate": 0.00016962025316455696,
52
- "loss": 0.183,
53
- "step": 120
54
  },
55
  {
56
- "epoch": 1.77,
57
- "learning_rate": 0.00016455696202531648,
58
- "loss": 0.1681,
59
- "step": 140
60
  },
61
  {
62
- "epoch": 2.0,
63
- "eval_accuracy": 0.7724550898203593,
64
- "eval_loss": 0.13731054961681366,
65
- "eval_runtime": 33.5178,
66
- "eval_samples_per_second": 9.965,
67
- "eval_steps_per_second": 1.253,
68
- "step": 158
 
 
69
  }
70
  ],
71
- "max_steps": 790,
72
  "num_train_epochs": 10,
73
- "total_flos": 1.16230208864256e+18,
74
  "trial_name": null,
75
  "trial_params": null
76
  }
 
1
  {
2
+ "best_metric": 0.09438519924879074,
3
+ "best_model_checkpoint": "./SonicCharacterClassifier\\checkpoint-1400",
4
+ "epoch": 4.093567251461988,
5
+ "global_step": 1400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.29,
12
+ "learning_rate": 4.853801169590643e-05,
13
+ "loss": 0.3188,
14
+ "step": 100
15
  },
16
  {
17
+ "epoch": 0.58,
18
+ "learning_rate": 4.707602339181287e-05,
19
+ "loss": 0.2087,
20
+ "step": 200
21
  },
22
  {
23
+ "epoch": 0.58,
24
+ "eval_accuracy": 0.9407407407407361,
25
+ "eval_loss": 0.16877754032611847,
26
+ "eval_precision": 0.6539702845075653,
27
+ "eval_recall": 0.5742313120602596,
28
+ "eval_runtime": 161.9664,
29
+ "eval_samples_per_second": 8.446,
30
+ "eval_steps_per_second": 1.056,
31
+ "step": 200
32
  },
33
  {
34
+ "epoch": 0.88,
35
+ "learning_rate": 4.56140350877193e-05,
36
+ "loss": 0.1663,
37
+ "step": 300
 
 
 
38
  },
39
  {
40
+ "epoch": 1.17,
41
+ "learning_rate": 4.4152046783625734e-05,
42
+ "loss": 0.1155,
43
+ "step": 400
44
  },
45
  {
46
+ "epoch": 1.17,
47
+ "eval_accuracy": 0.9615009746588669,
48
+ "eval_loss": 0.12015020102262497,
49
+ "eval_precision": 0.8305708768976313,
50
+ "eval_recall": 0.7801112001221648,
51
+ "eval_runtime": 161.8616,
52
+ "eval_samples_per_second": 8.452,
53
+ "eval_steps_per_second": 1.056,
54
+ "step": 400
55
+ },
56
+ {
57
+ "epoch": 1.46,
58
+ "learning_rate": 4.269005847953216e-05,
59
+ "loss": 0.095,
60
+ "step": 500
61
+ },
62
+ {
63
+ "epoch": 1.75,
64
+ "learning_rate": 4.12280701754386e-05,
65
+ "loss": 0.0932,
66
+ "step": 600
67
+ },
68
+ {
69
+ "epoch": 1.75,
70
+ "eval_accuracy": 0.964278752436644,
71
+ "eval_loss": 0.1112869530916214,
72
+ "eval_precision": 0.8358102748453625,
73
+ "eval_recall": 0.7573138768314205,
74
+ "eval_runtime": 160.6953,
75
+ "eval_samples_per_second": 8.513,
76
+ "eval_steps_per_second": 1.064,
77
+ "step": 600
78
+ },
79
+ {
80
+ "epoch": 2.05,
81
+ "learning_rate": 3.976608187134503e-05,
82
+ "loss": 0.087,
83
+ "step": 700
84
+ },
85
+ {
86
+ "epoch": 2.34,
87
+ "learning_rate": 3.8304093567251465e-05,
88
+ "loss": 0.0489,
89
+ "step": 800
90
+ },
91
+ {
92
+ "epoch": 2.34,
93
+ "eval_accuracy": 0.9684697855750467,
94
+ "eval_loss": 0.09839322417974472,
95
+ "eval_precision": 0.877861029889539,
96
+ "eval_recall": 0.8274951210258222,
97
+ "eval_runtime": 160.5107,
98
+ "eval_samples_per_second": 8.523,
99
+ "eval_steps_per_second": 1.065,
100
+ "step": 800
101
+ },
102
+ {
103
+ "epoch": 2.63,
104
+ "learning_rate": 3.6842105263157895e-05,
105
+ "loss": 0.0506,
106
+ "step": 900
107
+ },
108
+ {
109
+ "epoch": 2.92,
110
+ "learning_rate": 3.538011695906433e-05,
111
+ "loss": 0.0503,
112
+ "step": 1000
113
+ },
114
+ {
115
+ "epoch": 2.92,
116
+ "eval_accuracy": 0.9692495126705621,
117
+ "eval_loss": 0.09646110981702805,
118
+ "eval_precision": 0.8755529497305813,
119
+ "eval_recall": 0.8374415545468176,
120
+ "eval_runtime": 161.798,
121
+ "eval_samples_per_second": 8.455,
122
+ "eval_steps_per_second": 1.057,
123
+ "step": 1000
124
+ },
125
+ {
126
+ "epoch": 3.22,
127
+ "learning_rate": 3.391812865497076e-05,
128
+ "loss": 0.0297,
129
+ "step": 1100
130
+ },
131
+ {
132
+ "epoch": 3.51,
133
+ "learning_rate": 3.24561403508772e-05,
134
+ "loss": 0.0245,
135
+ "step": 1200
136
+ },
137
+ {
138
+ "epoch": 3.51,
139
+ "eval_accuracy": 0.9697855750487306,
140
+ "eval_loss": 0.09691683202981949,
141
+ "eval_precision": 0.8796307635671673,
142
+ "eval_recall": 0.8392919296428067,
143
+ "eval_runtime": 163.6772,
144
+ "eval_samples_per_second": 8.358,
145
+ "eval_steps_per_second": 1.045,
146
+ "step": 1200
147
  },
148
  {
149
+ "epoch": 3.8,
150
+ "learning_rate": 3.0994152046783626e-05,
151
+ "loss": 0.026,
152
+ "step": 1300
153
  },
154
  {
155
+ "epoch": 4.09,
156
+ "learning_rate": 2.9532163742690062e-05,
157
+ "loss": 0.0231,
158
+ "step": 1400
159
  },
160
  {
161
+ "epoch": 4.09,
162
+ "eval_accuracy": 0.9713937621832336,
163
+ "eval_loss": 0.09438519924879074,
164
+ "eval_precision": 0.8850769600769599,
165
+ "eval_recall": 0.8511938435184049,
166
+ "eval_runtime": 161.9688,
167
+ "eval_samples_per_second": 8.446,
168
+ "eval_steps_per_second": 1.056,
169
+ "step": 1400
170
  }
171
  ],
172
+ "max_steps": 3420,
173
  "num_train_epochs": 10,
174
+ "total_flos": 5.207113357118669e+18,
175
  "trial_name": null,
176
  "trial_params": null
177
  }