Augusto777 committed on
Commit
a3f4952
1 Parent(s): 87b97af

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.7166666666666667
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.8134
36
- - Accuracy: 0.7167
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.7333333333333333
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.8095
36
+ - Accuracy: 0.7333
37
 
38
  ## Model description
39
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_accuracy": 0.5833333333333334,
4
- "eval_loss": 1.2348047494888306,
5
- "eval_runtime": 1.3572,
6
- "eval_samples_per_second": 44.207,
7
- "eval_steps_per_second": 1.474,
8
- "train_loss": 1.2905001163482666,
9
- "train_runtime": 87.3836,
10
- "train_samples_per_second": 27.465,
11
- "train_steps_per_second": 0.229
12
  }
 
1
  {
2
+ "epoch": 9.23,
3
+ "eval_accuracy": 0.7333333333333333,
4
+ "eval_loss": 0.809493362903595,
5
+ "eval_runtime": 1.3092,
6
+ "eval_samples_per_second": 45.831,
7
+ "eval_steps_per_second": 1.528,
8
+ "train_loss": 0.9177195443047418,
9
+ "train_runtime": 195.1818,
10
+ "train_samples_per_second": 62.762,
11
+ "train_steps_per_second": 0.461
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_accuracy": 0.5833333333333334,
4
- "eval_loss": 1.2348047494888306,
5
- "eval_runtime": 1.3572,
6
- "eval_samples_per_second": 44.207,
7
- "eval_steps_per_second": 1.474
8
  }
 
1
  {
2
+ "epoch": 9.23,
3
+ "eval_accuracy": 0.7333333333333333,
4
+ "eval_loss": 0.809493362903595,
5
+ "eval_runtime": 1.3092,
6
+ "eval_samples_per_second": 45.831,
7
+ "eval_steps_per_second": 1.528
8
  }
runs/May24_07-57-29_DESKTOP-SKBE9FB/events.out.tfevents.1716559321.DESKTOP-SKBE9FB.10960.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f2af94f1dcafcc46d3cbf3e8dba445c2d7248858c3a96155c7bf846ad6b11d8
3
+ size 405
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 10.0,
3
- "train_loss": 1.2905001163482666,
4
- "train_runtime": 87.3836,
5
- "train_samples_per_second": 27.465,
6
- "train_steps_per_second": 0.229
7
  }
 
1
  {
2
+ "epoch": 9.23,
3
+ "train_loss": 0.9177195443047418,
4
+ "train_runtime": 195.1818,
5
+ "train_samples_per_second": 62.762,
6
+ "train_steps_per_second": 0.461
7
  }
trainer_state.json CHANGED
@@ -1,131 +1,173 @@
1
  {
2
- "best_metric": 0.5833333333333334,
3
- "best_model_checkpoint": "vit-base-patch16-224-RU5-10\\checkpoint-16",
4
- "epoch": 10.0,
5
  "eval_steps": 500,
6
- "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.0,
13
- "eval_accuracy": 0.48333333333333334,
14
- "eval_loss": 1.371477723121643,
15
- "eval_runtime": 1.144,
16
- "eval_samples_per_second": 52.447,
17
- "eval_steps_per_second": 1.748,
18
- "step": 2
19
  },
20
  {
21
- "epoch": 2.0,
22
- "eval_accuracy": 0.4666666666666667,
23
- "eval_loss": 1.3415111303329468,
24
- "eval_runtime": 1.0274,
25
- "eval_samples_per_second": 58.399,
26
- "eval_steps_per_second": 1.947,
27
- "step": 4
28
  },
29
  {
30
- "epoch": 3.0,
31
- "eval_accuracy": 0.4666666666666667,
32
- "eval_loss": 1.31484854221344,
33
- "eval_runtime": 1.0106,
34
- "eval_samples_per_second": 59.368,
35
- "eval_steps_per_second": 1.979,
36
- "step": 6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  },
38
  {
39
  "epoch": 4.0,
40
- "eval_accuracy": 0.48333333333333334,
41
- "eval_loss": 1.2919448614120483,
42
- "eval_runtime": 1.0367,
43
- "eval_samples_per_second": 57.876,
44
- "eval_steps_per_second": 1.929,
45
- "step": 8
46
  },
47
  {
48
- "epoch": 5.0,
49
- "learning_rate": 2.894736842105263e-05,
50
- "loss": 1.3369,
51
- "step": 10
52
  },
53
  {
54
- "epoch": 5.0,
55
- "eval_accuracy": 0.48333333333333334,
56
- "eval_loss": 1.272611141204834,
57
- "eval_runtime": 0.996,
58
- "eval_samples_per_second": 60.243,
59
- "eval_steps_per_second": 2.008,
60
- "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
61
  },
62
  {
63
- "epoch": 6.0,
64
- "eval_accuracy": 0.5,
65
- "eval_loss": 1.2568950653076172,
66
- "eval_runtime": 1.0111,
67
- "eval_samples_per_second": 59.34,
68
- "eval_steps_per_second": 1.978,
69
- "step": 12
70
  },
71
  {
72
- "epoch": 7.0,
73
- "eval_accuracy": 0.55,
74
- "eval_loss": 1.24420964717865,
75
- "eval_runtime": 1.0116,
76
- "eval_samples_per_second": 59.311,
77
- "eval_steps_per_second": 1.977,
78
- "step": 14
79
  },
80
  {
81
  "epoch": 8.0,
82
- "eval_accuracy": 0.5833333333333334,
83
- "eval_loss": 1.2348047494888306,
84
- "eval_runtime": 1.0128,
85
- "eval_samples_per_second": 59.24,
86
- "eval_steps_per_second": 1.975,
87
- "step": 16
88
  },
89
  {
90
- "epoch": 9.0,
91
- "eval_accuracy": 0.5833333333333334,
92
- "eval_loss": 1.2286779880523682,
93
- "eval_runtime": 1.0097,
94
- "eval_samples_per_second": 59.423,
95
- "eval_steps_per_second": 1.981,
96
- "step": 18
 
 
 
 
 
 
97
  },
98
  {
99
- "epoch": 10.0,
100
  "learning_rate": 0.0,
101
- "loss": 1.2441,
102
- "step": 20
103
  },
104
  {
105
- "epoch": 10.0,
106
- "eval_accuracy": 0.5666666666666667,
107
- "eval_loss": 1.2260597944259644,
108
- "eval_runtime": 1.032,
109
- "eval_samples_per_second": 58.141,
110
- "eval_steps_per_second": 1.938,
111
- "step": 20
112
  },
113
  {
114
- "epoch": 10.0,
115
- "step": 20,
116
- "total_flos": 1.859841088487424e+17,
117
- "train_loss": 1.2905001163482666,
118
- "train_runtime": 87.3836,
119
- "train_samples_per_second": 27.465,
120
- "train_steps_per_second": 0.229
121
  }
122
  ],
123
  "logging_steps": 10,
124
- "max_steps": 20,
125
  "num_input_tokens_seen": 0,
126
  "num_train_epochs": 10,
127
  "save_steps": 500,
128
- "total_flos": 1.859841088487424e+17,
129
  "train_batch_size": 32,
130
  "trial_name": null,
131
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.7333333333333333,
3
+ "best_model_checkpoint": "vit-base-patch16-224-RU5-10\\checkpoint-87",
4
+ "epoch": 9.23076923076923,
5
  "eval_steps": 500,
6
+ "global_step": 90,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.92,
13
+ "eval_accuracy": 0.4666666666666667,
14
+ "eval_loss": 1.293900728225708,
15
+ "eval_runtime": 1.019,
16
+ "eval_samples_per_second": 58.879,
17
+ "eval_steps_per_second": 1.963,
18
+ "step": 9
19
  },
20
  {
21
+ "epoch": 1.03,
22
+ "learning_rate": 5.1764705882352943e-05,
23
+ "loss": 1.3501,
24
+ "step": 10
 
 
 
25
  },
26
  {
27
+ "epoch": 1.95,
28
+ "eval_accuracy": 0.5833333333333334,
29
+ "eval_loss": 1.170591115951538,
30
+ "eval_runtime": 1.0727,
31
+ "eval_samples_per_second": 55.933,
32
+ "eval_steps_per_second": 1.864,
33
+ "step": 19
34
+ },
35
+ {
36
+ "epoch": 2.05,
37
+ "learning_rate": 4.5294117647058826e-05,
38
+ "loss": 1.2272,
39
+ "step": 20
40
+ },
41
+ {
42
+ "epoch": 2.97,
43
+ "eval_accuracy": 0.6333333333333333,
44
+ "eval_loss": 1.0594052076339722,
45
+ "eval_runtime": 1.0633,
46
+ "eval_samples_per_second": 56.426,
47
+ "eval_steps_per_second": 1.881,
48
+ "step": 29
49
+ },
50
+ {
51
+ "epoch": 3.08,
52
+ "learning_rate": 3.882352941176471e-05,
53
+ "loss": 1.0941,
54
+ "step": 30
55
  },
56
  {
57
  "epoch": 4.0,
58
+ "eval_accuracy": 0.6,
59
+ "eval_loss": 0.9773460030555725,
60
+ "eval_runtime": 1.0306,
61
+ "eval_samples_per_second": 58.221,
62
+ "eval_steps_per_second": 1.941,
63
+ "step": 39
64
  },
65
  {
66
+ "epoch": 4.1,
67
+ "learning_rate": 3.235294117647059e-05,
68
+ "loss": 0.979,
69
+ "step": 40
70
  },
71
  {
72
+ "epoch": 4.92,
73
+ "eval_accuracy": 0.6833333333333333,
74
+ "eval_loss": 0.9141623377799988,
75
+ "eval_runtime": 1.0244,
76
+ "eval_samples_per_second": 58.572,
77
+ "eval_steps_per_second": 1.952,
78
+ "step": 48
79
+ },
80
+ {
81
+ "epoch": 5.13,
82
+ "learning_rate": 2.5882352941176472e-05,
83
+ "loss": 0.8694,
84
+ "step": 50
85
+ },
86
+ {
87
+ "epoch": 5.95,
88
+ "eval_accuracy": 0.7,
89
+ "eval_loss": 0.8568627238273621,
90
+ "eval_runtime": 1.0443,
91
+ "eval_samples_per_second": 57.453,
92
+ "eval_steps_per_second": 1.915,
93
+ "step": 58
94
+ },
95
+ {
96
+ "epoch": 6.15,
97
+ "learning_rate": 1.9411764705882355e-05,
98
+ "loss": 0.7662,
99
+ "step": 60
100
  },
101
  {
102
+ "epoch": 6.97,
103
+ "eval_accuracy": 0.6833333333333333,
104
+ "eval_loss": 0.8363937139511108,
105
+ "eval_runtime": 1.067,
106
+ "eval_samples_per_second": 56.233,
107
+ "eval_steps_per_second": 1.874,
108
+ "step": 68
109
  },
110
  {
111
+ "epoch": 7.18,
112
+ "learning_rate": 1.2941176470588236e-05,
113
+ "loss": 0.7002,
114
+ "step": 70
 
 
 
115
  },
116
  {
117
  "epoch": 8.0,
118
+ "eval_accuracy": 0.7,
119
+ "eval_loss": 0.8071037530899048,
120
+ "eval_runtime": 1.0561,
121
+ "eval_samples_per_second": 56.814,
122
+ "eval_steps_per_second": 1.894,
123
+ "step": 78
124
  },
125
  {
126
+ "epoch": 8.21,
127
+ "learning_rate": 6.470588235294118e-06,
128
+ "loss": 0.6443,
129
+ "step": 80
130
+ },
131
+ {
132
+ "epoch": 8.92,
133
+ "eval_accuracy": 0.7333333333333333,
134
+ "eval_loss": 0.809493362903595,
135
+ "eval_runtime": 1.0229,
136
+ "eval_samples_per_second": 58.655,
137
+ "eval_steps_per_second": 1.955,
138
+ "step": 87
139
  },
140
  {
141
+ "epoch": 9.23,
142
  "learning_rate": 0.0,
143
+ "loss": 0.629,
144
+ "step": 90
145
  },
146
  {
147
+ "epoch": 9.23,
148
+ "eval_accuracy": 0.7166666666666667,
149
+ "eval_loss": 0.8133583664894104,
150
+ "eval_runtime": 1.0093,
151
+ "eval_samples_per_second": 59.45,
152
+ "eval_steps_per_second": 1.982,
153
+ "step": 90
154
  },
155
  {
156
+ "epoch": 9.23,
157
+ "step": 90,
158
+ "total_flos": 8.766825930857595e+17,
159
+ "train_loss": 0.9177195443047418,
160
+ "train_runtime": 195.1818,
161
+ "train_samples_per_second": 62.762,
162
+ "train_steps_per_second": 0.461
163
  }
164
  ],
165
  "logging_steps": 10,
166
+ "max_steps": 90,
167
  "num_input_tokens_seen": 0,
168
  "num_train_epochs": 10,
169
  "save_steps": 500,
170
+ "total_flos": 8.766825930857595e+17,
171
  "train_batch_size": 32,
172
  "trial_name": null,
173
  "trial_params": null