omar22allam committed on
Commit
48d1988
1 Parent(s): 852474e

Training Completed!

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.9176470588235294
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.3352
36
- - Accuracy: 0.9176
37
 
38
  ## Model description
39
 
@@ -58,10 +58,13 @@ The following hyperparameters were used during training:
58
  - seed: 42
59
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
60
  - lr_scheduler_type: linear
61
- - num_epochs: 5
62
 
63
  ### Training results
64
 
 
 
 
65
 
66
 
67
  ### Framework versions
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.8941176470588236
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.4515
36
+ - Accuracy: 0.8941
37
 
38
  ## Model description
39
 
 
58
  - seed: 42
59
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
60
  - lr_scheduler_type: linear
61
+ - num_epochs: 10
62
 
63
  ### Training results
64
 
65
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
66
+ |:-------------:|:------:|:----:|:---------------:|:--------:|
67
+ | 0.0236 | 5.5556 | 100 | 0.4515 | 0.8941 |
68
 
69
 
70
  ### Framework versions
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.9176470588235294,
4
- "eval_loss": 0.33524250984191895,
5
- "eval_runtime": 2.2283,
6
- "eval_samples_per_second": 38.145,
7
- "eval_steps_per_second": 4.936,
8
- "total_flos": 1.104270749148672e+17,
9
- "train_loss": 0.3459944127334489,
10
- "train_runtime": 65.8041,
11
- "train_samples_per_second": 21.655,
12
- "train_steps_per_second": 1.368
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.8941176470588236,
4
+ "eval_loss": 0.4515226483345032,
5
+ "eval_runtime": 1.8149,
6
+ "eval_samples_per_second": 46.836,
7
+ "eval_steps_per_second": 6.061,
8
+ "total_flos": 2.208541498297344e+17,
9
+ "train_loss": 0.17066083699982199,
10
+ "train_runtime": 133.3595,
11
+ "train_samples_per_second": 21.371,
12
+ "train_steps_per_second": 1.35
13
  }
config.json CHANGED
@@ -9,17 +9,17 @@
9
  "hidden_dropout_prob": 0.0,
10
  "hidden_size": 768,
11
  "id2label": {
12
- "0": "normal",
13
- "1": "Cancer",
14
- "2": "Benign"
15
  },
16
  "image_size": 224,
17
  "initializer_range": 0.02,
18
  "intermediate_size": 3072,
19
  "label2id": {
20
- "Benign": 2,
21
- "Cancer": 1,
22
- "normal": 0
23
  },
24
  "layer_norm_eps": 1e-12,
25
  "model_type": "vit",
 
9
  "hidden_dropout_prob": 0.0,
10
  "hidden_size": 768,
11
  "id2label": {
12
+ "0": "bengin",
13
+ "1": "cancer",
14
+ "2": "normal"
15
  },
16
  "image_size": 224,
17
  "initializer_range": 0.02,
18
  "intermediate_size": 3072,
19
  "label2id": {
20
+ "bengin": 0,
21
+ "cancer": 1,
22
+ "normal": 2
23
  },
24
  "layer_norm_eps": 1e-12,
25
  "model_type": "vit",
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.9176470588235294,
4
- "eval_loss": 0.33524250984191895,
5
- "eval_runtime": 2.2283,
6
- "eval_samples_per_second": 38.145,
7
- "eval_steps_per_second": 4.936
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_accuracy": 0.8941176470588236,
4
+ "eval_loss": 0.4515226483345032,
5
+ "eval_runtime": 1.8149,
6
+ "eval_samples_per_second": 46.836,
7
+ "eval_steps_per_second": 6.061
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7763f5afe02e29f88388f4d07a5b5b5bd4cd5110f49ff485033ddd04a27b9c18
3
  size 343227052
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abb8cd2dafb6e3adda18265ed82f7d65d75ead47ddecbc89d2abdbbb4e78d1fb
3
  size 343227052
runs/May10_19-31-52_b9d6e8b22a3b/events.out.tfevents.1715369517.b9d6e8b22a3b.3702.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba02c8a3d3c8f9cc1584242152a43062f5fe2cdb0332340c5c69c438fcc7df46
3
+ size 7833
runs/May10_19-31-52_b9d6e8b22a3b/events.out.tfevents.1715369631.b9d6e8b22a3b.3702.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47039229f259fd0b954f3be9b198b8af011516e2c45b2cc31486d865b489aaf6
3
+ size 405
runs/May10_19-34-04_b9d6e8b22a3b/events.out.tfevents.1715369648.b9d6e8b22a3b.3702.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09146dcb9bed8c9e93652e304fe9b1c01660b8954ef25753575a7afba0a64194
3
+ size 13627
runs/May10_19-34-04_b9d6e8b22a3b/events.out.tfevents.1715369921.b9d6e8b22a3b.3702.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d53451e5f353d6f08925bd8ddb6bccf77b42434c1126089e2b1c1f3bf63697d1
3
+ size 411
runs/May10_19-53-24_b9d6e8b22a3b/events.out.tfevents.1715370809.b9d6e8b22a3b.3702.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23a013409bff29a7946cf28334961aec0027213ae8ed1c081d83a67b9e18e03a
3
+ size 9106
runs/May10_19-53-24_b9d6e8b22a3b/events.out.tfevents.1715371068.b9d6e8b22a3b.3702.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:374ed9c830b4fcc1f41e08d757239be6c80426e2dbb10edcbca07628498dd4bf
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 5.0,
3
- "total_flos": 1.104270749148672e+17,
4
- "train_loss": 0.3459944127334489,
5
- "train_runtime": 65.8041,
6
- "train_samples_per_second": 21.655,
7
- "train_steps_per_second": 1.368
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 2.208541498297344e+17,
4
+ "train_loss": 0.17066083699982199,
5
+ "train_runtime": 133.3595,
6
+ "train_samples_per_second": 21.371,
7
+ "train_steps_per_second": 1.35
8
  }
trainer_state.json CHANGED
@@ -1,92 +1,164 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 5.0,
5
  "eval_steps": 100,
6
- "global_step": 90,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.5555555555555556,
13
- "grad_norm": 10.430541038513184,
14
- "learning_rate": 0.00017777777777777779,
15
- "loss": 1.1321,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 1.1111111111111112,
20
- "grad_norm": 3.6575100421905518,
21
- "learning_rate": 0.00015555555555555556,
22
- "loss": 0.6351,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 1.6666666666666665,
27
- "grad_norm": 4.778464317321777,
28
- "learning_rate": 0.00013333333333333334,
29
- "loss": 0.4087,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 2.2222222222222223,
34
- "grad_norm": 7.901824951171875,
35
- "learning_rate": 0.00011111111111111112,
36
- "loss": 0.3833,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 2.7777777777777777,
41
- "grad_norm": 1.8277825117111206,
42
- "learning_rate": 8.888888888888889e-05,
43
- "loss": 0.2095,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 3.3333333333333335,
48
- "grad_norm": 6.244271755218506,
49
- "learning_rate": 6.666666666666667e-05,
50
- "loss": 0.2673,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 3.888888888888889,
55
- "grad_norm": 3.88458251953125,
56
- "learning_rate": 4.4444444444444447e-05,
57
- "loss": 0.0374,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 4.444444444444445,
62
- "grad_norm": 0.08572948724031448,
63
- "learning_rate": 2.2222222222222223e-05,
64
- "loss": 0.0341,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 5.0,
69
- "grad_norm": 0.26313289999961853,
70
- "learning_rate": 0.0,
71
- "loss": 0.0065,
72
  "step": 90
73
  },
74
  {
75
- "epoch": 5.0,
76
- "step": 90,
77
- "total_flos": 1.104270749148672e+17,
78
- "train_loss": 0.3459944127334489,
79
- "train_runtime": 65.8041,
80
- "train_samples_per_second": 21.655,
81
- "train_steps_per_second": 1.368
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
82
  }
83
  ],
84
  "logging_steps": 10,
85
- "max_steps": 90,
86
  "num_input_tokens_seen": 0,
87
- "num_train_epochs": 5,
88
  "save_steps": 100,
89
- "total_flos": 1.104270749148672e+17,
90
  "train_batch_size": 16,
91
  "trial_name": null,
92
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.4515226483345032,
3
+ "best_model_checkpoint": "./MRI_vit/checkpoint-100",
4
+ "epoch": 10.0,
5
  "eval_steps": 100,
6
+ "global_step": 180,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.5555555555555556,
13
+ "grad_norm": 7.522036552429199,
14
+ "learning_rate": 0.00018888888888888888,
15
+ "loss": 0.974,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 1.1111111111111112,
20
+ "grad_norm": 2.3464157581329346,
21
+ "learning_rate": 0.00017777777777777779,
22
+ "loss": 0.6625,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 1.6666666666666665,
27
+ "grad_norm": 9.9130220413208,
28
+ "learning_rate": 0.0001666666666666667,
29
+ "loss": 0.4228,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 2.2222222222222223,
34
+ "grad_norm": 9.101266860961914,
35
+ "learning_rate": 0.00015555555555555556,
36
+ "loss": 0.4918,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 2.7777777777777777,
41
+ "grad_norm": 7.912335395812988,
42
+ "learning_rate": 0.00014444444444444444,
43
+ "loss": 0.1294,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 3.3333333333333335,
48
+ "grad_norm": 1.002270221710205,
49
+ "learning_rate": 0.00013333333333333334,
50
+ "loss": 0.1837,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 3.888888888888889,
55
+ "grad_norm": 0.04989054054021835,
56
+ "learning_rate": 0.00012222222222222224,
57
+ "loss": 0.0559,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 4.444444444444445,
62
+ "grad_norm": 7.236814498901367,
63
+ "learning_rate": 0.00011111111111111112,
64
+ "loss": 0.0396,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 5.0,
69
+ "grad_norm": 5.21504545211792,
70
+ "learning_rate": 0.0001,
71
+ "loss": 0.0791,
72
  "step": 90
73
  },
74
  {
75
+ "epoch": 5.555555555555555,
76
+ "grad_norm": 0.02051878347992897,
77
+ "learning_rate": 8.888888888888889e-05,
78
+ "loss": 0.0236,
79
+ "step": 100
80
+ },
81
+ {
82
+ "epoch": 5.555555555555555,
83
+ "eval_accuracy": 0.8941176470588236,
84
+ "eval_loss": 0.4515226483345032,
85
+ "eval_runtime": 1.7177,
86
+ "eval_samples_per_second": 49.485,
87
+ "eval_steps_per_second": 6.404,
88
+ "step": 100
89
+ },
90
+ {
91
+ "epoch": 6.111111111111111,
92
+ "grad_norm": 0.013602614402770996,
93
+ "learning_rate": 7.777777777777778e-05,
94
+ "loss": 0.0038,
95
+ "step": 110
96
+ },
97
+ {
98
+ "epoch": 6.666666666666667,
99
+ "grad_norm": 0.006600651424378157,
100
+ "learning_rate": 6.666666666666667e-05,
101
+ "loss": 0.0013,
102
+ "step": 120
103
+ },
104
+ {
105
+ "epoch": 7.222222222222222,
106
+ "grad_norm": 0.004217671230435371,
107
+ "learning_rate": 5.555555555555556e-05,
108
+ "loss": 0.001,
109
+ "step": 130
110
+ },
111
+ {
112
+ "epoch": 7.777777777777778,
113
+ "grad_norm": 0.009464713744819164,
114
+ "learning_rate": 4.4444444444444447e-05,
115
+ "loss": 0.0019,
116
+ "step": 140
117
+ },
118
+ {
119
+ "epoch": 8.333333333333334,
120
+ "grad_norm": 0.008202188648283482,
121
+ "learning_rate": 3.3333333333333335e-05,
122
+ "loss": 0.0003,
123
+ "step": 150
124
+ },
125
+ {
126
+ "epoch": 8.88888888888889,
127
+ "grad_norm": 0.019373826682567596,
128
+ "learning_rate": 2.2222222222222223e-05,
129
+ "loss": 0.0004,
130
+ "step": 160
131
+ },
132
+ {
133
+ "epoch": 9.444444444444445,
134
+ "grad_norm": 0.004279292654246092,
135
+ "learning_rate": 1.1111111111111112e-05,
136
+ "loss": 0.0004,
137
+ "step": 170
138
+ },
139
+ {
140
+ "epoch": 10.0,
141
+ "grad_norm": 0.004037588369101286,
142
+ "learning_rate": 0.0,
143
+ "loss": 0.0004,
144
+ "step": 180
145
+ },
146
+ {
147
+ "epoch": 10.0,
148
+ "step": 180,
149
+ "total_flos": 2.208541498297344e+17,
150
+ "train_loss": 0.17066083699982199,
151
+ "train_runtime": 133.3595,
152
+ "train_samples_per_second": 21.371,
153
+ "train_steps_per_second": 1.35
154
  }
155
  ],
156
  "logging_steps": 10,
157
+ "max_steps": 180,
158
  "num_input_tokens_seen": 0,
159
+ "num_train_epochs": 10,
160
  "save_steps": 100,
161
+ "total_flos": 2.208541498297344e+17,
162
  "train_batch_size": 16,
163
  "trial_name": null,
164
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38d2c494673091293489e3472ca6d10994f0227f778a0da413f2755d2ceb0f2e
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b987baef7b866740d84e200bd5fa07044adfb2ec3c219e723726032bd8426f73
3
  size 4984