xiaopch commited on
Commit
39002ec
1 Parent(s): 76eae22

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_accuracy": 0.9809264305177112,
4
- "eval_loss": 0.07860878109931946,
5
- "eval_runtime": 5.4221,
6
- "eval_samples_per_second": 67.687,
7
- "eval_steps_per_second": 2.213,
8
- "total_flos": 7.678887715683717e+17,
9
- "train_loss": 0.36344620203360534,
10
- "train_runtime": 415.1296,
11
- "train_samples_per_second": 23.87,
12
- "train_steps_per_second": 0.188
13
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_accuracy": 0.6746987951807228,
4
+ "eval_loss": 1.1532235145568848,
5
+ "eval_runtime": 8.0102,
6
+ "eval_samples_per_second": 62.171,
7
+ "eval_steps_per_second": 1.997,
8
+ "total_flos": 1.0402373155785892e+18,
9
+ "train_loss": 1.5203653063092912,
10
+ "train_runtime": 531.0704,
11
+ "train_samples_per_second": 25.273,
12
+ "train_steps_per_second": 0.198
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_accuracy": 0.9809264305177112,
4
- "eval_loss": 0.07860878109931946,
5
- "eval_runtime": 5.4221,
6
- "eval_samples_per_second": 67.687,
7
- "eval_steps_per_second": 2.213
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_accuracy": 0.6746987951807228,
4
+ "eval_loss": 1.1532235145568848,
5
+ "eval_runtime": 8.0102,
6
+ "eval_samples_per_second": 62.171,
7
+ "eval_steps_per_second": 1.997
8
  }
runs/Nov30_13-49-19_4b23d0e9dade/events.out.tfevents.1701352758.4b23d0e9dade.2219.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b42ca4a5a3cabea59983fea349942f7b779dc374cba6baa20644ea1c5e5ec76
3
+ size 405
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "total_flos": 7.678887715683717e+17,
4
- "train_loss": 0.36344620203360534,
5
- "train_runtime": 415.1296,
6
- "train_samples_per_second": 23.87,
7
- "train_steps_per_second": 0.188
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "total_flos": 1.0402373155785892e+18,
4
+ "train_loss": 1.5203653063092912,
5
+ "train_runtime": 531.0704,
6
+ "train_samples_per_second": 25.273,
7
+ "train_steps_per_second": 0.198
8
  }
trainer_state.json CHANGED
@@ -1,97 +1,115 @@
1
  {
2
- "best_metric": 0.9809264305177112,
3
- "best_model_checkpoint": "vit-base-patch16-224-finetuned/checkpoint-52",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 78,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.38,
13
- "learning_rate": 4.8571428571428576e-05,
14
- "loss": 1.5192,
15
  "step": 10
16
  },
17
  {
18
- "epoch": 0.77,
19
- "learning_rate": 4.1428571428571437e-05,
20
- "loss": 0.5888,
21
  "step": 20
22
  },
23
  {
24
- "epoch": 1.0,
25
- "eval_accuracy": 0.9700272479564033,
26
- "eval_loss": 0.17195835709571838,
27
- "eval_runtime": 5.5957,
28
- "eval_samples_per_second": 65.586,
29
- "eval_steps_per_second": 2.145,
30
- "step": 26
31
  },
32
  {
33
- "epoch": 1.15,
34
- "learning_rate": 3.428571428571429e-05,
35
- "loss": 0.2357,
36
- "step": 30
 
 
 
37
  },
38
  {
39
- "epoch": 1.54,
40
- "learning_rate": 2.714285714285714e-05,
41
- "loss": 0.1499,
42
  "step": 40
43
  },
44
  {
45
- "epoch": 1.92,
46
- "learning_rate": 2e-05,
47
- "loss": 0.1027,
48
  "step": 50
49
  },
50
  {
51
- "epoch": 2.0,
52
- "eval_accuracy": 0.9809264305177112,
53
- "eval_loss": 0.07860878109931946,
54
- "eval_runtime": 5.4987,
55
- "eval_samples_per_second": 66.743,
56
- "eval_steps_per_second": 2.182,
57
- "step": 52
58
  },
59
  {
60
- "epoch": 2.31,
61
- "learning_rate": 1.2857142857142857e-05,
62
- "loss": 0.0989,
63
- "step": 60
64
  },
65
  {
66
- "epoch": 2.69,
67
- "learning_rate": 5.7142857142857145e-06,
68
- "loss": 0.0809,
 
 
 
69
  "step": 70
70
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
71
  {
72
  "epoch": 3.0,
73
- "eval_accuracy": 0.9809264305177112,
74
- "eval_loss": 0.07304801046848297,
75
- "eval_runtime": 5.4275,
76
- "eval_samples_per_second": 67.619,
77
- "eval_steps_per_second": 2.211,
78
- "step": 78
79
  },
80
  {
81
  "epoch": 3.0,
82
- "step": 78,
83
- "total_flos": 7.678887715683717e+17,
84
- "train_loss": 0.36344620203360534,
85
- "train_runtime": 415.1296,
86
- "train_samples_per_second": 23.87,
87
- "train_steps_per_second": 0.188
88
  }
89
  ],
90
  "logging_steps": 10,
91
- "max_steps": 78,
92
  "num_train_epochs": 3,
93
  "save_steps": 500,
94
- "total_flos": 7.678887715683717e+17,
95
  "trial_name": null,
96
  "trial_params": null
97
  }
 
1
  {
2
+ "best_metric": 0.6746987951807228,
3
+ "best_model_checkpoint": "vit-base-patch16-224-finetuned/checkpoint-105",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 105,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.29,
13
+ "learning_rate": 4.545454545454546e-05,
14
+ "loss": 2.8668,
15
  "step": 10
16
  },
17
  {
18
+ "epoch": 0.57,
19
+ "learning_rate": 4.5212765957446815e-05,
20
+ "loss": 2.2489,
21
  "step": 20
22
  },
23
  {
24
+ "epoch": 0.86,
25
+ "learning_rate": 3.9893617021276594e-05,
26
+ "loss": 1.8046,
27
+ "step": 30
 
 
 
28
  },
29
  {
30
+ "epoch": 1.0,
31
+ "eval_accuracy": 0.6004016064257028,
32
+ "eval_loss": 1.5307656526565552,
33
+ "eval_runtime": 7.8884,
34
+ "eval_samples_per_second": 63.131,
35
+ "eval_steps_per_second": 2.028,
36
+ "step": 35
37
  },
38
  {
39
+ "epoch": 1.14,
40
+ "learning_rate": 3.4574468085106386e-05,
41
+ "loss": 1.505,
42
  "step": 40
43
  },
44
  {
45
+ "epoch": 1.43,
46
+ "learning_rate": 2.925531914893617e-05,
47
+ "loss": 1.3769,
48
  "step": 50
49
  },
50
  {
51
+ "epoch": 1.71,
52
+ "learning_rate": 2.393617021276596e-05,
53
+ "loss": 1.2191,
54
+ "step": 60
 
 
 
55
  },
56
  {
57
+ "epoch": 2.0,
58
+ "learning_rate": 1.8617021276595745e-05,
59
+ "loss": 1.1931,
60
+ "step": 70
61
  },
62
  {
63
+ "epoch": 2.0,
64
+ "eval_accuracy": 0.6526104417670683,
65
+ "eval_loss": 1.2079730033874512,
66
+ "eval_runtime": 8.2786,
67
+ "eval_samples_per_second": 60.155,
68
+ "eval_steps_per_second": 1.933,
69
  "step": 70
70
  },
71
+ {
72
+ "epoch": 2.29,
73
+ "learning_rate": 1.3297872340425532e-05,
74
+ "loss": 1.0954,
75
+ "step": 80
76
+ },
77
+ {
78
+ "epoch": 2.57,
79
+ "learning_rate": 7.97872340425532e-06,
80
+ "loss": 1.0719,
81
+ "step": 90
82
+ },
83
+ {
84
+ "epoch": 2.86,
85
+ "learning_rate": 2.6595744680851065e-06,
86
+ "loss": 1.0292,
87
+ "step": 100
88
+ },
89
  {
90
  "epoch": 3.0,
91
+ "eval_accuracy": 0.6746987951807228,
92
+ "eval_loss": 1.1532235145568848,
93
+ "eval_runtime": 7.6457,
94
+ "eval_samples_per_second": 65.135,
95
+ "eval_steps_per_second": 2.093,
96
+ "step": 105
97
  },
98
  {
99
  "epoch": 3.0,
100
+ "step": 105,
101
+ "total_flos": 1.0402373155785892e+18,
102
+ "train_loss": 1.5203653063092912,
103
+ "train_runtime": 531.0704,
104
+ "train_samples_per_second": 25.273,
105
+ "train_steps_per_second": 0.198
106
  }
107
  ],
108
  "logging_steps": 10,
109
+ "max_steps": 105,
110
  "num_train_epochs": 3,
111
  "save_steps": 500,
112
+ "total_flos": 1.0402373155785892e+18,
113
  "trial_name": null,
114
  "trial_params": null
115
  }