paul committed on
Commit
d9ae9f5
1 Parent(s): ac29669

Training in progress, epoch 0

Browse files
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.89,
3
+ "total_flos": 1.3244442196920238e+18,
4
+ "train_loss": 0.9847671677668889,
5
+ "train_runtime": 282.6595,
6
+ "train_samples_per_second": 61.134,
7
+ "train_steps_per_second": 0.212
8
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91f1e21b4efbc795b3213a2be94be099f1aa797564526c550954b193f3826806
3
  size 343334641
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:034114a0efe89d79a82c07eb97fde02ef1dfd83832450c7003a93a1da84dfaf7
3
  size 343334641
runs/Jan18_23-31-36_teesta/events.out.tfevents.1674064916.teesta.15918.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dcf80287f8a1f30b7882cb1d3bb1d1a8d724fb8d8ffccc1d7e882ccad6d0a8e
3
- size 5464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76982b92ba47aa3623a1afa39a47cfef5ab1a05df4f92041d2e8f820e5f4340f
3
+ size 10903
runs/Jan18_23-37-50_teesta/1674065278.833225/events.out.tfevents.1674065278.teesta.15918.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8218e425882c512a281e73a87fbaaa5f0a8ee21c6af17c19a19857cbd25505f3
3
+ size 5571
runs/Jan18_23-37-50_teesta/events.out.tfevents.1674065278.teesta.15918.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f4b076c59870f2500a2565d5f933453ba8b162363cbc5ab6f96f9ad64e25867
3
+ size 5541
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.89,
3
+ "total_flos": 1.3244442196920238e+18,
4
+ "train_loss": 0.9847671677668889,
5
+ "train_runtime": 282.6595,
6
+ "train_samples_per_second": 61.134,
7
+ "train_steps_per_second": 0.212
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,181 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.875,
3
+ "best_model_checkpoint": "google-vit-base-patch16-224-cartoon-face-recognition/checkpoint-48",
4
+ "epoch": 9.88888888888889,
5
+ "global_step": 60,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.89,
12
+ "eval_accuracy": 0.24074074074074073,
13
+ "eval_f1": 0.1643869480887188,
14
+ "eval_loss": 2.792280435562134,
15
+ "eval_precision": 0.20461543357832349,
16
+ "eval_recall": 0.24074074074074073,
17
+ "eval_runtime": 7.7909,
18
+ "eval_samples_per_second": 55.449,
19
+ "eval_steps_per_second": 0.898,
20
+ "step": 6
21
+ },
22
+ {
23
+ "epoch": 1.59,
24
+ "learning_rate": 0.00011111111111111112,
25
+ "loss": 3.0606,
26
+ "step": 10
27
+ },
28
+ {
29
+ "epoch": 1.89,
30
+ "eval_accuracy": 0.5,
31
+ "eval_f1": 0.4341708558476282,
32
+ "eval_loss": 2.0185298919677734,
33
+ "eval_precision": 0.50652873651949,
34
+ "eval_recall": 0.5,
35
+ "eval_runtime": 6.5876,
36
+ "eval_samples_per_second": 65.578,
37
+ "eval_steps_per_second": 1.063,
38
+ "step": 12
39
+ },
40
+ {
41
+ "epoch": 2.89,
42
+ "eval_accuracy": 0.6620370370370371,
43
+ "eval_f1": 0.6279977278642492,
44
+ "eval_loss": 1.4164462089538574,
45
+ "eval_precision": 0.6524558387748216,
46
+ "eval_recall": 0.6620370370370371,
47
+ "eval_runtime": 6.5774,
48
+ "eval_samples_per_second": 65.679,
49
+ "eval_steps_per_second": 1.064,
50
+ "step": 18
51
+ },
52
+ {
53
+ "epoch": 3.3,
54
+ "learning_rate": 8.888888888888888e-05,
55
+ "loss": 1.688,
56
+ "step": 20
57
+ },
58
+ {
59
+ "epoch": 3.89,
60
+ "eval_accuracy": 0.7685185185185185,
61
+ "eval_f1": 0.7520520641207192,
62
+ "eval_loss": 1.0344423055648804,
63
+ "eval_precision": 0.7687545261419606,
64
+ "eval_recall": 0.7685185185185185,
65
+ "eval_runtime": 6.6855,
66
+ "eval_samples_per_second": 64.618,
67
+ "eval_steps_per_second": 1.047,
68
+ "step": 24
69
+ },
70
+ {
71
+ "epoch": 4.89,
72
+ "learning_rate": 6.666666666666667e-05,
73
+ "loss": 0.6694,
74
+ "step": 30
75
+ },
76
+ {
77
+ "epoch": 4.89,
78
+ "eval_accuracy": 0.8310185185185185,
79
+ "eval_f1": 0.8204789843927855,
80
+ "eval_loss": 0.8109782338142395,
81
+ "eval_precision": 0.8419593068227221,
82
+ "eval_recall": 0.8310185185185185,
83
+ "eval_runtime": 6.4692,
84
+ "eval_samples_per_second": 66.778,
85
+ "eval_steps_per_second": 1.082,
86
+ "step": 30
87
+ },
88
+ {
89
+ "epoch": 5.89,
90
+ "eval_accuracy": 0.8495370370370371,
91
+ "eval_f1": 0.8431889196512385,
92
+ "eval_loss": 0.680189847946167,
93
+ "eval_precision": 0.8577619498091635,
94
+ "eval_recall": 0.8495370370370371,
95
+ "eval_runtime": 6.5265,
96
+ "eval_samples_per_second": 66.192,
97
+ "eval_steps_per_second": 1.073,
98
+ "step": 36
99
+ },
100
+ {
101
+ "epoch": 6.59,
102
+ "learning_rate": 4.444444444444444e-05,
103
+ "loss": 0.285,
104
+ "step": 40
105
+ },
106
+ {
107
+ "epoch": 6.89,
108
+ "eval_accuracy": 0.8495370370370371,
109
+ "eval_f1": 0.8436215206983917,
110
+ "eval_loss": 0.6132100224494934,
111
+ "eval_precision": 0.8540014281192293,
112
+ "eval_recall": 0.8495370370370371,
113
+ "eval_runtime": 6.6157,
114
+ "eval_samples_per_second": 65.299,
115
+ "eval_steps_per_second": 1.058,
116
+ "step": 42
117
+ },
118
+ {
119
+ "epoch": 7.89,
120
+ "eval_accuracy": 0.875,
121
+ "eval_f1": 0.8707588213347532,
122
+ "eval_loss": 0.5606003403663635,
123
+ "eval_precision": 0.8799090872795438,
124
+ "eval_recall": 0.875,
125
+ "eval_runtime": 6.6491,
126
+ "eval_samples_per_second": 64.971,
127
+ "eval_steps_per_second": 1.053,
128
+ "step": 48
129
+ },
130
+ {
131
+ "epoch": 8.3,
132
+ "learning_rate": 2.222222222222222e-05,
133
+ "loss": 0.1277,
134
+ "step": 50
135
+ },
136
+ {
137
+ "epoch": 8.89,
138
+ "eval_accuracy": 0.8680555555555556,
139
+ "eval_f1": 0.864629496735875,
140
+ "eval_loss": 0.5443260669708252,
141
+ "eval_precision": 0.8753500264010703,
142
+ "eval_recall": 0.8680555555555556,
143
+ "eval_runtime": 6.7428,
144
+ "eval_samples_per_second": 64.068,
145
+ "eval_steps_per_second": 1.038,
146
+ "step": 54
147
+ },
148
+ {
149
+ "epoch": 9.89,
150
+ "learning_rate": 0.0,
151
+ "loss": 0.0779,
152
+ "step": 60
153
+ },
154
+ {
155
+ "epoch": 9.89,
156
+ "eval_accuracy": 0.8611111111111112,
157
+ "eval_f1": 0.8553095447735699,
158
+ "eval_loss": 0.5382117033004761,
159
+ "eval_precision": 0.8637558340439363,
160
+ "eval_recall": 0.8611111111111112,
161
+ "eval_runtime": 6.6834,
162
+ "eval_samples_per_second": 64.638,
163
+ "eval_steps_per_second": 1.047,
164
+ "step": 60
165
+ },
166
+ {
167
+ "epoch": 9.89,
168
+ "step": 60,
169
+ "total_flos": 1.3244442196920238e+18,
170
+ "train_loss": 0.9847671677668889,
171
+ "train_runtime": 282.6595,
172
+ "train_samples_per_second": 61.134,
173
+ "train_steps_per_second": 0.212
174
+ }
175
+ ],
176
+ "max_steps": 60,
177
+ "num_train_epochs": 10,
178
+ "total_flos": 1.3244442196920238e+18,
179
+ "trial_name": null,
180
+ "trial_params": null
181
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40feadefafde05a3eb0285865b8be78dafd5c10f6a540d0c21756a28e4fae7b0
3
  size 3439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87d5d54b686cf99be03ac991f0d0beca7d1767779b1ae8ccfa2c2784899a3894
3
  size 3439