File size: 4,819 Bytes
3a04ddc |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 |
{
"best_metric": 0.49596309111880044,
"best_model_checkpoint": "beit-base-patch16-224-pt22k-ft22k-finetuned-FER2013CKPlus-7e-05-finetuned-SFEW-7e-05/checkpoint-126",
"epoch": 9.96551724137931,
"global_step": 140,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.69,
"learning_rate": 4.9999999999999996e-05,
"loss": 2.1509,
"step": 10
},
{
"epoch": 0.97,
"eval_accuracy": 0.37254901960784315,
"eval_loss": 1.6920275688171387,
"eval_runtime": 10.5629,
"eval_samples_per_second": 82.079,
"eval_steps_per_second": 2.651,
"step": 14
},
{
"epoch": 1.41,
"learning_rate": 6.666666666666666e-05,
"loss": 1.6764,
"step": 20
},
{
"epoch": 1.97,
"eval_accuracy": 0.46943483275663206,
"eval_loss": 1.5035290718078613,
"eval_runtime": 15.6046,
"eval_samples_per_second": 55.561,
"eval_steps_per_second": 1.794,
"step": 28
},
{
"epoch": 2.14,
"learning_rate": 6.111111111111111e-05,
"loss": 1.4471,
"step": 30
},
{
"epoch": 2.83,
"learning_rate": 5.5555555555555545e-05,
"loss": 1.2723,
"step": 40
},
{
"epoch": 2.97,
"eval_accuracy": 0.46943483275663206,
"eval_loss": 1.5060927867889404,
"eval_runtime": 10.6696,
"eval_samples_per_second": 81.259,
"eval_steps_per_second": 2.624,
"step": 42
},
{
"epoch": 3.55,
"learning_rate": 4.9999999999999996e-05,
"loss": 1.1746,
"step": 50
},
{
"epoch": 3.97,
"eval_accuracy": 0.4728950403690888,
"eval_loss": 1.5421292781829834,
"eval_runtime": 11.4458,
"eval_samples_per_second": 75.748,
"eval_steps_per_second": 2.446,
"step": 56
},
{
"epoch": 4.28,
"learning_rate": 4.444444444444444e-05,
"loss": 1.153,
"step": 60
},
{
"epoch": 4.97,
"learning_rate": 3.8888888888888884e-05,
"loss": 0.9954,
"step": 70
},
{
"epoch": 4.97,
"eval_accuracy": 0.4786620530565167,
"eval_loss": 1.565744400024414,
"eval_runtime": 10.8831,
"eval_samples_per_second": 79.665,
"eval_steps_per_second": 2.573,
"step": 70
},
{
"epoch": 5.69,
"learning_rate": 3.333333333333333e-05,
"loss": 1.0029,
"step": 80
},
{
"epoch": 5.97,
"eval_accuracy": 0.4844290657439446,
"eval_loss": 1.586708664894104,
"eval_runtime": 10.6127,
"eval_samples_per_second": 81.695,
"eval_steps_per_second": 2.638,
"step": 84
},
{
"epoch": 6.41,
"learning_rate": 2.7777777777777772e-05,
"loss": 0.9139,
"step": 90
},
{
"epoch": 6.97,
"eval_accuracy": 0.48788927335640137,
"eval_loss": 1.594279408454895,
"eval_runtime": 10.6847,
"eval_samples_per_second": 81.144,
"eval_steps_per_second": 2.621,
"step": 98
},
{
"epoch": 7.14,
"learning_rate": 2.222222222222222e-05,
"loss": 0.9519,
"step": 100
},
{
"epoch": 7.83,
"learning_rate": 1.6666666666666664e-05,
"loss": 0.8335,
"step": 110
},
{
"epoch": 7.97,
"eval_accuracy": 0.48904267589388695,
"eval_loss": 1.6002804040908813,
"eval_runtime": 11.2046,
"eval_samples_per_second": 77.379,
"eval_steps_per_second": 2.499,
"step": 112
},
{
"epoch": 8.55,
"learning_rate": 1.111111111111111e-05,
"loss": 0.8382,
"step": 120
},
{
"epoch": 8.97,
"eval_accuracy": 0.49596309111880044,
"eval_loss": 1.5628858804702759,
"eval_runtime": 10.522,
"eval_samples_per_second": 82.399,
"eval_steps_per_second": 2.661,
"step": 126
},
{
"epoch": 9.28,
"learning_rate": 5.555555555555555e-06,
"loss": 0.7749,
"step": 130
},
{
"epoch": 9.97,
"learning_rate": 0.0,
"loss": 0.7169,
"step": 140
},
{
"epoch": 9.97,
"eval_accuracy": 0.4855824682814302,
"eval_loss": 1.5772030353546143,
"eval_runtime": 10.4436,
"eval_samples_per_second": 83.017,
"eval_steps_per_second": 2.681,
"step": 140
},
{
"epoch": 9.97,
"step": 140,
"total_flos": 1.427863337526786e+18,
"train_loss": 1.1358447994504657,
"train_runtime": 1053.1568,
"train_samples_per_second": 17.557,
"train_steps_per_second": 0.133
}
],
"max_steps": 140,
"num_train_epochs": 10,
"total_flos": 1.427863337526786e+18,
"trial_name": null,
"trial_params": null
}
|