swin-tiny-patch4-window7-224-finetuned-teeth_dataset-finetuned-teeth_dataset-V2
/
trainer_state.json
{ | |
"best_metric": 0.9260869565217391, | |
"best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-teeth_dataset-finetuned-teeth_dataset-V2/checkpoint-135", | |
"epoch": 40.0, | |
"eval_steps": 500, | |
"global_step": 150, | |
"is_hyper_param_search": false, | |
"is_local_process_zero": true, | |
"is_world_process_zero": true, | |
"log_history": [ | |
{ | |
"epoch": 0.8, | |
"eval_accuracy": 0.8391304347826087, | |
"eval_loss": 1.1266765594482422, | |
"eval_runtime": 299.2277, | |
"eval_samples_per_second": 1.537, | |
"eval_steps_per_second": 0.05, | |
"step": 3 | |
}, | |
{ | |
"epoch": 1.87, | |
"eval_accuracy": 0.8304347826086956, | |
"eval_loss": 1.0719478130340576, | |
"eval_runtime": 4.3394, | |
"eval_samples_per_second": 106.006, | |
"eval_steps_per_second": 3.457, | |
"step": 7 | |
}, | |
{ | |
"epoch": 2.67, | |
"grad_norm": 11.345915794372559, | |
"learning_rate": 3.3333333333333335e-05, | |
"loss": 0.5709, | |
"step": 10 | |
}, | |
{ | |
"epoch": 2.93, | |
"eval_accuracy": 0.8478260869565217, | |
"eval_loss": 0.944671630859375, | |
"eval_runtime": 4.3766, | |
"eval_samples_per_second": 105.105, | |
"eval_steps_per_second": 3.427, | |
"step": 11 | |
}, | |
{ | |
"epoch": 4.0, | |
"eval_accuracy": 0.8652173913043478, | |
"eval_loss": 0.8441539406776428, | |
"eval_runtime": 4.5501, | |
"eval_samples_per_second": 101.097, | |
"eval_steps_per_second": 3.297, | |
"step": 15 | |
}, | |
{ | |
"epoch": 4.8, | |
"eval_accuracy": 0.8826086956521739, | |
"eval_loss": 0.7064985632896423, | |
"eval_runtime": 4.6867, | |
"eval_samples_per_second": 98.149, | |
"eval_steps_per_second": 3.201, | |
"step": 18 | |
}, | |
{ | |
"epoch": 5.33, | |
"grad_norm": 7.515535354614258, | |
"learning_rate": 4.814814814814815e-05, | |
"loss": 0.3317, | |
"step": 20 | |
}, | |
{ | |
"epoch": 5.87, | |
"eval_accuracy": 0.8891304347826087, | |
"eval_loss": 0.6930130124092102, | |
"eval_runtime": 4.6291, | |
"eval_samples_per_second": 99.372, | |
"eval_steps_per_second": 3.24, | |
"step": 22 | |
}, | |
{ | |
"epoch": 6.93, | |
"eval_accuracy": 0.8978260869565218, | |
"eval_loss": 0.5629937648773193, | |
"eval_runtime": 4.4716, | |
"eval_samples_per_second": 102.872, | |
"eval_steps_per_second": 3.355, | |
"step": 26 | |
}, | |
{ | |
"epoch": 8.0, | |
"grad_norm": 5.26043701171875, | |
"learning_rate": 4.4444444444444447e-05, | |
"loss": 0.1576, | |
"step": 30 | |
}, | |
{ | |
"epoch": 8.0, | |
"eval_accuracy": 0.8826086956521739, | |
"eval_loss": 0.5882498025894165, | |
"eval_runtime": 4.326, | |
"eval_samples_per_second": 106.334, | |
"eval_steps_per_second": 3.467, | |
"step": 30 | |
}, | |
{ | |
"epoch": 8.8, | |
"eval_accuracy": 0.908695652173913, | |
"eval_loss": 0.5198363065719604, | |
"eval_runtime": 4.262, | |
"eval_samples_per_second": 107.93, | |
"eval_steps_per_second": 3.519, | |
"step": 33 | |
}, | |
{ | |
"epoch": 9.87, | |
"eval_accuracy": 0.9043478260869565, | |
"eval_loss": 0.4424881935119629, | |
"eval_runtime": 4.3408, | |
"eval_samples_per_second": 105.972, | |
"eval_steps_per_second": 3.456, | |
"step": 37 | |
}, | |
{ | |
"epoch": 10.67, | |
"grad_norm": 2.913085460662842, | |
"learning_rate": 4.074074074074074e-05, | |
"loss": 0.0883, | |
"step": 40 | |
}, | |
{ | |
"epoch": 10.93, | |
"eval_accuracy": 0.8978260869565218, | |
"eval_loss": 0.4727242887020111, | |
"eval_runtime": 4.3328, | |
"eval_samples_per_second": 106.168, | |
"eval_steps_per_second": 3.462, | |
"step": 41 | |
}, | |
{ | |
"epoch": 12.0, | |
"eval_accuracy": 0.9021739130434783, | |
"eval_loss": 0.4314464330673218, | |
"eval_runtime": 4.6644, | |
"eval_samples_per_second": 98.619, | |
"eval_steps_per_second": 3.216, | |
"step": 45 | |
}, | |
{ | |
"epoch": 12.8, | |
"eval_accuracy": 0.9021739130434783, | |
"eval_loss": 0.40110892057418823, | |
"eval_runtime": 4.8419, | |
"eval_samples_per_second": 95.004, | |
"eval_steps_per_second": 3.098, | |
"step": 48 | |
}, | |
{ | |
"epoch": 13.33, | |
"grad_norm": 1.2048002481460571, | |
"learning_rate": 3.7037037037037037e-05, | |
"loss": 0.051, | |
"step": 50 | |
}, | |
{ | |
"epoch": 13.87, | |
"eval_accuracy": 0.9173913043478261, | |
"eval_loss": 0.404487669467926, | |
"eval_runtime": 4.5406, | |
"eval_samples_per_second": 101.309, | |
"eval_steps_per_second": 3.304, | |
"step": 52 | |
}, | |
{ | |
"epoch": 14.93, | |
"eval_accuracy": 0.9108695652173913, | |
"eval_loss": 0.3745279610157013, | |
"eval_runtime": 4.2415, | |
"eval_samples_per_second": 108.451, | |
"eval_steps_per_second": 3.536, | |
"step": 56 | |
}, | |
{ | |
"epoch": 16.0, | |
"grad_norm": 2.0225095748901367, | |
"learning_rate": 3.3333333333333335e-05, | |
"loss": 0.0415, | |
"step": 60 | |
}, | |
{ | |
"epoch": 16.0, | |
"eval_accuracy": 0.9152173913043479, | |
"eval_loss": 0.3597088158130646, | |
"eval_runtime": 4.2243, | |
"eval_samples_per_second": 108.894, | |
"eval_steps_per_second": 3.551, | |
"step": 60 | |
}, | |
{ | |
"epoch": 16.8, | |
"eval_accuracy": 0.9065217391304348, | |
"eval_loss": 0.40161189436912537, | |
"eval_runtime": 4.2256, | |
"eval_samples_per_second": 108.86, | |
"eval_steps_per_second": 3.55, | |
"step": 63 | |
}, | |
{ | |
"epoch": 17.87, | |
"eval_accuracy": 0.9152173913043479, | |
"eval_loss": 0.3803761899471283, | |
"eval_runtime": 4.2098, | |
"eval_samples_per_second": 109.269, | |
"eval_steps_per_second": 3.563, | |
"step": 67 | |
}, | |
{ | |
"epoch": 18.67, | |
"grad_norm": 0.8873955607414246, | |
"learning_rate": 2.962962962962963e-05, | |
"loss": 0.0307, | |
"step": 70 | |
}, | |
{ | |
"epoch": 18.93, | |
"eval_accuracy": 0.9217391304347826, | |
"eval_loss": 0.351882666349411, | |
"eval_runtime": 4.3177, | |
"eval_samples_per_second": 106.538, | |
"eval_steps_per_second": 3.474, | |
"step": 71 | |
}, | |
{ | |
"epoch": 20.0, | |
"eval_accuracy": 0.8934782608695652, | |
"eval_loss": 0.4131200909614563, | |
"eval_runtime": 4.523, | |
"eval_samples_per_second": 101.703, | |
"eval_steps_per_second": 3.316, | |
"step": 75 | |
}, | |
{ | |
"epoch": 20.8, | |
"eval_accuracy": 0.9, | |
"eval_loss": 0.4047200679779053, | |
"eval_runtime": 4.74, | |
"eval_samples_per_second": 97.047, | |
"eval_steps_per_second": 3.165, | |
"step": 78 | |
}, | |
{ | |
"epoch": 21.33, | |
"grad_norm": 1.1633386611938477, | |
"learning_rate": 2.5925925925925925e-05, | |
"loss": 0.0262, | |
"step": 80 | |
}, | |
{ | |
"epoch": 21.87, | |
"eval_accuracy": 0.9173913043478261, | |
"eval_loss": 0.34501612186431885, | |
"eval_runtime": 4.8375, | |
"eval_samples_per_second": 95.09, | |
"eval_steps_per_second": 3.101, | |
"step": 82 | |
}, | |
{ | |
"epoch": 22.93, | |
"eval_accuracy": 0.9108695652173913, | |
"eval_loss": 0.36392879486083984, | |
"eval_runtime": 4.5545, | |
"eval_samples_per_second": 101.0, | |
"eval_steps_per_second": 3.293, | |
"step": 86 | |
}, | |
{ | |
"epoch": 24.0, | |
"grad_norm": 3.2603185176849365, | |
"learning_rate": 2.2222222222222223e-05, | |
"loss": 0.0208, | |
"step": 90 | |
}, | |
{ | |
"epoch": 24.0, | |
"eval_accuracy": 0.9043478260869565, | |
"eval_loss": 0.38431569933891296, | |
"eval_runtime": 4.371, | |
"eval_samples_per_second": 105.239, | |
"eval_steps_per_second": 3.432, | |
"step": 90 | |
}, | |
{ | |
"epoch": 24.8, | |
"eval_accuracy": 0.8978260869565218, | |
"eval_loss": 0.37965938448905945, | |
"eval_runtime": 4.2698, | |
"eval_samples_per_second": 107.734, | |
"eval_steps_per_second": 3.513, | |
"step": 93 | |
}, | |
{ | |
"epoch": 25.87, | |
"eval_accuracy": 0.9152173913043479, | |
"eval_loss": 0.36596596240997314, | |
"eval_runtime": 4.2147, | |
"eval_samples_per_second": 109.141, | |
"eval_steps_per_second": 3.559, | |
"step": 97 | |
}, | |
{ | |
"epoch": 26.67, | |
"grad_norm": 0.3663266599178314, | |
"learning_rate": 1.8518518518518518e-05, | |
"loss": 0.0141, | |
"step": 100 | |
}, | |
{ | |
"epoch": 26.93, | |
"eval_accuracy": 0.9152173913043479, | |
"eval_loss": 0.34451282024383545, | |
"eval_runtime": 4.4007, | |
"eval_samples_per_second": 104.529, | |
"eval_steps_per_second": 3.409, | |
"step": 101 | |
}, | |
{ | |
"epoch": 28.0, | |
"eval_accuracy": 0.9239130434782609, | |
"eval_loss": 0.3131215572357178, | |
"eval_runtime": 4.5955, | |
"eval_samples_per_second": 100.098, | |
"eval_steps_per_second": 3.264, | |
"step": 105 | |
}, | |
{ | |
"epoch": 28.8, | |
"eval_accuracy": 0.9195652173913044, | |
"eval_loss": 0.30694660544395447, | |
"eval_runtime": 4.7949, | |
"eval_samples_per_second": 95.936, | |
"eval_steps_per_second": 3.128, | |
"step": 108 | |
}, | |
{ | |
"epoch": 29.33, | |
"grad_norm": 0.8458459973335266, | |
"learning_rate": 1.4814814814814815e-05, | |
"loss": 0.0114, | |
"step": 110 | |
}, | |
{ | |
"epoch": 29.87, | |
"eval_accuracy": 0.9195652173913044, | |
"eval_loss": 0.30062630772590637, | |
"eval_runtime": 4.6098, | |
"eval_samples_per_second": 99.787, | |
"eval_steps_per_second": 3.254, | |
"step": 112 | |
}, | |
{ | |
"epoch": 30.93, | |
"eval_accuracy": 0.9239130434782609, | |
"eval_loss": 0.30970004200935364, | |
"eval_runtime": 4.5805, | |
"eval_samples_per_second": 100.425, | |
"eval_steps_per_second": 3.275, | |
"step": 116 | |
}, | |
{ | |
"epoch": 32.0, | |
"grad_norm": 0.6790540814399719, | |
"learning_rate": 1.1111111111111112e-05, | |
"loss": 0.014, | |
"step": 120 | |
}, | |
{ | |
"epoch": 32.0, | |
"eval_accuracy": 0.9173913043478261, | |
"eval_loss": 0.31208136677742004, | |
"eval_runtime": 4.2755, | |
"eval_samples_per_second": 107.59, | |
"eval_steps_per_second": 3.508, | |
"step": 120 | |
}, | |
{ | |
"epoch": 32.8, | |
"eval_accuracy": 0.9173913043478261, | |
"eval_loss": 0.3241799473762512, | |
"eval_runtime": 4.2702, | |
"eval_samples_per_second": 107.722, | |
"eval_steps_per_second": 3.513, | |
"step": 123 | |
}, | |
{ | |
"epoch": 33.87, | |
"eval_accuracy": 0.9217391304347826, | |
"eval_loss": 0.32906806468963623, | |
"eval_runtime": 4.2635, | |
"eval_samples_per_second": 107.894, | |
"eval_steps_per_second": 3.518, | |
"step": 127 | |
}, | |
{ | |
"epoch": 34.67, | |
"grad_norm": 0.5736334919929504, | |
"learning_rate": 7.4074074074074075e-06, | |
"loss": 0.016, | |
"step": 130 | |
}, | |
{ | |
"epoch": 34.93, | |
"eval_accuracy": 0.9217391304347826, | |
"eval_loss": 0.31564629077911377, | |
"eval_runtime": 4.3281, | |
"eval_samples_per_second": 106.281, | |
"eval_steps_per_second": 3.466, | |
"step": 131 | |
}, | |
{ | |
"epoch": 36.0, | |
"eval_accuracy": 0.9260869565217391, | |
"eval_loss": 0.30808836221694946, | |
"eval_runtime": 4.5545, | |
"eval_samples_per_second": 100.999, | |
"eval_steps_per_second": 3.293, | |
"step": 135 | |
}, | |
{ | |
"epoch": 36.8, | |
"eval_accuracy": 0.9260869565217391, | |
"eval_loss": 0.3083609640598297, | |
"eval_runtime": 4.8866, | |
"eval_samples_per_second": 94.135, | |
"eval_steps_per_second": 3.07, | |
"step": 138 | |
}, | |
{ | |
"epoch": 37.33, | |
"grad_norm": 1.5394645929336548, | |
"learning_rate": 3.7037037037037037e-06, | |
"loss": 0.0114, | |
"step": 140 | |
}, | |
{ | |
"epoch": 37.87, | |
"eval_accuracy": 0.9195652173913044, | |
"eval_loss": 0.3148006796836853, | |
"eval_runtime": 4.6556, | |
"eval_samples_per_second": 98.806, | |
"eval_steps_per_second": 3.222, | |
"step": 142 | |
}, | |
{ | |
"epoch": 38.93, | |
"eval_accuracy": 0.9173913043478261, | |
"eval_loss": 0.3191043436527252, | |
"eval_runtime": 4.4147, | |
"eval_samples_per_second": 104.198, | |
"eval_steps_per_second": 3.398, | |
"step": 146 | |
}, | |
{ | |
"epoch": 40.0, | |
"grad_norm": 0.860876202583313, | |
"learning_rate": 0.0, | |
"loss": 0.0091, | |
"step": 150 | |
}, | |
{ | |
"epoch": 40.0, | |
"eval_accuracy": 0.9173913043478261, | |
"eval_loss": 0.31911081075668335, | |
"eval_runtime": 4.2782, | |
"eval_samples_per_second": 107.523, | |
"eval_steps_per_second": 3.506, | |
"step": 150 | |
}, | |
{ | |
"epoch": 40.0, | |
"step": 150, | |
"total_flos": 4.585003492737024e+17, | |
"train_loss": 0.09297615384062131, | |
"train_runtime": 1186.4042, | |
"train_samples_per_second": 19.386, | |
"train_steps_per_second": 0.126 | |
} | |
], | |
"logging_steps": 10, | |
"max_steps": 150, | |
"num_input_tokens_seen": 0, | |
"num_train_epochs": 50, | |
"save_steps": 500, | |
"total_flos": 4.585003492737024e+17, | |
"train_batch_size": 32, | |
"trial_name": null, | |
"trial_params": null | |
} | |