File size: 2,076 Bytes
c3bd583 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 |
{
"best_metric": 0.3263157894736842,
"best_model_checkpoint": "cvt-13-finetuned-eurosat/checkpoint-23",
"epoch": 2.8085106382978724,
"eval_steps": 500,
"global_step": 33,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.851063829787234,
"grad_norm": 1.9627628326416016,
"learning_rate": 3.965517241379311e-05,
"loss": 2.2813,
"step": 10
},
{
"epoch": 0.9361702127659575,
"eval_accuracy": 0.21578947368421053,
"eval_loss": 2.223036766052246,
"eval_runtime": 5.5013,
"eval_samples_per_second": 34.537,
"eval_steps_per_second": 1.091,
"step": 11
},
{
"epoch": 1.702127659574468,
"grad_norm": 2.595986843109131,
"learning_rate": 2.2413793103448276e-05,
"loss": 2.2185,
"step": 20
},
{
"epoch": 1.9574468085106385,
"eval_accuracy": 0.3263157894736842,
"eval_loss": 2.154409646987915,
"eval_runtime": 6.5383,
"eval_samples_per_second": 29.059,
"eval_steps_per_second": 0.918,
"step": 23
},
{
"epoch": 2.5531914893617023,
"grad_norm": 3.4765965938568115,
"learning_rate": 5.172413793103448e-06,
"loss": 2.1776,
"step": 30
},
{
"epoch": 2.8085106382978724,
"eval_accuracy": 0.32105263157894737,
"eval_loss": 2.1354737281799316,
"eval_runtime": 6.5898,
"eval_samples_per_second": 28.832,
"eval_steps_per_second": 0.91,
"step": 33
},
{
"epoch": 2.8085106382978724,
"step": 33,
"total_flos": 7.469420390498304e+16,
"train_loss": 2.222061128327341,
"train_runtime": 204.1055,
"train_samples_per_second": 22.047,
"train_steps_per_second": 0.162
}
],
"logging_steps": 10,
"max_steps": 33,
"num_input_tokens_seen": 0,
"num_train_epochs": 3,
"save_steps": 500,
"total_flos": 7.469420390498304e+16,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}
|