dima806's picture
Upload folder using huggingface_hub
99773c7
raw
history blame contribute delete
No virus
9.55 kB
{
"best_metric": 0.7137995958328247,
"best_model_checkpoint": "dogs_70_breeds_image_detection/checkpoint-7020",
"epoch": 30.0,
"eval_steps": 500,
"global_step": 7020,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.5700534759358289,
"eval_loss": 3.8619625568389893,
"eval_runtime": 16.943,
"eval_samples_per_second": 110.37,
"eval_steps_per_second": 13.811,
"step": 234
},
{
"epoch": 2.0,
"eval_accuracy": 0.7903743315508022,
"eval_loss": 3.442793846130371,
"eval_runtime": 16.7743,
"eval_samples_per_second": 111.48,
"eval_steps_per_second": 13.95,
"step": 468
},
{
"epoch": 2.14,
"learning_rate": 9.354375896700143e-06,
"loss": 3.8066,
"step": 500
},
{
"epoch": 3.0,
"eval_accuracy": 0.8385026737967914,
"eval_loss": 3.106651782989502,
"eval_runtime": 16.721,
"eval_samples_per_second": 111.835,
"eval_steps_per_second": 13.994,
"step": 702
},
{
"epoch": 4.0,
"eval_accuracy": 0.8625668449197861,
"eval_loss": 2.8242247104644775,
"eval_runtime": 16.6814,
"eval_samples_per_second": 112.101,
"eval_steps_per_second": 14.028,
"step": 936
},
{
"epoch": 4.27,
"learning_rate": 8.637015781922526e-06,
"loss": 2.9436,
"step": 1000
},
{
"epoch": 5.0,
"eval_accuracy": 0.8748663101604278,
"eval_loss": 2.583355665206909,
"eval_runtime": 16.6174,
"eval_samples_per_second": 112.533,
"eval_steps_per_second": 14.082,
"step": 1170
},
{
"epoch": 6.0,
"eval_accuracy": 0.8903743315508021,
"eval_loss": 2.3684189319610596,
"eval_runtime": 16.679,
"eval_samples_per_second": 112.117,
"eval_steps_per_second": 14.03,
"step": 1404
},
{
"epoch": 6.41,
"learning_rate": 7.919655667144908e-06,
"loss": 2.3544,
"step": 1500
},
{
"epoch": 7.0,
"eval_accuracy": 0.8935828877005347,
"eval_loss": 2.177172899246216,
"eval_runtime": 16.7621,
"eval_samples_per_second": 111.561,
"eval_steps_per_second": 13.96,
"step": 1638
},
{
"epoch": 8.0,
"eval_accuracy": 0.9058823529411765,
"eval_loss": 2.007451295852661,
"eval_runtime": 16.6026,
"eval_samples_per_second": 112.633,
"eval_steps_per_second": 14.094,
"step": 1872
},
{
"epoch": 8.55,
"learning_rate": 7.202295552367289e-06,
"loss": 1.9032,
"step": 2000
},
{
"epoch": 9.0,
"eval_accuracy": 0.902139037433155,
"eval_loss": 1.8538062572479248,
"eval_runtime": 16.685,
"eval_samples_per_second": 112.077,
"eval_steps_per_second": 14.025,
"step": 2106
},
{
"epoch": 10.0,
"eval_accuracy": 0.9058823529411765,
"eval_loss": 1.7170625925064087,
"eval_runtime": 16.7001,
"eval_samples_per_second": 111.975,
"eval_steps_per_second": 14.012,
"step": 2340
},
{
"epoch": 10.68,
"learning_rate": 6.48493543758967e-06,
"loss": 1.5446,
"step": 2500
},
{
"epoch": 11.0,
"eval_accuracy": 0.9074866310160428,
"eval_loss": 1.5915807485580444,
"eval_runtime": 16.4868,
"eval_samples_per_second": 113.424,
"eval_steps_per_second": 14.193,
"step": 2574
},
{
"epoch": 12.0,
"eval_accuracy": 0.9117647058823529,
"eval_loss": 1.4730502367019653,
"eval_runtime": 16.6406,
"eval_samples_per_second": 112.376,
"eval_steps_per_second": 14.062,
"step": 2808
},
{
"epoch": 12.82,
"learning_rate": 5.767575322812053e-06,
"loss": 1.2629,
"step": 3000
},
{
"epoch": 13.0,
"eval_accuracy": 0.9187165775401069,
"eval_loss": 1.3681436777114868,
"eval_runtime": 16.7454,
"eval_samples_per_second": 111.672,
"eval_steps_per_second": 13.974,
"step": 3042
},
{
"epoch": 14.0,
"eval_accuracy": 0.9165775401069519,
"eval_loss": 1.2735283374786377,
"eval_runtime": 16.5505,
"eval_samples_per_second": 112.987,
"eval_steps_per_second": 14.139,
"step": 3276
},
{
"epoch": 14.96,
"learning_rate": 5.050215208034433e-06,
"loss": 1.0405,
"step": 3500
},
{
"epoch": 15.0,
"eval_accuracy": 0.9181818181818182,
"eval_loss": 1.1897326707839966,
"eval_runtime": 16.574,
"eval_samples_per_second": 112.827,
"eval_steps_per_second": 14.118,
"step": 3510
},
{
"epoch": 16.0,
"eval_accuracy": 0.9229946524064171,
"eval_loss": 1.1123002767562866,
"eval_runtime": 16.7899,
"eval_samples_per_second": 111.377,
"eval_steps_per_second": 13.937,
"step": 3744
},
{
"epoch": 17.0,
"eval_accuracy": 0.9262032085561497,
"eval_loss": 1.0538486242294312,
"eval_runtime": 16.5745,
"eval_samples_per_second": 112.824,
"eval_steps_per_second": 14.118,
"step": 3978
},
{
"epoch": 17.09,
"learning_rate": 4.332855093256815e-06,
"loss": 0.8665,
"step": 4000
},
{
"epoch": 18.0,
"eval_accuracy": 0.925668449197861,
"eval_loss": 0.9949386715888977,
"eval_runtime": 16.5637,
"eval_samples_per_second": 112.897,
"eval_steps_per_second": 14.127,
"step": 4212
},
{
"epoch": 19.0,
"eval_accuracy": 0.9262032085561497,
"eval_loss": 0.9491089582443237,
"eval_runtime": 16.5976,
"eval_samples_per_second": 112.667,
"eval_steps_per_second": 14.098,
"step": 4446
},
{
"epoch": 19.23,
"learning_rate": 3.615494978479197e-06,
"loss": 0.7318,
"step": 4500
},
{
"epoch": 20.0,
"eval_accuracy": 0.9315508021390374,
"eval_loss": 0.8963261246681213,
"eval_runtime": 16.6332,
"eval_samples_per_second": 112.426,
"eval_steps_per_second": 14.068,
"step": 4680
},
{
"epoch": 21.0,
"eval_accuracy": 0.9294117647058824,
"eval_loss": 0.8556962609291077,
"eval_runtime": 17.2231,
"eval_samples_per_second": 108.575,
"eval_steps_per_second": 13.586,
"step": 4914
},
{
"epoch": 21.37,
"learning_rate": 2.898134863701578e-06,
"loss": 0.6322,
"step": 5000
},
{
"epoch": 22.0,
"eval_accuracy": 0.9336898395721925,
"eval_loss": 0.8246510624885559,
"eval_runtime": 16.769,
"eval_samples_per_second": 111.515,
"eval_steps_per_second": 13.954,
"step": 5148
},
{
"epoch": 23.0,
"eval_accuracy": 0.932620320855615,
"eval_loss": 0.8025164604187012,
"eval_runtime": 16.8215,
"eval_samples_per_second": 111.167,
"eval_steps_per_second": 13.911,
"step": 5382
},
{
"epoch": 23.5,
"learning_rate": 2.18077474892396e-06,
"loss": 0.5623,
"step": 5500
},
{
"epoch": 24.0,
"eval_accuracy": 0.9299465240641711,
"eval_loss": 0.778028666973114,
"eval_runtime": 16.7832,
"eval_samples_per_second": 111.421,
"eval_steps_per_second": 13.943,
"step": 5616
},
{
"epoch": 25.0,
"eval_accuracy": 0.9347593582887701,
"eval_loss": 0.7549712657928467,
"eval_runtime": 16.589,
"eval_samples_per_second": 112.725,
"eval_steps_per_second": 14.106,
"step": 5850
},
{
"epoch": 25.64,
"learning_rate": 1.4634146341463414e-06,
"loss": 0.5055,
"step": 6000
},
{
"epoch": 26.0,
"eval_accuracy": 0.9336898395721925,
"eval_loss": 0.7411012649536133,
"eval_runtime": 16.9543,
"eval_samples_per_second": 110.297,
"eval_steps_per_second": 13.802,
"step": 6084
},
{
"epoch": 27.0,
"eval_accuracy": 0.9358288770053476,
"eval_loss": 0.729629397392273,
"eval_runtime": 16.9047,
"eval_samples_per_second": 110.62,
"eval_steps_per_second": 13.842,
"step": 6318
},
{
"epoch": 27.78,
"learning_rate": 7.460545193687231e-07,
"loss": 0.4743,
"step": 6500
},
{
"epoch": 28.0,
"eval_accuracy": 0.9331550802139037,
"eval_loss": 0.7210513949394226,
"eval_runtime": 16.6036,
"eval_samples_per_second": 112.626,
"eval_steps_per_second": 14.093,
"step": 6552
},
{
"epoch": 29.0,
"eval_accuracy": 0.9358288770053476,
"eval_loss": 0.7155081629753113,
"eval_runtime": 16.7145,
"eval_samples_per_second": 111.879,
"eval_steps_per_second": 14.0,
"step": 6786
},
{
"epoch": 29.91,
"learning_rate": 2.869440459110474e-08,
"loss": 0.457,
"step": 7000
},
{
"epoch": 30.0,
"eval_accuracy": 0.9352941176470588,
"eval_loss": 0.7137995958328247,
"eval_runtime": 16.6482,
"eval_samples_per_second": 112.325,
"eval_steps_per_second": 14.056,
"step": 7020
}
],
"logging_steps": 500,
"max_steps": 7020,
"num_train_epochs": 30,
"save_steps": 500,
"total_flos": 1.7390651600583475e+19,
"trial_name": null,
"trial_params": null
}