albert-base-spanish-finetuned-pos / trainer_state.json
josecannete's picture
adding model finetuned on POS
ceeb921
{
"best_metric": 0.06187893822789192,
"best_model_checkpoint": "/data/jcanete/all_results/pos/albeto_base/epochs_4_bs_32_lr_5e-5/checkpoint-1350",
"epoch": 4.0,
"global_step": 1792,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.11,
"eval_accuracy": 0.9025092763592619,
"eval_f1": 0.8763735719801217,
"eval_loss": 0.4775541126728058,
"eval_precision": 0.8685320722877382,
"eval_recall": 0.8843579548860163,
"eval_runtime": 2.1198,
"eval_samples_per_second": 780.25,
"eval_steps_per_second": 24.53,
"step": 50
},
{
"epoch": 0.22,
"eval_accuracy": 0.9586079531014384,
"eval_f1": 0.9548124582381745,
"eval_loss": 0.18812087178230286,
"eval_precision": 0.9532058940661091,
"eval_recall": 0.9564244470639948,
"eval_runtime": 2.0628,
"eval_samples_per_second": 801.819,
"eval_steps_per_second": 25.208,
"step": 100
},
{
"epoch": 0.33,
"eval_accuracy": 0.9670795140712628,
"eval_f1": 0.9638712895984035,
"eval_loss": 0.1361953318119049,
"eval_precision": 0.9626898393590305,
"eval_recall": 0.9650556432438913,
"eval_runtime": 2.0682,
"eval_samples_per_second": 799.741,
"eval_steps_per_second": 25.143,
"step": 150
},
{
"epoch": 0.45,
"eval_accuracy": 0.9724504837261314,
"eval_f1": 0.9702885315927622,
"eval_loss": 0.114054836332798,
"eval_precision": 0.9693694412316037,
"eval_recall": 0.9712093664462248,
"eval_runtime": 2.0767,
"eval_samples_per_second": 796.445,
"eval_steps_per_second": 25.039,
"step": 200
},
{
"epoch": 0.56,
"eval_accuracy": 0.9757543925043628,
"eval_f1": 0.9740005591277607,
"eval_loss": 0.09939529001712799,
"eval_precision": 0.9734757010278415,
"eval_recall": 0.9745259834968333,
"eval_runtime": 2.0489,
"eval_samples_per_second": 807.255,
"eval_steps_per_second": 25.379,
"step": 250
},
{
"epoch": 0.67,
"eval_accuracy": 0.9776689652835432,
"eval_f1": 0.9757610820731757,
"eval_loss": 0.088424913585186,
"eval_precision": 0.9743033007310611,
"eval_recall": 0.9772232323030509,
"eval_runtime": 2.0999,
"eval_samples_per_second": 787.646,
"eval_steps_per_second": 24.763,
"step": 300
},
{
"epoch": 0.78,
"eval_accuracy": 0.9774148184544484,
"eval_f1": 0.9754915162941018,
"eval_loss": 0.08702255040407181,
"eval_precision": 0.9740438247011952,
"eval_recall": 0.9769435176120357,
"eval_runtime": 2.0824,
"eval_samples_per_second": 794.288,
"eval_steps_per_second": 24.972,
"step": 350
},
{
"epoch": 0.89,
"eval_accuracy": 0.9789905287948357,
"eval_f1": 0.977314445331205,
"eval_loss": 0.07801014184951782,
"eval_precision": 0.9759708302616111,
"eval_recall": 0.9786617649997003,
"eval_runtime": 2.0909,
"eval_samples_per_second": 791.042,
"eval_steps_per_second": 24.87,
"step": 400
},
{
"epoch": 1.0,
"eval_accuracy": 0.9785669507463445,
"eval_f1": 0.9774886245709268,
"eval_loss": 0.08075062185525894,
"eval_precision": 0.9763779527559056,
"eval_recall": 0.9786018261373399,
"eval_runtime": 2.0836,
"eval_samples_per_second": 793.818,
"eval_steps_per_second": 24.957,
"step": 450
},
{
"epoch": 1.12,
"learning_rate": 3.6132812500000005e-05,
"loss": 0.241,
"step": 500
},
{
"epoch": 1.12,
"eval_accuracy": 0.9803968079158266,
"eval_f1": 0.9791845450735426,
"eval_loss": 0.07434948533773422,
"eval_precision": 0.978091421964396,
"eval_recall": 0.9802801142834309,
"eval_runtime": 2.089,
"eval_samples_per_second": 791.781,
"eval_steps_per_second": 24.893,
"step": 500
},
{
"epoch": 1.23,
"eval_accuracy": 0.9808542722081971,
"eval_f1": 0.9793645725233495,
"eval_loss": 0.0712265595793724,
"eval_precision": 0.9782517691617661,
"eval_recall": 0.9804799104912989,
"eval_runtime": 2.1304,
"eval_samples_per_second": 776.388,
"eval_steps_per_second": 24.409,
"step": 550
},
{
"epoch": 1.34,
"eval_accuracy": 0.981531997085783,
"eval_f1": 0.9805385337032675,
"eval_loss": 0.07107982784509659,
"eval_precision": 0.9795999760703532,
"eval_recall": 0.9814788915306387,
"eval_runtime": 2.1757,
"eval_samples_per_second": 760.207,
"eval_steps_per_second": 23.9,
"step": 600
},
{
"epoch": 1.45,
"eval_accuracy": 0.9790413581606546,
"eval_f1": 0.9788185948968892,
"eval_loss": 0.07391183823347092,
"eval_precision": 0.9784961265074674,
"eval_recall": 0.9791412758985835,
"eval_runtime": 2.0804,
"eval_samples_per_second": 795.028,
"eval_steps_per_second": 24.995,
"step": 650
},
{
"epoch": 1.56,
"eval_accuracy": 0.9813286796225072,
"eval_f1": 0.9801365487502994,
"eval_loss": 0.0686594694852829,
"eval_precision": 0.9793349689825065,
"eval_recall": 0.9809394417693952,
"eval_runtime": 2.0741,
"eval_samples_per_second": 797.437,
"eval_steps_per_second": 25.071,
"step": 700
},
{
"epoch": 1.67,
"eval_accuracy": 0.9802104335744904,
"eval_f1": 0.9797732607501373,
"eval_loss": 0.07021336257457733,
"eval_precision": 0.9796460530520933,
"eval_recall": 0.9799005014884817,
"eval_runtime": 2.1147,
"eval_samples_per_second": 782.145,
"eval_steps_per_second": 24.59,
"step": 750
},
{
"epoch": 1.79,
"eval_accuracy": 0.9814303383541452,
"eval_f1": 0.9805597435923037,
"eval_loss": 0.0652608796954155,
"eval_precision": 0.9800606762205102,
"eval_recall": 0.981059319494116,
"eval_runtime": 2.0748,
"eval_samples_per_second": 797.185,
"eval_steps_per_second": 25.063,
"step": 800
},
{
"epoch": 1.9,
"eval_accuracy": 0.981921688890395,
"eval_f1": 0.9809404063385623,
"eval_loss": 0.06410165876150131,
"eval_precision": 0.9798648352305576,
"eval_recall": 0.9820183412918823,
"eval_runtime": 2.0778,
"eval_samples_per_second": 796.04,
"eval_steps_per_second": 25.027,
"step": 850
},
{
"epoch": 2.01,
"eval_accuracy": 0.9811253621592314,
"eval_f1": 0.9806592046010524,
"eval_loss": 0.06488435715436935,
"eval_precision": 0.9801796407185629,
"eval_recall": 0.9811392379772632,
"eval_runtime": 2.1012,
"eval_samples_per_second": 787.158,
"eval_steps_per_second": 24.747,
"step": 900
},
{
"epoch": 2.12,
"eval_accuracy": 0.981921688890395,
"eval_f1": 0.980970827259839,
"eval_loss": 0.06455742567777634,
"eval_precision": 0.9803835485222805,
"eval_recall": 0.981558810013786,
"eval_runtime": 2.0619,
"eval_samples_per_second": 802.191,
"eval_steps_per_second": 25.22,
"step": 950
},
{
"epoch": 2.23,
"learning_rate": 2.2181919642857143e-05,
"loss": 0.0552,
"step": 1000
},
{
"epoch": 2.23,
"eval_accuracy": 0.9817522576709985,
"eval_f1": 0.9810314877303675,
"eval_loss": 0.06508930027484894,
"eval_precision": 0.9804050683428115,
"eval_recall": 0.9816587081177199,
"eval_runtime": 2.1717,
"eval_samples_per_second": 761.606,
"eval_steps_per_second": 23.944,
"step": 1000
},
{
"epoch": 2.34,
"eval_accuracy": 0.9813117365005676,
"eval_f1": 0.9809139731278326,
"eval_loss": 0.06810390949249268,
"eval_precision": 0.9801703672671415,
"eval_recall": 0.9816587081177199,
"eval_runtime": 2.0658,
"eval_samples_per_second": 800.673,
"eval_steps_per_second": 25.172,
"step": 1050
},
{
"epoch": 2.46,
"eval_accuracy": 0.9818539164026363,
"eval_f1": 0.9811795481094681,
"eval_loss": 0.06340151280164719,
"eval_precision": 0.9806410409930947,
"eval_recall": 0.9817186469800803,
"eval_runtime": 2.0822,
"eval_samples_per_second": 794.348,
"eval_steps_per_second": 24.973,
"step": 1100
},
{
"epoch": 2.57,
"eval_accuracy": 0.9818369732806967,
"eval_f1": 0.9809949692565679,
"eval_loss": 0.06365738064050674,
"eval_precision": 0.9801926874513793,
"eval_recall": 0.9817985654632275,
"eval_runtime": 2.0674,
"eval_samples_per_second": 800.041,
"eval_steps_per_second": 25.152,
"step": 1150
},
{
"epoch": 2.68,
"eval_accuracy": 0.9816336558174209,
"eval_f1": 0.9807511830834048,
"eval_loss": 0.06771722435951233,
"eval_precision": 0.9801640358404342,
"eval_recall": 0.9813390341851311,
"eval_runtime": 2.1084,
"eval_samples_per_second": 784.48,
"eval_steps_per_second": 24.663,
"step": 1200
},
{
"epoch": 2.79,
"eval_accuracy": 0.9821419494756104,
"eval_f1": 0.9814700185699169,
"eval_loss": 0.06466551870107651,
"eval_precision": 0.9808824409810222,
"eval_recall": 0.9820583005334559,
"eval_runtime": 2.0736,
"eval_samples_per_second": 797.648,
"eval_steps_per_second": 25.077,
"step": 1250
},
{
"epoch": 2.9,
"eval_accuracy": 0.9823113806950069,
"eval_f1": 0.9817473789316026,
"eval_loss": 0.06309983134269714,
"eval_precision": 0.9812770713986307,
"eval_recall": 0.9822181374997503,
"eval_runtime": 2.0792,
"eval_samples_per_second": 795.5,
"eval_steps_per_second": 25.01,
"step": 1300
},
{
"epoch": 3.01,
"eval_accuracy": 0.9825994137679809,
"eval_f1": 0.9820124843945068,
"eval_loss": 0.06187893822789192,
"eval_precision": 0.9817869553061469,
"eval_recall": 0.9822381171205371,
"eval_runtime": 2.1014,
"eval_samples_per_second": 787.097,
"eval_steps_per_second": 24.745,
"step": 1350
},
{
"epoch": 3.12,
"eval_accuracy": 0.9825994137679809,
"eval_f1": 0.982114145903031,
"eval_loss": 0.06504332274198532,
"eval_precision": 0.9817905918057663,
"eval_recall": 0.982437913328405,
"eval_runtime": 2.0928,
"eval_samples_per_second": 790.338,
"eval_steps_per_second": 24.847,
"step": 1400
},
{
"epoch": 3.24,
"eval_accuracy": 0.9826502431337998,
"eval_f1": 0.9820854386770786,
"eval_loss": 0.06560202687978745,
"eval_precision": 0.9816933181609471,
"eval_recall": 0.9824778725699786,
"eval_runtime": 2.107,
"eval_samples_per_second": 785.001,
"eval_steps_per_second": 24.68,
"step": 1450
},
{
"epoch": 3.35,
"learning_rate": 8.231026785714286e-06,
"loss": 0.0349,
"step": 1500
},
{
"epoch": 3.35,
"eval_accuracy": 0.9823283238169465,
"eval_f1": 0.9818849987017915,
"eval_loss": 0.06487075239419937,
"eval_precision": 0.9815321340866892,
"eval_recall": 0.9822381171205371,
"eval_runtime": 2.0794,
"eval_samples_per_second": 795.421,
"eval_steps_per_second": 25.007,
"step": 1500
},
{
"epoch": 3.46,
"eval_accuracy": 0.9819894613781536,
"eval_f1": 0.9817542668251226,
"eval_loss": 0.06555231660604477,
"eval_precision": 0.9814504213090531,
"eval_recall": 0.9820583005334559,
"eval_runtime": 2.0691,
"eval_samples_per_second": 799.369,
"eval_steps_per_second": 25.131,
"step": 1550
},
{
"epoch": 3.57,
"eval_accuracy": 0.9817353145490588,
"eval_f1": 0.9813986013986015,
"eval_loss": 0.0676359012722969,
"eval_precision": 0.9814182101540491,
"eval_recall": 0.9813789934267048,
"eval_runtime": 2.0661,
"eval_samples_per_second": 800.526,
"eval_steps_per_second": 25.168,
"step": 1600
},
{
"epoch": 3.68,
"eval_accuracy": 0.9817014283051795,
"eval_f1": 0.9812628593116398,
"eval_loss": 0.06634774059057236,
"eval_precision": 0.981066885023267,
"eval_recall": 0.9814589119098519,
"eval_runtime": 2.0684,
"eval_samples_per_second": 799.649,
"eval_steps_per_second": 25.14,
"step": 1650
},
{
"epoch": 3.79,
"eval_accuracy": 0.9819894613781536,
"eval_f1": 0.981464466903687,
"eval_loss": 0.06648925691843033,
"eval_precision": 0.9811705037838702,
"eval_recall": 0.9817586062216539,
"eval_runtime": 2.0825,
"eval_samples_per_second": 794.254,
"eval_steps_per_second": 24.97,
"step": 1700
},
{
"epoch": 3.91,
"eval_accuracy": 0.9822605513291879,
"eval_f1": 0.9816685969886978,
"eval_loss": 0.06550350040197372,
"eval_precision": 0.9811396068256661,
"eval_recall": 0.9821981578789635,
"eval_runtime": 2.0814,
"eval_samples_per_second": 794.645,
"eval_steps_per_second": 24.983,
"step": 1750
},
{
"epoch": 4.0,
"step": 1792,
"total_flos": 211503244790400.0,
"train_loss": 0.09681594052485057,
"train_runtime": 1409.8405,
"train_samples_per_second": 40.586,
"train_steps_per_second": 1.271
}
],
"max_steps": 1792,
"num_train_epochs": 4,
"total_flos": 211503244790400.0,
"trial_name": null,
"trial_params": null
}