LexLLMv0.0.0.x.10.6.1c / trainer_state.json
andrealexroom's picture
Upload folder using huggingface_hub
d9145a6 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.9333794774182385,
"eval_steps": 93,
"global_step": 2697,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 1e-05,
"loss": 1.466,
"step": 1
},
{
"epoch": 0.03,
"learning_rate": 1e-05,
"loss": 1.3439,
"step": 93
},
{
"epoch": 0.03,
"eval_validation_privacy_sources_loss": 0.9993858337402344,
"eval_validation_privacy_sources_runtime": 208.8742,
"eval_validation_privacy_sources_samples_per_second": 2.758,
"eval_validation_privacy_sources_steps_per_second": 1.379,
"step": 93
},
{
"epoch": 0.03,
"eval_validation_agenda_digitale_loss": 1.5262001752853394,
"eval_validation_agenda_digitale_runtime": 186.7009,
"eval_validation_agenda_digitale_samples_per_second": 2.753,
"eval_validation_agenda_digitale_steps_per_second": 1.377,
"step": 93
},
{
"epoch": 0.03,
"eval_validation_leggepertutti_loss": 1.393169641494751,
"eval_validation_leggepertutti_runtime": 36.5278,
"eval_validation_leggepertutti_samples_per_second": 2.765,
"eval_validation_leggepertutti_steps_per_second": 1.396,
"step": 93
},
{
"epoch": 0.03,
"eval_validation_altalexprivacy_loss": 1.3749068975448608,
"eval_validation_altalexprivacy_runtime": 59.1055,
"eval_validation_altalexprivacy_samples_per_second": 2.758,
"eval_validation_altalexprivacy_steps_per_second": 1.387,
"step": 93
},
{
"epoch": 0.06,
"learning_rate": 1e-05,
"loss": 1.2277,
"step": 186
},
{
"epoch": 0.06,
"eval_validation_privacy_sources_loss": 0.9398746490478516,
"eval_validation_privacy_sources_runtime": 207.7931,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 186
},
{
"epoch": 0.06,
"eval_validation_agenda_digitale_loss": 1.4900918006896973,
"eval_validation_agenda_digitale_runtime": 185.4857,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 186
},
{
"epoch": 0.06,
"eval_validation_leggepertutti_loss": 1.3686381578445435,
"eval_validation_leggepertutti_runtime": 36.4651,
"eval_validation_leggepertutti_samples_per_second": 2.77,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 186
},
{
"epoch": 0.06,
"eval_validation_altalexprivacy_loss": 1.3352404832839966,
"eval_validation_altalexprivacy_runtime": 58.8108,
"eval_validation_altalexprivacy_samples_per_second": 2.772,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 186
},
{
"epoch": 0.1,
"learning_rate": 1e-05,
"loss": 1.1989,
"step": 279
},
{
"epoch": 0.1,
"eval_validation_privacy_sources_loss": 0.9079627990722656,
"eval_validation_privacy_sources_runtime": 207.7801,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 279
},
{
"epoch": 0.1,
"eval_validation_agenda_digitale_loss": 1.4663112163543701,
"eval_validation_agenda_digitale_runtime": 185.4551,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 279
},
{
"epoch": 0.1,
"eval_validation_leggepertutti_loss": 1.3589648008346558,
"eval_validation_leggepertutti_runtime": 36.4528,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 279
},
{
"epoch": 0.1,
"eval_validation_altalexprivacy_loss": 1.3104432821273804,
"eval_validation_altalexprivacy_runtime": 58.8143,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 279
},
{
"epoch": 0.13,
"learning_rate": 1e-05,
"loss": 1.166,
"step": 372
},
{
"epoch": 0.13,
"eval_validation_privacy_sources_loss": 0.8864494562149048,
"eval_validation_privacy_sources_runtime": 207.7989,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 372
},
{
"epoch": 0.13,
"eval_validation_agenda_digitale_loss": 1.4535290002822876,
"eval_validation_agenda_digitale_runtime": 185.4338,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 372
},
{
"epoch": 0.13,
"eval_validation_leggepertutti_loss": 1.3470954895019531,
"eval_validation_leggepertutti_runtime": 36.4554,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 372
},
{
"epoch": 0.13,
"eval_validation_altalexprivacy_loss": 1.2923557758331299,
"eval_validation_altalexprivacy_runtime": 58.8034,
"eval_validation_altalexprivacy_samples_per_second": 2.772,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 372
},
{
"epoch": 0.16,
"learning_rate": 1e-05,
"loss": 1.1502,
"step": 465
},
{
"epoch": 0.16,
"eval_validation_privacy_sources_loss": 0.8700113296508789,
"eval_validation_privacy_sources_runtime": 207.7896,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 465
},
{
"epoch": 0.16,
"eval_validation_agenda_digitale_loss": 1.4420515298843384,
"eval_validation_agenda_digitale_runtime": 185.5107,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 465
},
{
"epoch": 0.16,
"eval_validation_leggepertutti_loss": 1.3380672931671143,
"eval_validation_leggepertutti_runtime": 36.4532,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 465
},
{
"epoch": 0.16,
"eval_validation_altalexprivacy_loss": 1.2828154563903809,
"eval_validation_altalexprivacy_runtime": 58.7825,
"eval_validation_altalexprivacy_samples_per_second": 2.773,
"eval_validation_altalexprivacy_steps_per_second": 1.395,
"step": 465
},
{
"epoch": 0.19,
"learning_rate": 1e-05,
"loss": 1.1293,
"step": 558
},
{
"epoch": 0.19,
"eval_validation_privacy_sources_loss": 0.8583760857582092,
"eval_validation_privacy_sources_runtime": 207.7778,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 558
},
{
"epoch": 0.19,
"eval_validation_agenda_digitale_loss": 1.4329832792282104,
"eval_validation_agenda_digitale_runtime": 185.4109,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 558
},
{
"epoch": 0.19,
"eval_validation_leggepertutti_loss": 1.332190752029419,
"eval_validation_leggepertutti_runtime": 36.4466,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 558
},
{
"epoch": 0.19,
"eval_validation_altalexprivacy_loss": 1.2727842330932617,
"eval_validation_altalexprivacy_runtime": 58.812,
"eval_validation_altalexprivacy_samples_per_second": 2.772,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 558
},
{
"epoch": 0.23,
"learning_rate": 1e-05,
"loss": 1.1214,
"step": 651
},
{
"epoch": 0.23,
"eval_validation_privacy_sources_loss": 0.8476831912994385,
"eval_validation_privacy_sources_runtime": 207.83,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 651
},
{
"epoch": 0.23,
"eval_validation_agenda_digitale_loss": 1.4262702465057373,
"eval_validation_agenda_digitale_runtime": 185.4527,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 651
},
{
"epoch": 0.23,
"eval_validation_leggepertutti_loss": 1.3270900249481201,
"eval_validation_leggepertutti_runtime": 36.4393,
"eval_validation_leggepertutti_samples_per_second": 2.772,
"eval_validation_leggepertutti_steps_per_second": 1.4,
"step": 651
},
{
"epoch": 0.23,
"eval_validation_altalexprivacy_loss": 1.260352611541748,
"eval_validation_altalexprivacy_runtime": 58.8334,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 651
},
{
"epoch": 0.26,
"learning_rate": 1e-05,
"loss": 1.1091,
"step": 744
},
{
"epoch": 0.26,
"eval_validation_privacy_sources_loss": 0.8393220901489258,
"eval_validation_privacy_sources_runtime": 207.8694,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 744
},
{
"epoch": 0.26,
"eval_validation_agenda_digitale_loss": 1.419695258140564,
"eval_validation_agenda_digitale_runtime": 185.5111,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 744
},
{
"epoch": 0.26,
"eval_validation_leggepertutti_loss": 1.3253276348114014,
"eval_validation_leggepertutti_runtime": 36.4703,
"eval_validation_leggepertutti_samples_per_second": 2.769,
"eval_validation_leggepertutti_steps_per_second": 1.398,
"step": 744
},
{
"epoch": 0.26,
"eval_validation_altalexprivacy_loss": 1.2589938640594482,
"eval_validation_altalexprivacy_runtime": 58.8276,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 744
},
{
"epoch": 0.29,
"learning_rate": 1e-05,
"loss": 1.1054,
"step": 837
},
{
"epoch": 0.29,
"eval_validation_privacy_sources_loss": 0.8303313851356506,
"eval_validation_privacy_sources_runtime": 207.8766,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 837
},
{
"epoch": 0.29,
"eval_validation_agenda_digitale_loss": 1.4135520458221436,
"eval_validation_agenda_digitale_runtime": 185.5466,
"eval_validation_agenda_digitale_samples_per_second": 2.77,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 837
},
{
"epoch": 0.29,
"eval_validation_leggepertutti_loss": 1.3197592496871948,
"eval_validation_leggepertutti_runtime": 36.4762,
"eval_validation_leggepertutti_samples_per_second": 2.769,
"eval_validation_leggepertutti_steps_per_second": 1.398,
"step": 837
},
{
"epoch": 0.29,
"eval_validation_altalexprivacy_loss": 1.248721957206726,
"eval_validation_altalexprivacy_runtime": 58.845,
"eval_validation_altalexprivacy_samples_per_second": 2.77,
"eval_validation_altalexprivacy_steps_per_second": 1.393,
"step": 837
},
{
"epoch": 0.32,
"learning_rate": 1e-05,
"loss": 1.0981,
"step": 930
},
{
"epoch": 0.32,
"eval_validation_privacy_sources_loss": 0.8243758678436279,
"eval_validation_privacy_sources_runtime": 207.9136,
"eval_validation_privacy_sources_samples_per_second": 2.77,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 930
},
{
"epoch": 0.32,
"eval_validation_agenda_digitale_loss": 1.4070162773132324,
"eval_validation_agenda_digitale_runtime": 185.5276,
"eval_validation_agenda_digitale_samples_per_second": 2.77,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 930
},
{
"epoch": 0.32,
"eval_validation_leggepertutti_loss": 1.3205946683883667,
"eval_validation_leggepertutti_runtime": 36.4768,
"eval_validation_leggepertutti_samples_per_second": 2.769,
"eval_validation_leggepertutti_steps_per_second": 1.398,
"step": 930
},
{
"epoch": 0.32,
"eval_validation_altalexprivacy_loss": 1.236555576324463,
"eval_validation_altalexprivacy_runtime": 58.8174,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 930
},
{
"epoch": 0.35,
"learning_rate": 1e-05,
"loss": 1.0826,
"step": 1023
},
{
"epoch": 0.35,
"eval_validation_privacy_sources_loss": 0.8142690062522888,
"eval_validation_privacy_sources_runtime": 207.8182,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1023
},
{
"epoch": 0.35,
"eval_validation_agenda_digitale_loss": 1.4016144275665283,
"eval_validation_agenda_digitale_runtime": 185.5524,
"eval_validation_agenda_digitale_samples_per_second": 2.77,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 1023
},
{
"epoch": 0.35,
"eval_validation_leggepertutti_loss": 1.314708948135376,
"eval_validation_leggepertutti_runtime": 36.4554,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1023
},
{
"epoch": 0.35,
"eval_validation_altalexprivacy_loss": 1.230077862739563,
"eval_validation_altalexprivacy_runtime": 58.8338,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1023
},
{
"epoch": 0.39,
"learning_rate": 1e-05,
"loss": 1.0854,
"step": 1116
},
{
"epoch": 0.39,
"eval_validation_privacy_sources_loss": 0.8100457787513733,
"eval_validation_privacy_sources_runtime": 207.7761,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1116
},
{
"epoch": 0.39,
"eval_validation_agenda_digitale_loss": 1.3958582878112793,
"eval_validation_agenda_digitale_runtime": 185.4776,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1116
},
{
"epoch": 0.39,
"eval_validation_leggepertutti_loss": 1.3077082633972168,
"eval_validation_leggepertutti_runtime": 36.4414,
"eval_validation_leggepertutti_samples_per_second": 2.772,
"eval_validation_leggepertutti_steps_per_second": 1.4,
"step": 1116
},
{
"epoch": 0.39,
"eval_validation_altalexprivacy_loss": 1.221291422843933,
"eval_validation_altalexprivacy_runtime": 58.8442,
"eval_validation_altalexprivacy_samples_per_second": 2.77,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1116
},
{
"epoch": 0.42,
"learning_rate": 1e-05,
"loss": 1.0771,
"step": 1209
},
{
"epoch": 0.42,
"eval_validation_privacy_sources_loss": 0.8034979701042175,
"eval_validation_privacy_sources_runtime": 207.8146,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1209
},
{
"epoch": 0.42,
"eval_validation_agenda_digitale_loss": 1.3933522701263428,
"eval_validation_agenda_digitale_runtime": 185.4596,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1209
},
{
"epoch": 0.42,
"eval_validation_leggepertutti_loss": 1.3102238178253174,
"eval_validation_leggepertutti_runtime": 36.4505,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1209
},
{
"epoch": 0.42,
"eval_validation_altalexprivacy_loss": 1.2192506790161133,
"eval_validation_altalexprivacy_runtime": 58.8165,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1209
},
{
"epoch": 0.45,
"learning_rate": 1e-05,
"loss": 1.0637,
"step": 1302
},
{
"epoch": 0.45,
"eval_validation_privacy_sources_loss": 0.7970249056816101,
"eval_validation_privacy_sources_runtime": 207.8381,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1302
},
{
"epoch": 0.45,
"eval_validation_agenda_digitale_loss": 1.3897120952606201,
"eval_validation_agenda_digitale_runtime": 185.475,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1302
},
{
"epoch": 0.45,
"eval_validation_leggepertutti_loss": 1.303721308708191,
"eval_validation_leggepertutti_runtime": 36.4613,
"eval_validation_leggepertutti_samples_per_second": 2.77,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1302
},
{
"epoch": 0.45,
"eval_validation_altalexprivacy_loss": 1.2124699354171753,
"eval_validation_altalexprivacy_runtime": 58.8366,
"eval_validation_altalexprivacy_samples_per_second": 2.77,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1302
},
{
"epoch": 0.48,
"learning_rate": 1e-05,
"loss": 1.0566,
"step": 1395
},
{
"epoch": 0.48,
"eval_validation_privacy_sources_loss": 0.7921364307403564,
"eval_validation_privacy_sources_runtime": 207.8584,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1395
},
{
"epoch": 0.48,
"eval_validation_agenda_digitale_loss": 1.3843779563903809,
"eval_validation_agenda_digitale_runtime": 185.4492,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1395
},
{
"epoch": 0.48,
"eval_validation_leggepertutti_loss": 1.3031646013259888,
"eval_validation_leggepertutti_runtime": 36.4511,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1395
},
{
"epoch": 0.48,
"eval_validation_altalexprivacy_loss": 1.2079439163208008,
"eval_validation_altalexprivacy_runtime": 58.8443,
"eval_validation_altalexprivacy_samples_per_second": 2.77,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1395
},
{
"epoch": 0.51,
"learning_rate": 1e-05,
"loss": 1.0553,
"step": 1488
},
{
"epoch": 0.51,
"eval_validation_privacy_sources_loss": 0.7880584001541138,
"eval_validation_privacy_sources_runtime": 207.9058,
"eval_validation_privacy_sources_samples_per_second": 2.77,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 1488
},
{
"epoch": 0.51,
"eval_validation_agenda_digitale_loss": 1.3801347017288208,
"eval_validation_agenda_digitale_runtime": 185.4606,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1488
},
{
"epoch": 0.51,
"eval_validation_leggepertutti_loss": 1.304322361946106,
"eval_validation_leggepertutti_runtime": 36.4655,
"eval_validation_leggepertutti_samples_per_second": 2.77,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1488
},
{
"epoch": 0.51,
"eval_validation_altalexprivacy_loss": 1.200743556022644,
"eval_validation_altalexprivacy_runtime": 58.8181,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1488
},
{
"epoch": 0.55,
"learning_rate": 1e-05,
"loss": 1.0464,
"step": 1581
},
{
"epoch": 0.55,
"eval_validation_privacy_sources_loss": 0.7845947742462158,
"eval_validation_privacy_sources_runtime": 207.7953,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1581
},
{
"epoch": 0.55,
"eval_validation_agenda_digitale_loss": 1.3774136304855347,
"eval_validation_agenda_digitale_runtime": 185.4238,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1581
},
{
"epoch": 0.55,
"eval_validation_leggepertutti_loss": 1.2997848987579346,
"eval_validation_leggepertutti_runtime": 36.4545,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1581
},
{
"epoch": 0.55,
"eval_validation_altalexprivacy_loss": 1.196614146232605,
"eval_validation_altalexprivacy_runtime": 58.7946,
"eval_validation_altalexprivacy_samples_per_second": 2.772,
"eval_validation_altalexprivacy_steps_per_second": 1.395,
"step": 1581
},
{
"epoch": 0.58,
"learning_rate": 1e-05,
"loss": 1.0387,
"step": 1674
},
{
"epoch": 0.58,
"eval_validation_privacy_sources_loss": 0.7808618545532227,
"eval_validation_privacy_sources_runtime": 207.8015,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1674
},
{
"epoch": 0.58,
"eval_validation_agenda_digitale_loss": 1.375112533569336,
"eval_validation_agenda_digitale_runtime": 185.4231,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1674
},
{
"epoch": 0.58,
"eval_validation_leggepertutti_loss": 1.3011507987976074,
"eval_validation_leggepertutti_runtime": 36.4454,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1674
},
{
"epoch": 0.58,
"eval_validation_altalexprivacy_loss": 1.190794825553894,
"eval_validation_altalexprivacy_runtime": 58.8028,
"eval_validation_altalexprivacy_samples_per_second": 2.772,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1674
},
{
"epoch": 0.61,
"learning_rate": 1e-05,
"loss": 1.0318,
"step": 1767
},
{
"epoch": 0.61,
"eval_validation_privacy_sources_loss": 0.7766129970550537,
"eval_validation_privacy_sources_runtime": 207.7465,
"eval_validation_privacy_sources_samples_per_second": 2.773,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1767
},
{
"epoch": 0.61,
"eval_validation_agenda_digitale_loss": 1.372268795967102,
"eval_validation_agenda_digitale_runtime": 185.4359,
"eval_validation_agenda_digitale_samples_per_second": 2.772,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1767
},
{
"epoch": 0.61,
"eval_validation_leggepertutti_loss": 1.2967208623886108,
"eval_validation_leggepertutti_runtime": 36.4479,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1767
},
{
"epoch": 0.61,
"eval_validation_altalexprivacy_loss": 1.1859400272369385,
"eval_validation_altalexprivacy_runtime": 58.8168,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1767
},
{
"epoch": 0.64,
"learning_rate": 1e-05,
"loss": 1.0549,
"step": 1860
},
{
"epoch": 0.64,
"eval_validation_privacy_sources_loss": 0.7737349271774292,
"eval_validation_privacy_sources_runtime": 207.757,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1860
},
{
"epoch": 0.64,
"eval_validation_agenda_digitale_loss": 1.3696516752243042,
"eval_validation_agenda_digitale_runtime": 185.376,
"eval_validation_agenda_digitale_samples_per_second": 2.773,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1860
},
{
"epoch": 0.64,
"eval_validation_leggepertutti_loss": 1.2951971292495728,
"eval_validation_leggepertutti_runtime": 36.4425,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 1860
},
{
"epoch": 0.64,
"eval_validation_altalexprivacy_loss": 1.180280089378357,
"eval_validation_altalexprivacy_runtime": 58.807,
"eval_validation_altalexprivacy_samples_per_second": 2.772,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1860
},
{
"epoch": 0.68,
"learning_rate": 1e-05,
"loss": 1.0244,
"step": 1953
},
{
"epoch": 0.68,
"eval_validation_privacy_sources_loss": 0.7704524993896484,
"eval_validation_privacy_sources_runtime": 207.8153,
"eval_validation_privacy_sources_samples_per_second": 2.772,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 1953
},
{
"epoch": 0.68,
"eval_validation_agenda_digitale_loss": 1.3666201829910278,
"eval_validation_agenda_digitale_runtime": 185.3706,
"eval_validation_agenda_digitale_samples_per_second": 2.773,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 1953
},
{
"epoch": 0.68,
"eval_validation_leggepertutti_loss": 1.2933101654052734,
"eval_validation_leggepertutti_runtime": 36.4405,
"eval_validation_leggepertutti_samples_per_second": 2.772,
"eval_validation_leggepertutti_steps_per_second": 1.4,
"step": 1953
},
{
"epoch": 0.68,
"eval_validation_altalexprivacy_loss": 1.1771676540374756,
"eval_validation_altalexprivacy_runtime": 58.8195,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 1953
},
{
"epoch": 0.71,
"learning_rate": 1e-05,
"loss": 1.0244,
"step": 2046
},
{
"epoch": 0.71,
"eval_validation_privacy_sources_loss": 0.7678720951080322,
"eval_validation_privacy_sources_runtime": 207.6339,
"eval_validation_privacy_sources_samples_per_second": 2.774,
"eval_validation_privacy_sources_steps_per_second": 1.387,
"step": 2046
},
{
"epoch": 0.71,
"eval_validation_agenda_digitale_loss": 1.3635469675064087,
"eval_validation_agenda_digitale_runtime": 185.2599,
"eval_validation_agenda_digitale_samples_per_second": 2.774,
"eval_validation_agenda_digitale_steps_per_second": 1.387,
"step": 2046
},
{
"epoch": 0.71,
"eval_validation_leggepertutti_loss": 1.2988970279693604,
"eval_validation_leggepertutti_runtime": 36.3946,
"eval_validation_leggepertutti_samples_per_second": 2.775,
"eval_validation_leggepertutti_steps_per_second": 1.401,
"step": 2046
},
{
"epoch": 0.71,
"eval_validation_altalexprivacy_loss": 1.1761205196380615,
"eval_validation_altalexprivacy_runtime": 58.7639,
"eval_validation_altalexprivacy_samples_per_second": 2.774,
"eval_validation_altalexprivacy_steps_per_second": 1.395,
"step": 2046
},
{
"epoch": 0.74,
"learning_rate": 1e-05,
"loss": 1.0203,
"step": 2139
},
{
"epoch": 0.74,
"eval_validation_privacy_sources_loss": 0.7644345164299011,
"eval_validation_privacy_sources_runtime": 207.6697,
"eval_validation_privacy_sources_samples_per_second": 2.774,
"eval_validation_privacy_sources_steps_per_second": 1.387,
"step": 2139
},
{
"epoch": 0.74,
"eval_validation_agenda_digitale_loss": 1.3618555068969727,
"eval_validation_agenda_digitale_runtime": 185.3011,
"eval_validation_agenda_digitale_samples_per_second": 2.774,
"eval_validation_agenda_digitale_steps_per_second": 1.387,
"step": 2139
},
{
"epoch": 0.74,
"eval_validation_leggepertutti_loss": 1.2900038957595825,
"eval_validation_leggepertutti_runtime": 36.4155,
"eval_validation_leggepertutti_samples_per_second": 2.774,
"eval_validation_leggepertutti_steps_per_second": 1.401,
"step": 2139
},
{
"epoch": 0.74,
"eval_validation_altalexprivacy_loss": 1.170756220817566,
"eval_validation_altalexprivacy_runtime": 58.7521,
"eval_validation_altalexprivacy_samples_per_second": 2.774,
"eval_validation_altalexprivacy_steps_per_second": 1.396,
"step": 2139
},
{
"epoch": 0.77,
"learning_rate": 1e-05,
"loss": 1.0256,
"step": 2232
},
{
"epoch": 0.77,
"eval_validation_privacy_sources_loss": 0.7612179517745972,
"eval_validation_privacy_sources_runtime": 207.7191,
"eval_validation_privacy_sources_samples_per_second": 2.773,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 2232
},
{
"epoch": 0.77,
"eval_validation_agenda_digitale_loss": 1.3602862358093262,
"eval_validation_agenda_digitale_runtime": 185.3214,
"eval_validation_agenda_digitale_samples_per_second": 2.774,
"eval_validation_agenda_digitale_steps_per_second": 1.387,
"step": 2232
},
{
"epoch": 0.77,
"eval_validation_leggepertutti_loss": 1.288977861404419,
"eval_validation_leggepertutti_runtime": 36.4223,
"eval_validation_leggepertutti_samples_per_second": 2.773,
"eval_validation_leggepertutti_steps_per_second": 1.4,
"step": 2232
},
{
"epoch": 0.77,
"eval_validation_altalexprivacy_loss": 1.1712496280670166,
"eval_validation_altalexprivacy_runtime": 58.7757,
"eval_validation_altalexprivacy_samples_per_second": 2.773,
"eval_validation_altalexprivacy_steps_per_second": 1.395,
"step": 2232
},
{
"epoch": 0.8,
"learning_rate": 1e-05,
"loss": 1.011,
"step": 2325
},
{
"epoch": 0.8,
"eval_validation_privacy_sources_loss": 0.7570701241493225,
"eval_validation_privacy_sources_runtime": 207.9647,
"eval_validation_privacy_sources_samples_per_second": 2.77,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 2325
},
{
"epoch": 0.8,
"eval_validation_agenda_digitale_loss": 1.3573753833770752,
"eval_validation_agenda_digitale_runtime": 185.4907,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 2325
},
{
"epoch": 0.8,
"eval_validation_leggepertutti_loss": 1.2890092134475708,
"eval_validation_leggepertutti_runtime": 36.4584,
"eval_validation_leggepertutti_samples_per_second": 2.77,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 2325
},
{
"epoch": 0.8,
"eval_validation_altalexprivacy_loss": 1.1662389039993286,
"eval_validation_altalexprivacy_runtime": 58.8138,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 2325
},
{
"epoch": 0.84,
"learning_rate": 1e-05,
"loss": 1.0016,
"step": 2418
},
{
"epoch": 0.84,
"eval_validation_privacy_sources_loss": 0.7539491653442383,
"eval_validation_privacy_sources_runtime": 207.8953,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 2418
},
{
"epoch": 0.84,
"eval_validation_agenda_digitale_loss": 1.3551262617111206,
"eval_validation_agenda_digitale_runtime": 185.5266,
"eval_validation_agenda_digitale_samples_per_second": 2.77,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 2418
},
{
"epoch": 0.84,
"eval_validation_leggepertutti_loss": 1.287420630455017,
"eval_validation_leggepertutti_runtime": 36.4572,
"eval_validation_leggepertutti_samples_per_second": 2.77,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 2418
},
{
"epoch": 0.84,
"eval_validation_altalexprivacy_loss": 1.1637060642242432,
"eval_validation_altalexprivacy_runtime": 58.8299,
"eval_validation_altalexprivacy_samples_per_second": 2.771,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 2418
},
{
"epoch": 0.87,
"learning_rate": 1e-05,
"loss": 1.0106,
"step": 2511
},
{
"epoch": 0.87,
"eval_validation_privacy_sources_loss": 0.7510882616043091,
"eval_validation_privacy_sources_runtime": 207.8929,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 2511
},
{
"epoch": 0.87,
"eval_validation_agenda_digitale_loss": 1.3524880409240723,
"eval_validation_agenda_digitale_runtime": 185.5648,
"eval_validation_agenda_digitale_samples_per_second": 2.77,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 2511
},
{
"epoch": 0.87,
"eval_validation_leggepertutti_loss": 1.2826858758926392,
"eval_validation_leggepertutti_runtime": 36.4693,
"eval_validation_leggepertutti_samples_per_second": 2.769,
"eval_validation_leggepertutti_steps_per_second": 1.398,
"step": 2511
},
{
"epoch": 0.87,
"eval_validation_altalexprivacy_loss": 1.1573538780212402,
"eval_validation_altalexprivacy_runtime": 58.8452,
"eval_validation_altalexprivacy_samples_per_second": 2.77,
"eval_validation_altalexprivacy_steps_per_second": 1.393,
"step": 2511
},
{
"epoch": 0.9,
"learning_rate": 1e-05,
"loss": 1.0075,
"step": 2604
},
{
"epoch": 0.9,
"eval_validation_privacy_sources_loss": 0.74814373254776,
"eval_validation_privacy_sources_runtime": 207.9033,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.385,
"step": 2604
},
{
"epoch": 0.9,
"eval_validation_agenda_digitale_loss": 1.3509397506713867,
"eval_validation_agenda_digitale_runtime": 185.5149,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.385,
"step": 2604
},
{
"epoch": 0.9,
"eval_validation_leggepertutti_loss": 1.2835361957550049,
"eval_validation_leggepertutti_runtime": 36.4782,
"eval_validation_leggepertutti_samples_per_second": 2.769,
"eval_validation_leggepertutti_steps_per_second": 1.398,
"step": 2604
},
{
"epoch": 0.9,
"eval_validation_altalexprivacy_loss": 1.1581933498382568,
"eval_validation_altalexprivacy_runtime": 58.808,
"eval_validation_altalexprivacy_samples_per_second": 2.772,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 2604
},
{
"epoch": 0.93,
"learning_rate": 1e-05,
"loss": 0.9994,
"step": 2697
},
{
"epoch": 0.93,
"eval_validation_privacy_sources_loss": 0.7448787689208984,
"eval_validation_privacy_sources_runtime": 207.8624,
"eval_validation_privacy_sources_samples_per_second": 2.771,
"eval_validation_privacy_sources_steps_per_second": 1.386,
"step": 2697
},
{
"epoch": 0.93,
"eval_validation_agenda_digitale_loss": 1.3478621244430542,
"eval_validation_agenda_digitale_runtime": 185.4737,
"eval_validation_agenda_digitale_samples_per_second": 2.771,
"eval_validation_agenda_digitale_steps_per_second": 1.386,
"step": 2697
},
{
"epoch": 0.93,
"eval_validation_leggepertutti_loss": 1.2804486751556396,
"eval_validation_leggepertutti_runtime": 36.4501,
"eval_validation_leggepertutti_samples_per_second": 2.771,
"eval_validation_leggepertutti_steps_per_second": 1.399,
"step": 2697
},
{
"epoch": 0.93,
"eval_validation_altalexprivacy_loss": 1.1511160135269165,
"eval_validation_altalexprivacy_runtime": 58.8365,
"eval_validation_altalexprivacy_samples_per_second": 2.77,
"eval_validation_altalexprivacy_steps_per_second": 1.394,
"step": 2697
}
],
"logging_steps": 93,
"max_steps": 5778,
"num_input_tokens_seen": 0,
"num_train_epochs": 2,
"save_steps": 93,
"total_flos": 1.5081760577745322e+19,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}