|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 0.9333794774182385, |
|
"eval_steps": 93, |
|
"global_step": 2697, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.0, |
|
"learning_rate": 1e-05, |
|
"loss": 1.466, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"learning_rate": 1e-05, |
|
"loss": 1.3439, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_privacy_sources_loss": 0.9993858337402344, |
|
"eval_validation_privacy_sources_runtime": 208.8742, |
|
"eval_validation_privacy_sources_samples_per_second": 2.758, |
|
"eval_validation_privacy_sources_steps_per_second": 1.379, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_agenda_digitale_loss": 1.5262001752853394, |
|
"eval_validation_agenda_digitale_runtime": 186.7009, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.753, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.377, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_leggepertutti_loss": 1.393169641494751, |
|
"eval_validation_leggepertutti_runtime": 36.5278, |
|
"eval_validation_leggepertutti_samples_per_second": 2.765, |
|
"eval_validation_leggepertutti_steps_per_second": 1.396, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_altalexprivacy_loss": 1.3749068975448608, |
|
"eval_validation_altalexprivacy_runtime": 59.1055, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.758, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.387, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"learning_rate": 1e-05, |
|
"loss": 1.2277, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_privacy_sources_loss": 0.9398746490478516, |
|
"eval_validation_privacy_sources_runtime": 207.7931, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_agenda_digitale_loss": 1.4900918006896973, |
|
"eval_validation_agenda_digitale_runtime": 185.4857, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_leggepertutti_loss": 1.3686381578445435, |
|
"eval_validation_leggepertutti_runtime": 36.4651, |
|
"eval_validation_leggepertutti_samples_per_second": 2.77, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_altalexprivacy_loss": 1.3352404832839966, |
|
"eval_validation_altalexprivacy_runtime": 58.8108, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.772, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1989, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_validation_privacy_sources_loss": 0.9079627990722656, |
|
"eval_validation_privacy_sources_runtime": 207.7801, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_validation_agenda_digitale_loss": 1.4663112163543701, |
|
"eval_validation_agenda_digitale_runtime": 185.4551, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_validation_leggepertutti_loss": 1.3589648008346558, |
|
"eval_validation_leggepertutti_runtime": 36.4528, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_validation_altalexprivacy_loss": 1.3104432821273804, |
|
"eval_validation_altalexprivacy_runtime": 58.8143, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 1e-05, |
|
"loss": 1.166, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_privacy_sources_loss": 0.8864494562149048, |
|
"eval_validation_privacy_sources_runtime": 207.7989, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_agenda_digitale_loss": 1.4535290002822876, |
|
"eval_validation_agenda_digitale_runtime": 185.4338, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_leggepertutti_loss": 1.3470954895019531, |
|
"eval_validation_leggepertutti_runtime": 36.4554, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_altalexprivacy_loss": 1.2923557758331299, |
|
"eval_validation_altalexprivacy_runtime": 58.8034, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.772, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1502, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_privacy_sources_loss": 0.8700113296508789, |
|
"eval_validation_privacy_sources_runtime": 207.7896, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_agenda_digitale_loss": 1.4420515298843384, |
|
"eval_validation_agenda_digitale_runtime": 185.5107, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_leggepertutti_loss": 1.3380672931671143, |
|
"eval_validation_leggepertutti_runtime": 36.4532, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_altalexprivacy_loss": 1.2828154563903809, |
|
"eval_validation_altalexprivacy_runtime": 58.7825, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.773, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.395, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1293, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_privacy_sources_loss": 0.8583760857582092, |
|
"eval_validation_privacy_sources_runtime": 207.7778, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_agenda_digitale_loss": 1.4329832792282104, |
|
"eval_validation_agenda_digitale_runtime": 185.4109, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_leggepertutti_loss": 1.332190752029419, |
|
"eval_validation_leggepertutti_runtime": 36.4466, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_altalexprivacy_loss": 1.2727842330932617, |
|
"eval_validation_altalexprivacy_runtime": 58.812, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.772, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1214, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_validation_privacy_sources_loss": 0.8476831912994385, |
|
"eval_validation_privacy_sources_runtime": 207.83, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_validation_agenda_digitale_loss": 1.4262702465057373, |
|
"eval_validation_agenda_digitale_runtime": 185.4527, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_validation_leggepertutti_loss": 1.3270900249481201, |
|
"eval_validation_leggepertutti_runtime": 36.4393, |
|
"eval_validation_leggepertutti_samples_per_second": 2.772, |
|
"eval_validation_leggepertutti_steps_per_second": 1.4, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_validation_altalexprivacy_loss": 1.260352611541748, |
|
"eval_validation_altalexprivacy_runtime": 58.8334, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1091, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_privacy_sources_loss": 0.8393220901489258, |
|
"eval_validation_privacy_sources_runtime": 207.8694, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_agenda_digitale_loss": 1.419695258140564, |
|
"eval_validation_agenda_digitale_runtime": 185.5111, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_leggepertutti_loss": 1.3253276348114014, |
|
"eval_validation_leggepertutti_runtime": 36.4703, |
|
"eval_validation_leggepertutti_samples_per_second": 2.769, |
|
"eval_validation_leggepertutti_steps_per_second": 1.398, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_altalexprivacy_loss": 1.2589938640594482, |
|
"eval_validation_altalexprivacy_runtime": 58.8276, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1054, |
|
"step": 837 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"eval_validation_privacy_sources_loss": 0.8303313851356506, |
|
"eval_validation_privacy_sources_runtime": 207.8766, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 837 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"eval_validation_agenda_digitale_loss": 1.4135520458221436, |
|
"eval_validation_agenda_digitale_runtime": 185.5466, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.77, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 837 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"eval_validation_leggepertutti_loss": 1.3197592496871948, |
|
"eval_validation_leggepertutti_runtime": 36.4762, |
|
"eval_validation_leggepertutti_samples_per_second": 2.769, |
|
"eval_validation_leggepertutti_steps_per_second": 1.398, |
|
"step": 837 |
|
}, |
|
{ |
|
"epoch": 0.29, |
|
"eval_validation_altalexprivacy_loss": 1.248721957206726, |
|
"eval_validation_altalexprivacy_runtime": 58.845, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.77, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.393, |
|
"step": 837 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0981, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_privacy_sources_loss": 0.8243758678436279, |
|
"eval_validation_privacy_sources_runtime": 207.9136, |
|
"eval_validation_privacy_sources_samples_per_second": 2.77, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_agenda_digitale_loss": 1.4070162773132324, |
|
"eval_validation_agenda_digitale_runtime": 185.5276, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.77, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_leggepertutti_loss": 1.3205946683883667, |
|
"eval_validation_leggepertutti_runtime": 36.4768, |
|
"eval_validation_leggepertutti_samples_per_second": 2.769, |
|
"eval_validation_leggepertutti_steps_per_second": 1.398, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_altalexprivacy_loss": 1.236555576324463, |
|
"eval_validation_altalexprivacy_runtime": 58.8174, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0826, |
|
"step": 1023 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_privacy_sources_loss": 0.8142690062522888, |
|
"eval_validation_privacy_sources_runtime": 207.8182, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1023 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_agenda_digitale_loss": 1.4016144275665283, |
|
"eval_validation_agenda_digitale_runtime": 185.5524, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.77, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 1023 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_leggepertutti_loss": 1.314708948135376, |
|
"eval_validation_leggepertutti_runtime": 36.4554, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1023 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_altalexprivacy_loss": 1.230077862739563, |
|
"eval_validation_altalexprivacy_runtime": 58.8338, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1023 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0854, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_privacy_sources_loss": 0.8100457787513733, |
|
"eval_validation_privacy_sources_runtime": 207.7761, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_agenda_digitale_loss": 1.3958582878112793, |
|
"eval_validation_agenda_digitale_runtime": 185.4776, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_leggepertutti_loss": 1.3077082633972168, |
|
"eval_validation_leggepertutti_runtime": 36.4414, |
|
"eval_validation_leggepertutti_samples_per_second": 2.772, |
|
"eval_validation_leggepertutti_steps_per_second": 1.4, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_altalexprivacy_loss": 1.221291422843933, |
|
"eval_validation_altalexprivacy_runtime": 58.8442, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.77, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0771, |
|
"step": 1209 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_validation_privacy_sources_loss": 0.8034979701042175, |
|
"eval_validation_privacy_sources_runtime": 207.8146, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1209 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_validation_agenda_digitale_loss": 1.3933522701263428, |
|
"eval_validation_agenda_digitale_runtime": 185.4596, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1209 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_validation_leggepertutti_loss": 1.3102238178253174, |
|
"eval_validation_leggepertutti_runtime": 36.4505, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1209 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"eval_validation_altalexprivacy_loss": 1.2192506790161133, |
|
"eval_validation_altalexprivacy_runtime": 58.8165, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1209 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0637, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_privacy_sources_loss": 0.7970249056816101, |
|
"eval_validation_privacy_sources_runtime": 207.8381, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_agenda_digitale_loss": 1.3897120952606201, |
|
"eval_validation_agenda_digitale_runtime": 185.475, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_leggepertutti_loss": 1.303721308708191, |
|
"eval_validation_leggepertutti_runtime": 36.4613, |
|
"eval_validation_leggepertutti_samples_per_second": 2.77, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_altalexprivacy_loss": 1.2124699354171753, |
|
"eval_validation_altalexprivacy_runtime": 58.8366, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.77, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0566, |
|
"step": 1395 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_validation_privacy_sources_loss": 0.7921364307403564, |
|
"eval_validation_privacy_sources_runtime": 207.8584, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1395 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_validation_agenda_digitale_loss": 1.3843779563903809, |
|
"eval_validation_agenda_digitale_runtime": 185.4492, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1395 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_validation_leggepertutti_loss": 1.3031646013259888, |
|
"eval_validation_leggepertutti_runtime": 36.4511, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1395 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_validation_altalexprivacy_loss": 1.2079439163208008, |
|
"eval_validation_altalexprivacy_runtime": 58.8443, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.77, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1395 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0553, |
|
"step": 1488 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_validation_privacy_sources_loss": 0.7880584001541138, |
|
"eval_validation_privacy_sources_runtime": 207.9058, |
|
"eval_validation_privacy_sources_samples_per_second": 2.77, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 1488 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_validation_agenda_digitale_loss": 1.3801347017288208, |
|
"eval_validation_agenda_digitale_runtime": 185.4606, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1488 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_validation_leggepertutti_loss": 1.304322361946106, |
|
"eval_validation_leggepertutti_runtime": 36.4655, |
|
"eval_validation_leggepertutti_samples_per_second": 2.77, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1488 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_validation_altalexprivacy_loss": 1.200743556022644, |
|
"eval_validation_altalexprivacy_runtime": 58.8181, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1488 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0464, |
|
"step": 1581 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_privacy_sources_loss": 0.7845947742462158, |
|
"eval_validation_privacy_sources_runtime": 207.7953, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1581 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_agenda_digitale_loss": 1.3774136304855347, |
|
"eval_validation_agenda_digitale_runtime": 185.4238, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1581 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_leggepertutti_loss": 1.2997848987579346, |
|
"eval_validation_leggepertutti_runtime": 36.4545, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1581 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_altalexprivacy_loss": 1.196614146232605, |
|
"eval_validation_altalexprivacy_runtime": 58.7946, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.772, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.395, |
|
"step": 1581 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0387, |
|
"step": 1674 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_privacy_sources_loss": 0.7808618545532227, |
|
"eval_validation_privacy_sources_runtime": 207.8015, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1674 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_agenda_digitale_loss": 1.375112533569336, |
|
"eval_validation_agenda_digitale_runtime": 185.4231, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1674 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_leggepertutti_loss": 1.3011507987976074, |
|
"eval_validation_leggepertutti_runtime": 36.4454, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1674 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_altalexprivacy_loss": 1.190794825553894, |
|
"eval_validation_altalexprivacy_runtime": 58.8028, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.772, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1674 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0318, |
|
"step": 1767 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_privacy_sources_loss": 0.7766129970550537, |
|
"eval_validation_privacy_sources_runtime": 207.7465, |
|
"eval_validation_privacy_sources_samples_per_second": 2.773, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1767 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_agenda_digitale_loss": 1.372268795967102, |
|
"eval_validation_agenda_digitale_runtime": 185.4359, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.772, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1767 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_leggepertutti_loss": 1.2967208623886108, |
|
"eval_validation_leggepertutti_runtime": 36.4479, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1767 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_altalexprivacy_loss": 1.1859400272369385, |
|
"eval_validation_altalexprivacy_runtime": 58.8168, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1767 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0549, |
|
"step": 1860 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_validation_privacy_sources_loss": 0.7737349271774292, |
|
"eval_validation_privacy_sources_runtime": 207.757, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1860 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_validation_agenda_digitale_loss": 1.3696516752243042, |
|
"eval_validation_agenda_digitale_runtime": 185.376, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.773, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1860 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_validation_leggepertutti_loss": 1.2951971292495728, |
|
"eval_validation_leggepertutti_runtime": 36.4425, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 1860 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_validation_altalexprivacy_loss": 1.180280089378357, |
|
"eval_validation_altalexprivacy_runtime": 58.807, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.772, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1860 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0244, |
|
"step": 1953 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_validation_privacy_sources_loss": 0.7704524993896484, |
|
"eval_validation_privacy_sources_runtime": 207.8153, |
|
"eval_validation_privacy_sources_samples_per_second": 2.772, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 1953 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_validation_agenda_digitale_loss": 1.3666201829910278, |
|
"eval_validation_agenda_digitale_runtime": 185.3706, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.773, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 1953 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_validation_leggepertutti_loss": 1.2933101654052734, |
|
"eval_validation_leggepertutti_runtime": 36.4405, |
|
"eval_validation_leggepertutti_samples_per_second": 2.772, |
|
"eval_validation_leggepertutti_steps_per_second": 1.4, |
|
"step": 1953 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_validation_altalexprivacy_loss": 1.1771676540374756, |
|
"eval_validation_altalexprivacy_runtime": 58.8195, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 1953 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0244, |
|
"step": 2046 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_validation_privacy_sources_loss": 0.7678720951080322, |
|
"eval_validation_privacy_sources_runtime": 207.6339, |
|
"eval_validation_privacy_sources_samples_per_second": 2.774, |
|
"eval_validation_privacy_sources_steps_per_second": 1.387, |
|
"step": 2046 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_validation_agenda_digitale_loss": 1.3635469675064087, |
|
"eval_validation_agenda_digitale_runtime": 185.2599, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.774, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.387, |
|
"step": 2046 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_validation_leggepertutti_loss": 1.2988970279693604, |
|
"eval_validation_leggepertutti_runtime": 36.3946, |
|
"eval_validation_leggepertutti_samples_per_second": 2.775, |
|
"eval_validation_leggepertutti_steps_per_second": 1.401, |
|
"step": 2046 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_validation_altalexprivacy_loss": 1.1761205196380615, |
|
"eval_validation_altalexprivacy_runtime": 58.7639, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.774, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.395, |
|
"step": 2046 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0203, |
|
"step": 2139 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_validation_privacy_sources_loss": 0.7644345164299011, |
|
"eval_validation_privacy_sources_runtime": 207.6697, |
|
"eval_validation_privacy_sources_samples_per_second": 2.774, |
|
"eval_validation_privacy_sources_steps_per_second": 1.387, |
|
"step": 2139 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_validation_agenda_digitale_loss": 1.3618555068969727, |
|
"eval_validation_agenda_digitale_runtime": 185.3011, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.774, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.387, |
|
"step": 2139 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_validation_leggepertutti_loss": 1.2900038957595825, |
|
"eval_validation_leggepertutti_runtime": 36.4155, |
|
"eval_validation_leggepertutti_samples_per_second": 2.774, |
|
"eval_validation_leggepertutti_steps_per_second": 1.401, |
|
"step": 2139 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_validation_altalexprivacy_loss": 1.170756220817566, |
|
"eval_validation_altalexprivacy_runtime": 58.7521, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.774, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.396, |
|
"step": 2139 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0256, |
|
"step": 2232 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_validation_privacy_sources_loss": 0.7612179517745972, |
|
"eval_validation_privacy_sources_runtime": 207.7191, |
|
"eval_validation_privacy_sources_samples_per_second": 2.773, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 2232 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_validation_agenda_digitale_loss": 1.3602862358093262, |
|
"eval_validation_agenda_digitale_runtime": 185.3214, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.774, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.387, |
|
"step": 2232 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_validation_leggepertutti_loss": 1.288977861404419, |
|
"eval_validation_leggepertutti_runtime": 36.4223, |
|
"eval_validation_leggepertutti_samples_per_second": 2.773, |
|
"eval_validation_leggepertutti_steps_per_second": 1.4, |
|
"step": 2232 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_validation_altalexprivacy_loss": 1.1712496280670166, |
|
"eval_validation_altalexprivacy_runtime": 58.7757, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.773, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.395, |
|
"step": 2232 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 1e-05, |
|
"loss": 1.011, |
|
"step": 2325 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_validation_privacy_sources_loss": 0.7570701241493225, |
|
"eval_validation_privacy_sources_runtime": 207.9647, |
|
"eval_validation_privacy_sources_samples_per_second": 2.77, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 2325 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_validation_agenda_digitale_loss": 1.3573753833770752, |
|
"eval_validation_agenda_digitale_runtime": 185.4907, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 2325 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_validation_leggepertutti_loss": 1.2890092134475708, |
|
"eval_validation_leggepertutti_runtime": 36.4584, |
|
"eval_validation_leggepertutti_samples_per_second": 2.77, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 2325 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_validation_altalexprivacy_loss": 1.1662389039993286, |
|
"eval_validation_altalexprivacy_runtime": 58.8138, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 2325 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0016, |
|
"step": 2418 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_validation_privacy_sources_loss": 0.7539491653442383, |
|
"eval_validation_privacy_sources_runtime": 207.8953, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 2418 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_validation_agenda_digitale_loss": 1.3551262617111206, |
|
"eval_validation_agenda_digitale_runtime": 185.5266, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.77, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 2418 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_validation_leggepertutti_loss": 1.287420630455017, |
|
"eval_validation_leggepertutti_runtime": 36.4572, |
|
"eval_validation_leggepertutti_samples_per_second": 2.77, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 2418 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_validation_altalexprivacy_loss": 1.1637060642242432, |
|
"eval_validation_altalexprivacy_runtime": 58.8299, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.771, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 2418 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0106, |
|
"step": 2511 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_validation_privacy_sources_loss": 0.7510882616043091, |
|
"eval_validation_privacy_sources_runtime": 207.8929, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 2511 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_validation_agenda_digitale_loss": 1.3524880409240723, |
|
"eval_validation_agenda_digitale_runtime": 185.5648, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.77, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 2511 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_validation_leggepertutti_loss": 1.2826858758926392, |
|
"eval_validation_leggepertutti_runtime": 36.4693, |
|
"eval_validation_leggepertutti_samples_per_second": 2.769, |
|
"eval_validation_leggepertutti_steps_per_second": 1.398, |
|
"step": 2511 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_validation_altalexprivacy_loss": 1.1573538780212402, |
|
"eval_validation_altalexprivacy_runtime": 58.8452, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.77, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.393, |
|
"step": 2511 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0075, |
|
"step": 2604 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_validation_privacy_sources_loss": 0.74814373254776, |
|
"eval_validation_privacy_sources_runtime": 207.9033, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.385, |
|
"step": 2604 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_validation_agenda_digitale_loss": 1.3509397506713867, |
|
"eval_validation_agenda_digitale_runtime": 185.5149, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.385, |
|
"step": 2604 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_validation_leggepertutti_loss": 1.2835361957550049, |
|
"eval_validation_leggepertutti_runtime": 36.4782, |
|
"eval_validation_leggepertutti_samples_per_second": 2.769, |
|
"eval_validation_leggepertutti_steps_per_second": 1.398, |
|
"step": 2604 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_validation_altalexprivacy_loss": 1.1581933498382568, |
|
"eval_validation_altalexprivacy_runtime": 58.808, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.772, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 2604 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"learning_rate": 1e-05, |
|
"loss": 0.9994, |
|
"step": 2697 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_validation_privacy_sources_loss": 0.7448787689208984, |
|
"eval_validation_privacy_sources_runtime": 207.8624, |
|
"eval_validation_privacy_sources_samples_per_second": 2.771, |
|
"eval_validation_privacy_sources_steps_per_second": 1.386, |
|
"step": 2697 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_validation_agenda_digitale_loss": 1.3478621244430542, |
|
"eval_validation_agenda_digitale_runtime": 185.4737, |
|
"eval_validation_agenda_digitale_samples_per_second": 2.771, |
|
"eval_validation_agenda_digitale_steps_per_second": 1.386, |
|
"step": 2697 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_validation_leggepertutti_loss": 1.2804486751556396, |
|
"eval_validation_leggepertutti_runtime": 36.4501, |
|
"eval_validation_leggepertutti_samples_per_second": 2.771, |
|
"eval_validation_leggepertutti_steps_per_second": 1.399, |
|
"step": 2697 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_validation_altalexprivacy_loss": 1.1511160135269165, |
|
"eval_validation_altalexprivacy_runtime": 58.8365, |
|
"eval_validation_altalexprivacy_samples_per_second": 2.77, |
|
"eval_validation_altalexprivacy_steps_per_second": 1.394, |
|
"step": 2697 |
|
} |
|
], |
|
"logging_steps": 93, |
|
"max_steps": 5778, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 2, |
|
"save_steps": 93, |
|
"total_flos": 1.5081760577745322e+19, |
|
"train_batch_size": 1, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|