|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 0.450928611628209, |
|
"eval_steps": 93, |
|
"global_step": 651, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.0, |
|
"learning_rate": 1e-05, |
|
"loss": 1.2904, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"learning_rate": 1e-05, |
|
"loss": 1.2883, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_privacy_sources_loss": 0.931429386138916, |
|
"eval_validation_privacy_sources_runtime": 224.921, |
|
"eval_validation_privacy_sources_samples_per_second": 1.258, |
|
"eval_validation_privacy_sources_steps_per_second": 0.631, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_agenda_digitale_loss": 1.4688478708267212, |
|
"eval_validation_agenda_digitale_runtime": 201.5869, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.26, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.63, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_leggepertutti_loss": 1.293728232383728, |
|
"eval_validation_leggepertutti_runtime": 37.3205, |
|
"eval_validation_leggepertutti_samples_per_second": 1.259, |
|
"eval_validation_leggepertutti_steps_per_second": 0.643, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_altalexprivacy_loss": 1.3008275032043457, |
|
"eval_validation_altalexprivacy_runtime": 62.7339, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.259, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.638, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1632, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_privacy_sources_loss": 0.8801236152648926, |
|
"eval_validation_privacy_sources_runtime": 224.5622, |
|
"eval_validation_privacy_sources_samples_per_second": 1.26, |
|
"eval_validation_privacy_sources_steps_per_second": 0.632, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_agenda_digitale_loss": 1.4332246780395508, |
|
"eval_validation_agenda_digitale_runtime": 201.5945, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.26, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.63, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_leggepertutti_loss": 1.2643470764160156, |
|
"eval_validation_leggepertutti_runtime": 37.3205, |
|
"eval_validation_leggepertutti_samples_per_second": 1.259, |
|
"eval_validation_leggepertutti_steps_per_second": 0.643, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_altalexprivacy_loss": 1.2626982927322388, |
|
"eval_validation_altalexprivacy_runtime": 62.7289, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.259, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.638, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1339, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_privacy_sources_loss": 0.8503767251968384, |
|
"eval_validation_privacy_sources_runtime": 224.5704, |
|
"eval_validation_privacy_sources_samples_per_second": 1.26, |
|
"eval_validation_privacy_sources_steps_per_second": 0.632, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_agenda_digitale_loss": 1.4141554832458496, |
|
"eval_validation_agenda_digitale_runtime": 201.4979, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.261, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.63, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_leggepertutti_loss": 1.2566713094711304, |
|
"eval_validation_leggepertutti_runtime": 37.3026, |
|
"eval_validation_leggepertutti_samples_per_second": 1.26, |
|
"eval_validation_leggepertutti_steps_per_second": 0.643, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_altalexprivacy_loss": 1.2368062734603882, |
|
"eval_validation_altalexprivacy_runtime": 62.6933, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.26, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.638, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"learning_rate": 1e-05, |
|
"loss": 1.1007, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_privacy_sources_loss": 0.8314403295516968, |
|
"eval_validation_privacy_sources_runtime": 224.5386, |
|
"eval_validation_privacy_sources_samples_per_second": 1.26, |
|
"eval_validation_privacy_sources_steps_per_second": 0.632, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_agenda_digitale_loss": 1.3996949195861816, |
|
"eval_validation_agenda_digitale_runtime": 201.5206, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.26, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.63, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_leggepertutti_loss": 1.2466578483581543, |
|
"eval_validation_leggepertutti_runtime": 37.3026, |
|
"eval_validation_leggepertutti_samples_per_second": 1.26, |
|
"eval_validation_leggepertutti_steps_per_second": 0.643, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"eval_validation_altalexprivacy_loss": 1.2185348272323608, |
|
"eval_validation_altalexprivacy_runtime": 62.6898, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.26, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.638, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0747, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_privacy_sources_loss": 0.8157272338867188, |
|
"eval_validation_privacy_sources_runtime": 224.5077, |
|
"eval_validation_privacy_sources_samples_per_second": 1.261, |
|
"eval_validation_privacy_sources_steps_per_second": 0.632, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_agenda_digitale_loss": 1.3890674114227295, |
|
"eval_validation_agenda_digitale_runtime": 201.5006, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.261, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.63, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_leggepertutti_loss": 1.2424800395965576, |
|
"eval_validation_leggepertutti_runtime": 37.28, |
|
"eval_validation_leggepertutti_samples_per_second": 1.261, |
|
"eval_validation_leggepertutti_steps_per_second": 0.644, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_altalexprivacy_loss": 1.203458547592163, |
|
"eval_validation_altalexprivacy_runtime": 62.6722, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.261, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.638, |
|
"step": 465 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0703, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_privacy_sources_loss": 0.8016490936279297, |
|
"eval_validation_privacy_sources_runtime": 224.4789, |
|
"eval_validation_privacy_sources_samples_per_second": 1.261, |
|
"eval_validation_privacy_sources_steps_per_second": 0.633, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_agenda_digitale_loss": 1.3786152601242065, |
|
"eval_validation_agenda_digitale_runtime": 201.4702, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.261, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.63, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_leggepertutti_loss": 1.23654043674469, |
|
"eval_validation_leggepertutti_runtime": 37.2956, |
|
"eval_validation_leggepertutti_samples_per_second": 1.26, |
|
"eval_validation_leggepertutti_steps_per_second": 0.644, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_altalexprivacy_loss": 1.1914178133010864, |
|
"eval_validation_altalexprivacy_runtime": 62.6741, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.26, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.638, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"learning_rate": 1e-05, |
|
"loss": 1.0514, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_privacy_sources_loss": 0.7911774516105652, |
|
"eval_validation_privacy_sources_runtime": 224.3988, |
|
"eval_validation_privacy_sources_samples_per_second": 1.261, |
|
"eval_validation_privacy_sources_steps_per_second": 0.633, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_agenda_digitale_loss": 1.370524525642395, |
|
"eval_validation_agenda_digitale_runtime": 201.3956, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.261, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.631, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_leggepertutti_loss": 1.2246781587600708, |
|
"eval_validation_leggepertutti_runtime": 37.2851, |
|
"eval_validation_leggepertutti_samples_per_second": 1.261, |
|
"eval_validation_leggepertutti_steps_per_second": 0.644, |
|
"step": 651 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_validation_altalexprivacy_loss": 1.1746492385864258, |
|
"eval_validation_altalexprivacy_runtime": 62.6484, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.261, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.638, |
|
"step": 651 |
|
} |
|
], |
|
"logging_steps": 93, |
|
"max_steps": 2886, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 2, |
|
"save_steps": 93, |
|
"total_flos": 7.280849934083949e+18, |
|
"train_batch_size": 1, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|