|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 0.6464586846543001, |
|
"eval_steps": 187, |
|
"global_step": 7667, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.0, |
|
"grad_norm": 8.5, |
|
"learning_rate": 1e-05, |
|
"loss": 1.9119, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"grad_norm": 4.59375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.7164, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_validation_privacy_sources_loss": 1.0334585905075073, |
|
"eval_validation_privacy_sources_runtime": 212.2756, |
|
"eval_validation_privacy_sources_samples_per_second": 1.804, |
|
"eval_validation_privacy_sources_steps_per_second": 0.904, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_validation_agenda_digitale_loss": 1.5160526037216187, |
|
"eval_validation_agenda_digitale_runtime": 188.4106, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.805, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.902, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_validation_leggepertutti_loss": 1.3417482376098633, |
|
"eval_validation_leggepertutti_runtime": 35.8837, |
|
"eval_validation_leggepertutti_samples_per_second": 1.811, |
|
"eval_validation_leggepertutti_steps_per_second": 0.92, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_validation_altalexprivacy_loss": 1.3672271966934204, |
|
"eval_validation_altalexprivacy_runtime": 58.6063, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.809, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.904, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_validation_mc4_it_loss": 1.9217756986618042, |
|
"eval_validation_mc4_it_runtime": 78.6277, |
|
"eval_validation_mc4_it_samples_per_second": 1.806, |
|
"eval_validation_mc4_it_steps_per_second": 0.903, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 0.02, |
|
"eval_validation_dolma_loss": 1.9627543687820435, |
|
"eval_validation_dolma_runtime": 54.0088, |
|
"eval_validation_dolma_samples_per_second": 1.815, |
|
"eval_validation_dolma_steps_per_second": 0.907, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"grad_norm": 3.859375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.6579, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_privacy_sources_loss": 0.9830030798912048, |
|
"eval_validation_privacy_sources_runtime": 210.811, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_agenda_digitale_loss": 1.4846152067184448, |
|
"eval_validation_agenda_digitale_runtime": 187.1837, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.816, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_leggepertutti_loss": 1.3172152042388916, |
|
"eval_validation_leggepertutti_runtime": 35.7866, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_altalexprivacy_loss": 1.3326139450073242, |
|
"eval_validation_altalexprivacy_runtime": 58.3381, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_mc4_it_loss": 1.8915678262710571, |
|
"eval_validation_mc4_it_runtime": 78.169, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_validation_dolma_loss": 1.9608409404754639, |
|
"eval_validation_dolma_runtime": 53.9716, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"grad_norm": 3.484375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.6402, |
|
"step": 561 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_validation_privacy_sources_loss": 0.9559596180915833, |
|
"eval_validation_privacy_sources_runtime": 210.7246, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 561 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_validation_agenda_digitale_loss": 1.4720743894577026, |
|
"eval_validation_agenda_digitale_runtime": 187.11, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 561 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_validation_leggepertutti_loss": 1.3074837923049927, |
|
"eval_validation_leggepertutti_runtime": 35.7797, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 561 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_validation_altalexprivacy_loss": 1.3142317533493042, |
|
"eval_validation_altalexprivacy_runtime": 58.315, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 561 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_validation_mc4_it_loss": 1.87451171875, |
|
"eval_validation_mc4_it_runtime": 78.1299, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 561 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"eval_validation_dolma_loss": 1.956404447555542, |
|
"eval_validation_dolma_runtime": 53.9194, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 561 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"grad_norm": 9.625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.6284, |
|
"step": 748 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_privacy_sources_loss": 0.933682918548584, |
|
"eval_validation_privacy_sources_runtime": 210.799, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 748 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_agenda_digitale_loss": 1.4578524827957153, |
|
"eval_validation_agenda_digitale_runtime": 187.08, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 748 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_leggepertutti_loss": 1.2905200719833374, |
|
"eval_validation_leggepertutti_runtime": 35.7738, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 748 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_altalexprivacy_loss": 1.2977306842803955, |
|
"eval_validation_altalexprivacy_runtime": 58.3215, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 748 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_mc4_it_loss": 1.8592724800109863, |
|
"eval_validation_mc4_it_runtime": 78.1141, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 748 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"eval_validation_dolma_loss": 1.9574466943740845, |
|
"eval_validation_dolma_runtime": 53.9297, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 748 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"grad_norm": 3.390625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.6082, |
|
"step": 935 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_validation_privacy_sources_loss": 0.919241726398468, |
|
"eval_validation_privacy_sources_runtime": 210.6302, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.912, |
|
"step": 935 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_validation_agenda_digitale_loss": 1.4438046216964722, |
|
"eval_validation_agenda_digitale_runtime": 187.0727, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 935 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_validation_leggepertutti_loss": 1.2822848558425903, |
|
"eval_validation_leggepertutti_runtime": 35.7909, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 935 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_validation_altalexprivacy_loss": 1.2801928520202637, |
|
"eval_validation_altalexprivacy_runtime": 58.3369, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 935 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_validation_mc4_it_loss": 1.8457767963409424, |
|
"eval_validation_mc4_it_runtime": 78.1714, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 935 |
|
}, |
|
{ |
|
"epoch": 0.08, |
|
"eval_validation_dolma_loss": 1.9588344097137451, |
|
"eval_validation_dolma_runtime": 53.9317, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 935 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"grad_norm": 3.46875, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5989, |
|
"step": 1122 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_validation_privacy_sources_loss": 0.9032600522041321, |
|
"eval_validation_privacy_sources_runtime": 210.7002, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 1122 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_validation_agenda_digitale_loss": 1.433292031288147, |
|
"eval_validation_agenda_digitale_runtime": 187.0521, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 1122 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_validation_leggepertutti_loss": 1.2763991355895996, |
|
"eval_validation_leggepertutti_runtime": 35.7627, |
|
"eval_validation_leggepertutti_samples_per_second": 1.818, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 1122 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_validation_altalexprivacy_loss": 1.2663257122039795, |
|
"eval_validation_altalexprivacy_runtime": 58.3197, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 1122 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_validation_mc4_it_loss": 1.8358547687530518, |
|
"eval_validation_mc4_it_runtime": 78.1183, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 1122 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"eval_validation_dolma_loss": 2.0097882747650146, |
|
"eval_validation_dolma_runtime": 53.9266, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 1122 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"grad_norm": 3.40625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.6161, |
|
"step": 1309 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_validation_privacy_sources_loss": 0.8906105160713196, |
|
"eval_validation_privacy_sources_runtime": 210.7431, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 1309 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_validation_agenda_digitale_loss": 1.4252179861068726, |
|
"eval_validation_agenda_digitale_runtime": 187.1263, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 1309 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_validation_leggepertutti_loss": 1.2690521478652954, |
|
"eval_validation_leggepertutti_runtime": 35.7673, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 1309 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_validation_altalexprivacy_loss": 1.258312463760376, |
|
"eval_validation_altalexprivacy_runtime": 58.3303, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 1309 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_validation_mc4_it_loss": 1.8263970613479614, |
|
"eval_validation_mc4_it_runtime": 78.147, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 1309 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_validation_dolma_loss": 1.9555673599243164, |
|
"eval_validation_dolma_runtime": 53.9288, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 1309 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"grad_norm": 3.25, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5911, |
|
"step": 1496 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_privacy_sources_loss": 0.8815954327583313, |
|
"eval_validation_privacy_sources_runtime": 210.7215, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 1496 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_agenda_digitale_loss": 1.4188568592071533, |
|
"eval_validation_agenda_digitale_runtime": 187.0962, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 1496 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_leggepertutti_loss": 1.269508957862854, |
|
"eval_validation_leggepertutti_runtime": 35.7762, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 1496 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_altalexprivacy_loss": 1.2556049823760986, |
|
"eval_validation_altalexprivacy_runtime": 58.3467, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 1496 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_mc4_it_loss": 1.8174842596054077, |
|
"eval_validation_mc4_it_runtime": 78.1412, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 1496 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_validation_dolma_loss": 1.9592047929763794, |
|
"eval_validation_dolma_runtime": 53.9471, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 1496 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"grad_norm": 3.359375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5694, |
|
"step": 1683 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_validation_privacy_sources_loss": 0.8737432956695557, |
|
"eval_validation_privacy_sources_runtime": 210.8196, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 1683 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_validation_agenda_digitale_loss": 1.4132717847824097, |
|
"eval_validation_agenda_digitale_runtime": 187.1554, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 1683 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_validation_leggepertutti_loss": 1.2630620002746582, |
|
"eval_validation_leggepertutti_runtime": 35.7934, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 1683 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_validation_altalexprivacy_loss": 1.247528076171875, |
|
"eval_validation_altalexprivacy_runtime": 58.3547, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.816, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 1683 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_validation_mc4_it_loss": 1.8103784322738647, |
|
"eval_validation_mc4_it_runtime": 78.1665, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 1683 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"eval_validation_dolma_loss": 1.956905722618103, |
|
"eval_validation_dolma_runtime": 53.9622, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 1683 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"grad_norm": 3.1875, |
|
"learning_rate": 1e-05, |
|
"loss": 1.563, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_privacy_sources_loss": 0.8650386929512024, |
|
"eval_validation_privacy_sources_runtime": 210.8215, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_agenda_digitale_loss": 1.4071804285049438, |
|
"eval_validation_agenda_digitale_runtime": 187.1502, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_leggepertutti_loss": 1.2562586069107056, |
|
"eval_validation_leggepertutti_runtime": 35.7742, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_altalexprivacy_loss": 1.240662932395935, |
|
"eval_validation_altalexprivacy_runtime": 58.3499, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_mc4_it_loss": 1.8042465448379517, |
|
"eval_validation_mc4_it_runtime": 78.1652, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_validation_dolma_loss": 1.9527182579040527, |
|
"eval_validation_dolma_runtime": 53.948, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 1870 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"grad_norm": 3.171875, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5747, |
|
"step": 2057 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_validation_privacy_sources_loss": 0.8606281876564026, |
|
"eval_validation_privacy_sources_runtime": 210.8197, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 2057 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_validation_agenda_digitale_loss": 1.401216983795166, |
|
"eval_validation_agenda_digitale_runtime": 187.1929, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.816, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 2057 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_validation_leggepertutti_loss": 1.249880075454712, |
|
"eval_validation_leggepertutti_runtime": 35.7828, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 2057 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_validation_altalexprivacy_loss": 1.2347912788391113, |
|
"eval_validation_altalexprivacy_runtime": 58.3271, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 2057 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_validation_mc4_it_loss": 1.7988897562026978, |
|
"eval_validation_mc4_it_runtime": 78.1637, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 2057 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_validation_dolma_loss": 1.9512945413589478, |
|
"eval_validation_dolma_runtime": 53.9545, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 2057 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"grad_norm": 3.703125, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5631, |
|
"step": 2244 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_privacy_sources_loss": 0.8552854061126709, |
|
"eval_validation_privacy_sources_runtime": 210.7654, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 2244 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_agenda_digitale_loss": 1.3981597423553467, |
|
"eval_validation_agenda_digitale_runtime": 187.0896, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 2244 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_leggepertutti_loss": 1.249776840209961, |
|
"eval_validation_leggepertutti_runtime": 35.7701, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 2244 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_altalexprivacy_loss": 1.2317657470703125, |
|
"eval_validation_altalexprivacy_runtime": 58.3402, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 2244 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_mc4_it_loss": 1.7936795949935913, |
|
"eval_validation_mc4_it_runtime": 78.1539, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 2244 |
|
}, |
|
{ |
|
"epoch": 0.19, |
|
"eval_validation_dolma_loss": 1.949507474899292, |
|
"eval_validation_dolma_runtime": 53.9287, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 2244 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"grad_norm": 3.28125, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5502, |
|
"step": 2431 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_validation_privacy_sources_loss": 0.8490111231803894, |
|
"eval_validation_privacy_sources_runtime": 210.7371, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 2431 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_validation_agenda_digitale_loss": 1.391976237297058, |
|
"eval_validation_agenda_digitale_runtime": 187.0694, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 2431 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_validation_leggepertutti_loss": 1.2457927465438843, |
|
"eval_validation_leggepertutti_runtime": 35.7756, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 2431 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_validation_altalexprivacy_loss": 1.2249823808670044, |
|
"eval_validation_altalexprivacy_runtime": 58.3391, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 2431 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_validation_mc4_it_loss": 1.7877947092056274, |
|
"eval_validation_mc4_it_runtime": 78.1519, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 2431 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_validation_dolma_loss": 1.9478541612625122, |
|
"eval_validation_dolma_runtime": 53.9392, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 2431 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"grad_norm": 3.109375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5612, |
|
"step": 2618 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_validation_privacy_sources_loss": 0.8443201184272766, |
|
"eval_validation_privacy_sources_runtime": 210.7053, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 2618 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_validation_agenda_digitale_loss": 1.3874356746673584, |
|
"eval_validation_agenda_digitale_runtime": 187.0741, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 2618 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_validation_leggepertutti_loss": 1.242628574371338, |
|
"eval_validation_leggepertutti_runtime": 35.7724, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 2618 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_validation_altalexprivacy_loss": 1.22023606300354, |
|
"eval_validation_altalexprivacy_runtime": 58.3215, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 2618 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_validation_mc4_it_loss": 1.783267617225647, |
|
"eval_validation_mc4_it_runtime": 78.1277, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 2618 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_validation_dolma_loss": 1.9474639892578125, |
|
"eval_validation_dolma_runtime": 53.9215, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 2618 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"grad_norm": 9.0, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5625, |
|
"step": 2805 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_validation_privacy_sources_loss": 0.8386737108230591, |
|
"eval_validation_privacy_sources_runtime": 210.6496, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 2805 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_validation_agenda_digitale_loss": 1.3825620412826538, |
|
"eval_validation_agenda_digitale_runtime": 186.9852, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 2805 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_validation_leggepertutti_loss": 1.2439346313476562, |
|
"eval_validation_leggepertutti_runtime": 35.762, |
|
"eval_validation_leggepertutti_samples_per_second": 1.818, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 2805 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_validation_altalexprivacy_loss": 1.2144984006881714, |
|
"eval_validation_altalexprivacy_runtime": 58.2929, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 2805 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_validation_mc4_it_loss": 1.7777953147888184, |
|
"eval_validation_mc4_it_runtime": 78.0862, |
|
"eval_validation_mc4_it_samples_per_second": 1.819, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 2805 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_validation_dolma_loss": 1.9426158666610718, |
|
"eval_validation_dolma_runtime": 53.8932, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 2805 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"grad_norm": 3.09375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5659, |
|
"step": 2992 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_validation_privacy_sources_loss": 0.8341156840324402, |
|
"eval_validation_privacy_sources_runtime": 210.6733, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 2992 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_validation_agenda_digitale_loss": 1.3803825378417969, |
|
"eval_validation_agenda_digitale_runtime": 187.0096, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 2992 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_validation_leggepertutti_loss": 1.2398289442062378, |
|
"eval_validation_leggepertutti_runtime": 35.7578, |
|
"eval_validation_leggepertutti_samples_per_second": 1.818, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 2992 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_validation_altalexprivacy_loss": 1.2100013494491577, |
|
"eval_validation_altalexprivacy_runtime": 58.3051, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 2992 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_validation_mc4_it_loss": 1.7749333381652832, |
|
"eval_validation_mc4_it_runtime": 78.0968, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 2992 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_validation_dolma_loss": 1.9426519870758057, |
|
"eval_validation_dolma_runtime": 53.9195, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 2992 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"grad_norm": 3.265625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5527, |
|
"step": 3179 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_validation_privacy_sources_loss": 0.8318145871162415, |
|
"eval_validation_privacy_sources_runtime": 210.7255, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 3179 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_validation_agenda_digitale_loss": 1.378063440322876, |
|
"eval_validation_agenda_digitale_runtime": 187.087, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 3179 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_validation_leggepertutti_loss": 1.2370458841323853, |
|
"eval_validation_leggepertutti_runtime": 35.7809, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 3179 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_validation_altalexprivacy_loss": 1.2080256938934326, |
|
"eval_validation_altalexprivacy_runtime": 58.3354, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 3179 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_validation_mc4_it_loss": 1.7702537775039673, |
|
"eval_validation_mc4_it_runtime": 78.1409, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 3179 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_validation_dolma_loss": 1.950868844985962, |
|
"eval_validation_dolma_runtime": 53.9369, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 3179 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"grad_norm": 3.265625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5476, |
|
"step": 3366 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_validation_privacy_sources_loss": 0.8264653086662292, |
|
"eval_validation_privacy_sources_runtime": 210.7205, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 3366 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_validation_agenda_digitale_loss": 1.3743617534637451, |
|
"eval_validation_agenda_digitale_runtime": 187.1448, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 3366 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_validation_leggepertutti_loss": 1.2376344203948975, |
|
"eval_validation_leggepertutti_runtime": 35.7729, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 3366 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_validation_altalexprivacy_loss": 1.2052847146987915, |
|
"eval_validation_altalexprivacy_runtime": 58.3348, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 3366 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_validation_mc4_it_loss": 1.7669274806976318, |
|
"eval_validation_mc4_it_runtime": 78.1532, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 3366 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_validation_dolma_loss": 1.9461361169815063, |
|
"eval_validation_dolma_runtime": 53.9281, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 3366 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"grad_norm": 3.625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.558, |
|
"step": 3553 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_validation_privacy_sources_loss": 0.822688102722168, |
|
"eval_validation_privacy_sources_runtime": 210.9998, |
|
"eval_validation_privacy_sources_samples_per_second": 1.815, |
|
"eval_validation_privacy_sources_steps_per_second": 0.91, |
|
"step": 3553 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_validation_agenda_digitale_loss": 1.3728498220443726, |
|
"eval_validation_agenda_digitale_runtime": 187.2711, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.816, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 3553 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_validation_leggepertutti_loss": 1.2360832691192627, |
|
"eval_validation_leggepertutti_runtime": 35.7958, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 3553 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_validation_altalexprivacy_loss": 1.2027132511138916, |
|
"eval_validation_altalexprivacy_runtime": 58.3972, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.815, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 3553 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_validation_mc4_it_loss": 1.7643710374832153, |
|
"eval_validation_mc4_it_runtime": 78.2118, |
|
"eval_validation_mc4_it_samples_per_second": 1.816, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 3553 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_validation_dolma_loss": 1.9442397356033325, |
|
"eval_validation_dolma_runtime": 53.9609, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 3553 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"grad_norm": 4.65625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.535, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_privacy_sources_loss": 0.8193829655647278, |
|
"eval_validation_privacy_sources_runtime": 210.8214, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_agenda_digitale_loss": 1.3690398931503296, |
|
"eval_validation_agenda_digitale_runtime": 187.1433, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_leggepertutti_loss": 1.2321481704711914, |
|
"eval_validation_leggepertutti_runtime": 35.7856, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_altalexprivacy_loss": 1.1964303255081177, |
|
"eval_validation_altalexprivacy_runtime": 58.3552, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.816, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_mc4_it_loss": 1.7612253427505493, |
|
"eval_validation_mc4_it_runtime": 78.1715, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_validation_dolma_loss": 1.9415688514709473, |
|
"eval_validation_dolma_runtime": 53.9531, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 3740 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"grad_norm": 3.203125, |
|
"learning_rate": 1e-05, |
|
"loss": 1.551, |
|
"step": 3927 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_validation_privacy_sources_loss": 0.8159863352775574, |
|
"eval_validation_privacy_sources_runtime": 210.8294, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 3927 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_validation_agenda_digitale_loss": 1.3660005331039429, |
|
"eval_validation_agenda_digitale_runtime": 187.2084, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.816, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 3927 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_validation_leggepertutti_loss": 1.2291594743728638, |
|
"eval_validation_leggepertutti_runtime": 35.7917, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 3927 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_validation_altalexprivacy_loss": 1.1953657865524292, |
|
"eval_validation_altalexprivacy_runtime": 58.3486, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 3927 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_validation_mc4_it_loss": 1.7568954229354858, |
|
"eval_validation_mc4_it_runtime": 78.1754, |
|
"eval_validation_mc4_it_samples_per_second": 1.816, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 3927 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_validation_dolma_loss": 1.9388848543167114, |
|
"eval_validation_dolma_runtime": 53.9683, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 3927 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"grad_norm": 3.578125, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5452, |
|
"step": 4114 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_privacy_sources_loss": 0.8137150406837463, |
|
"eval_validation_privacy_sources_runtime": 210.7357, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 4114 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_agenda_digitale_loss": 1.3656136989593506, |
|
"eval_validation_agenda_digitale_runtime": 187.146, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 4114 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_leggepertutti_loss": 1.2296239137649536, |
|
"eval_validation_leggepertutti_runtime": 35.7766, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 4114 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_altalexprivacy_loss": 1.1915565729141235, |
|
"eval_validation_altalexprivacy_runtime": 58.3322, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 4114 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_mc4_it_loss": 1.7542990446090698, |
|
"eval_validation_mc4_it_runtime": 78.1622, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 4114 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"eval_validation_dolma_loss": 1.9385536909103394, |
|
"eval_validation_dolma_runtime": 53.9474, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 4114 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"grad_norm": 3.421875, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5371, |
|
"step": 4301 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_validation_privacy_sources_loss": 0.8114846348762512, |
|
"eval_validation_privacy_sources_runtime": 210.7483, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 4301 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_validation_agenda_digitale_loss": 1.36287522315979, |
|
"eval_validation_agenda_digitale_runtime": 187.0978, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 4301 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_validation_leggepertutti_loss": 1.225502371788025, |
|
"eval_validation_leggepertutti_runtime": 35.7725, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 4301 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_validation_altalexprivacy_loss": 1.1899324655532837, |
|
"eval_validation_altalexprivacy_runtime": 58.3269, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 4301 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_validation_mc4_it_loss": 1.7518540620803833, |
|
"eval_validation_mc4_it_runtime": 78.1395, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 4301 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"eval_validation_dolma_loss": 1.9364405870437622, |
|
"eval_validation_dolma_runtime": 53.9366, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 4301 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"grad_norm": 3.4375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5349, |
|
"step": 4488 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_validation_privacy_sources_loss": 0.8089282512664795, |
|
"eval_validation_privacy_sources_runtime": 210.6735, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 4488 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_validation_agenda_digitale_loss": 1.3604696989059448, |
|
"eval_validation_agenda_digitale_runtime": 187.0247, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 4488 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_validation_leggepertutti_loss": 1.2236857414245605, |
|
"eval_validation_leggepertutti_runtime": 35.775, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 4488 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_validation_altalexprivacy_loss": 1.1892808675765991, |
|
"eval_validation_altalexprivacy_runtime": 58.2983, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 4488 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_validation_mc4_it_loss": 1.7490640878677368, |
|
"eval_validation_mc4_it_runtime": 78.1304, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 4488 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"eval_validation_dolma_loss": 1.9361358880996704, |
|
"eval_validation_dolma_runtime": 53.9258, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 4488 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"grad_norm": 3.265625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.538, |
|
"step": 4675 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_privacy_sources_loss": 0.8068882822990417, |
|
"eval_validation_privacy_sources_runtime": 210.6987, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 4675 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_agenda_digitale_loss": 1.357992172241211, |
|
"eval_validation_agenda_digitale_runtime": 187.0601, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 4675 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_leggepertutti_loss": 1.2222189903259277, |
|
"eval_validation_leggepertutti_runtime": 35.7685, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 4675 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_altalexprivacy_loss": 1.1868293285369873, |
|
"eval_validation_altalexprivacy_runtime": 58.3028, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 4675 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_mc4_it_loss": 1.747467279434204, |
|
"eval_validation_mc4_it_runtime": 78.0822, |
|
"eval_validation_mc4_it_samples_per_second": 1.819, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 4675 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_validation_dolma_loss": 1.9376739263534546, |
|
"eval_validation_dolma_runtime": 53.9131, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 4675 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"grad_norm": 4.5625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5217, |
|
"step": 4862 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_validation_privacy_sources_loss": 0.8034628033638, |
|
"eval_validation_privacy_sources_runtime": 210.664, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 4862 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_validation_agenda_digitale_loss": 1.3556355237960815, |
|
"eval_validation_agenda_digitale_runtime": 187.0481, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 4862 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_validation_leggepertutti_loss": 1.2238881587982178, |
|
"eval_validation_leggepertutti_runtime": 35.77, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 4862 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_validation_altalexprivacy_loss": 1.1821054220199585, |
|
"eval_validation_altalexprivacy_runtime": 58.3131, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 4862 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_validation_mc4_it_loss": 1.7454167604446411, |
|
"eval_validation_mc4_it_runtime": 78.136, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 4862 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"eval_validation_dolma_loss": 1.9336557388305664, |
|
"eval_validation_dolma_runtime": 53.931, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 4862 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"grad_norm": 3.25, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5231, |
|
"step": 5049 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_validation_privacy_sources_loss": 0.8018712997436523, |
|
"eval_validation_privacy_sources_runtime": 210.6286, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.912, |
|
"step": 5049 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_validation_agenda_digitale_loss": 1.3536696434020996, |
|
"eval_validation_agenda_digitale_runtime": 186.962, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.819, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 5049 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_validation_leggepertutti_loss": 1.219115138053894, |
|
"eval_validation_leggepertutti_runtime": 35.7552, |
|
"eval_validation_leggepertutti_samples_per_second": 1.818, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 5049 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_validation_altalexprivacy_loss": 1.1803195476531982, |
|
"eval_validation_altalexprivacy_runtime": 58.254, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.82, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.91, |
|
"step": 5049 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_validation_mc4_it_loss": 1.7427842617034912, |
|
"eval_validation_mc4_it_runtime": 78.0819, |
|
"eval_validation_mc4_it_samples_per_second": 1.819, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 5049 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_validation_dolma_loss": 1.932908058166504, |
|
"eval_validation_dolma_runtime": 53.9066, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 5049 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"grad_norm": 3.34375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.535, |
|
"step": 5236 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_validation_privacy_sources_loss": 0.7990080714225769, |
|
"eval_validation_privacy_sources_runtime": 210.6936, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 5236 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_validation_agenda_digitale_loss": 1.3512707948684692, |
|
"eval_validation_agenda_digitale_runtime": 187.0661, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 5236 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_validation_leggepertutti_loss": 1.2183226346969604, |
|
"eval_validation_leggepertutti_runtime": 35.7756, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 5236 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_validation_altalexprivacy_loss": 1.1762974262237549, |
|
"eval_validation_altalexprivacy_runtime": 58.3182, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 5236 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_validation_mc4_it_loss": 1.7408561706542969, |
|
"eval_validation_mc4_it_runtime": 78.1139, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 5236 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_validation_dolma_loss": 1.9324188232421875, |
|
"eval_validation_dolma_runtime": 53.9296, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 5236 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"grad_norm": 3.40625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5195, |
|
"step": 5423 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_validation_privacy_sources_loss": 0.7970147728919983, |
|
"eval_validation_privacy_sources_runtime": 210.7209, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 5423 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_validation_agenda_digitale_loss": 1.350595235824585, |
|
"eval_validation_agenda_digitale_runtime": 187.0929, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 5423 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_validation_leggepertutti_loss": 1.2196227312088013, |
|
"eval_validation_leggepertutti_runtime": 35.7764, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 5423 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_validation_altalexprivacy_loss": 1.176468014717102, |
|
"eval_validation_altalexprivacy_runtime": 58.3399, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 5423 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_validation_mc4_it_loss": 1.7395856380462646, |
|
"eval_validation_mc4_it_runtime": 78.1494, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 5423 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_validation_dolma_loss": 1.9318716526031494, |
|
"eval_validation_dolma_runtime": 53.9467, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 5423 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"grad_norm": 3.484375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5356, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_validation_privacy_sources_loss": 0.7967193126678467, |
|
"eval_validation_privacy_sources_runtime": 210.7692, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_validation_agenda_digitale_loss": 1.3498324155807495, |
|
"eval_validation_agenda_digitale_runtime": 187.1217, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_validation_leggepertutti_loss": 1.2213656902313232, |
|
"eval_validation_leggepertutti_runtime": 35.7931, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_validation_altalexprivacy_loss": 1.1725049018859863, |
|
"eval_validation_altalexprivacy_runtime": 58.34, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_validation_mc4_it_loss": 1.7369210720062256, |
|
"eval_validation_mc4_it_runtime": 78.1677, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_validation_dolma_loss": 1.931601643562317, |
|
"eval_validation_dolma_runtime": 53.9523, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 5610 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"grad_norm": 3.25, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5248, |
|
"step": 5797 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_validation_privacy_sources_loss": 0.7927350997924805, |
|
"eval_validation_privacy_sources_runtime": 210.7499, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 5797 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_validation_agenda_digitale_loss": 1.3474359512329102, |
|
"eval_validation_agenda_digitale_runtime": 187.1385, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 5797 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_validation_leggepertutti_loss": 1.2162562608718872, |
|
"eval_validation_leggepertutti_runtime": 35.7966, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 5797 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_validation_altalexprivacy_loss": 1.1715296506881714, |
|
"eval_validation_altalexprivacy_runtime": 58.3612, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.816, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 5797 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_validation_mc4_it_loss": 1.7344577312469482, |
|
"eval_validation_mc4_it_runtime": 78.1843, |
|
"eval_validation_mc4_it_samples_per_second": 1.816, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 5797 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"eval_validation_dolma_loss": 1.9310978651046753, |
|
"eval_validation_dolma_runtime": 53.9513, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 5797 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"grad_norm": 3.390625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5147, |
|
"step": 5984 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_validation_privacy_sources_loss": 0.7904417514801025, |
|
"eval_validation_privacy_sources_runtime": 210.6793, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 5984 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_validation_agenda_digitale_loss": 1.3463512659072876, |
|
"eval_validation_agenda_digitale_runtime": 187.0767, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 5984 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_validation_leggepertutti_loss": 1.2104567289352417, |
|
"eval_validation_leggepertutti_runtime": 35.7676, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 5984 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_validation_altalexprivacy_loss": 1.1698046922683716, |
|
"eval_validation_altalexprivacy_runtime": 58.3216, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 5984 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_validation_mc4_it_loss": 1.733211874961853, |
|
"eval_validation_mc4_it_runtime": 78.1157, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 5984 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_validation_dolma_loss": 1.9291273355484009, |
|
"eval_validation_dolma_runtime": 53.9368, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 5984 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"grad_norm": 3.15625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5307, |
|
"step": 6171 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_validation_privacy_sources_loss": 0.7893861532211304, |
|
"eval_validation_privacy_sources_runtime": 210.7488, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 6171 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_validation_agenda_digitale_loss": 1.3451480865478516, |
|
"eval_validation_agenda_digitale_runtime": 187.0845, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 6171 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_validation_leggepertutti_loss": 1.2113819122314453, |
|
"eval_validation_leggepertutti_runtime": 35.7727, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 6171 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_validation_altalexprivacy_loss": 1.1663610935211182, |
|
"eval_validation_altalexprivacy_runtime": 58.3307, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 6171 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_validation_mc4_it_loss": 1.7309118509292603, |
|
"eval_validation_mc4_it_runtime": 78.1316, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 6171 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"eval_validation_dolma_loss": 1.9281673431396484, |
|
"eval_validation_dolma_runtime": 53.9207, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 6171 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"grad_norm": 3.078125, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5203, |
|
"step": 6358 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_validation_privacy_sources_loss": 0.7874845266342163, |
|
"eval_validation_privacy_sources_runtime": 210.6148, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.912, |
|
"step": 6358 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_validation_agenda_digitale_loss": 1.3434906005859375, |
|
"eval_validation_agenda_digitale_runtime": 186.9358, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.819, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 6358 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_validation_leggepertutti_loss": 1.2103608846664429, |
|
"eval_validation_leggepertutti_runtime": 35.7522, |
|
"eval_validation_leggepertutti_samples_per_second": 1.818, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 6358 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_validation_altalexprivacy_loss": 1.164802074432373, |
|
"eval_validation_altalexprivacy_runtime": 58.2954, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 6358 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_validation_mc4_it_loss": 1.7286055088043213, |
|
"eval_validation_mc4_it_runtime": 78.0929, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 6358 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_validation_dolma_loss": 1.927778720855713, |
|
"eval_validation_dolma_runtime": 53.9081, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 6358 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"grad_norm": 3.59375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5257, |
|
"step": 6545 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_privacy_sources_loss": 0.785801887512207, |
|
"eval_validation_privacy_sources_runtime": 210.655, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 6545 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_agenda_digitale_loss": 1.341984510421753, |
|
"eval_validation_agenda_digitale_runtime": 186.9769, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 6545 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_leggepertutti_loss": 1.208351492881775, |
|
"eval_validation_leggepertutti_runtime": 35.7494, |
|
"eval_validation_leggepertutti_samples_per_second": 1.818, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 6545 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_altalexprivacy_loss": 1.1633599996566772, |
|
"eval_validation_altalexprivacy_runtime": 58.2944, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 6545 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_mc4_it_loss": 1.726757526397705, |
|
"eval_validation_mc4_it_runtime": 78.0983, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 6545 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_validation_dolma_loss": 1.9275562763214111, |
|
"eval_validation_dolma_runtime": 53.8914, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 6545 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"grad_norm": 3.234375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5019, |
|
"step": 6732 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_validation_privacy_sources_loss": 0.7848771214485168, |
|
"eval_validation_privacy_sources_runtime": 210.6636, |
|
"eval_validation_privacy_sources_samples_per_second": 1.818, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 6732 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_validation_agenda_digitale_loss": 1.3411486148834229, |
|
"eval_validation_agenda_digitale_runtime": 186.9976, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.818, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 6732 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_validation_leggepertutti_loss": 1.2077082395553589, |
|
"eval_validation_leggepertutti_runtime": 35.7665, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 6732 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_validation_altalexprivacy_loss": 1.1618914604187012, |
|
"eval_validation_altalexprivacy_runtime": 58.33, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 6732 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_validation_mc4_it_loss": 1.725679874420166, |
|
"eval_validation_mc4_it_runtime": 78.1276, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 6732 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_validation_dolma_loss": 1.9271798133850098, |
|
"eval_validation_dolma_runtime": 53.9117, |
|
"eval_validation_dolma_samples_per_second": 1.818, |
|
"eval_validation_dolma_steps_per_second": 0.909, |
|
"step": 6732 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"grad_norm": 3.15625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5152, |
|
"step": 6919 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_privacy_sources_loss": 0.782995879650116, |
|
"eval_validation_privacy_sources_runtime": 210.7422, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 6919 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_agenda_digitale_loss": 1.3396461009979248, |
|
"eval_validation_agenda_digitale_runtime": 187.0789, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.909, |
|
"step": 6919 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_leggepertutti_loss": 1.2054615020751953, |
|
"eval_validation_leggepertutti_runtime": 35.7709, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.923, |
|
"step": 6919 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_altalexprivacy_loss": 1.1602697372436523, |
|
"eval_validation_altalexprivacy_runtime": 58.3175, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.818, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 6919 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_mc4_it_loss": 1.724775791168213, |
|
"eval_validation_mc4_it_runtime": 78.0214, |
|
"eval_validation_mc4_it_samples_per_second": 1.82, |
|
"eval_validation_mc4_it_steps_per_second": 0.91, |
|
"step": 6919 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"eval_validation_dolma_loss": 1.9262704849243164, |
|
"eval_validation_dolma_runtime": 53.8374, |
|
"eval_validation_dolma_samples_per_second": 1.82, |
|
"eval_validation_dolma_steps_per_second": 0.91, |
|
"step": 6919 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"grad_norm": 3.28125, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5167, |
|
"step": 7106 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_validation_privacy_sources_loss": 0.7818235158920288, |
|
"eval_validation_privacy_sources_runtime": 210.7745, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 7106 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_validation_agenda_digitale_loss": 1.3387728929519653, |
|
"eval_validation_agenda_digitale_runtime": 187.1722, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 7106 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_validation_leggepertutti_loss": 1.2060880661010742, |
|
"eval_validation_leggepertutti_runtime": 35.7758, |
|
"eval_validation_leggepertutti_samples_per_second": 1.817, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 7106 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_validation_altalexprivacy_loss": 1.158158302307129, |
|
"eval_validation_altalexprivacy_runtime": 58.3272, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.909, |
|
"step": 7106 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_validation_mc4_it_loss": 1.7227188348770142, |
|
"eval_validation_mc4_it_runtime": 78.0893, |
|
"eval_validation_mc4_it_samples_per_second": 1.818, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 7106 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_validation_dolma_loss": 1.925492763519287, |
|
"eval_validation_dolma_runtime": 53.8538, |
|
"eval_validation_dolma_samples_per_second": 1.82, |
|
"eval_validation_dolma_steps_per_second": 0.91, |
|
"step": 7106 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"grad_norm": 3.390625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.4819, |
|
"step": 7293 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_privacy_sources_loss": 0.7804288268089294, |
|
"eval_validation_privacy_sources_runtime": 210.7884, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 7293 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_agenda_digitale_loss": 1.337357521057129, |
|
"eval_validation_agenda_digitale_runtime": 187.1395, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.817, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 7293 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_leggepertutti_loss": 1.205103874206543, |
|
"eval_validation_leggepertutti_runtime": 35.7974, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 7293 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_altalexprivacy_loss": 1.155694603919983, |
|
"eval_validation_altalexprivacy_runtime": 58.3571, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.816, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 7293 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_mc4_it_loss": 1.7214677333831787, |
|
"eval_validation_mc4_it_runtime": 78.1458, |
|
"eval_validation_mc4_it_samples_per_second": 1.817, |
|
"eval_validation_mc4_it_steps_per_second": 0.909, |
|
"step": 7293 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_validation_dolma_loss": 1.926133155822754, |
|
"eval_validation_dolma_runtime": 53.9449, |
|
"eval_validation_dolma_samples_per_second": 1.817, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 7293 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"grad_norm": 3.34375, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5164, |
|
"step": 7480 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_validation_privacy_sources_loss": 0.7794305682182312, |
|
"eval_validation_privacy_sources_runtime": 210.7859, |
|
"eval_validation_privacy_sources_samples_per_second": 1.817, |
|
"eval_validation_privacy_sources_steps_per_second": 0.911, |
|
"step": 7480 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_validation_agenda_digitale_loss": 1.3364444971084595, |
|
"eval_validation_agenda_digitale_runtime": 187.1772, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.816, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 7480 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_validation_leggepertutti_loss": 1.2025309801101685, |
|
"eval_validation_leggepertutti_runtime": 35.7941, |
|
"eval_validation_leggepertutti_samples_per_second": 1.816, |
|
"eval_validation_leggepertutti_steps_per_second": 0.922, |
|
"step": 7480 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_validation_altalexprivacy_loss": 1.1547417640686035, |
|
"eval_validation_altalexprivacy_runtime": 58.3512, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.817, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 7480 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_validation_mc4_it_loss": 1.7210993766784668, |
|
"eval_validation_mc4_it_runtime": 78.1723, |
|
"eval_validation_mc4_it_samples_per_second": 1.816, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 7480 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_validation_dolma_loss": 1.925874948501587, |
|
"eval_validation_dolma_runtime": 53.9674, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 7480 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"grad_norm": 3.140625, |
|
"learning_rate": 1e-05, |
|
"loss": 1.5167, |
|
"step": 7667 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_validation_privacy_sources_loss": 0.7769683599472046, |
|
"eval_validation_privacy_sources_runtime": 210.8943, |
|
"eval_validation_privacy_sources_samples_per_second": 1.816, |
|
"eval_validation_privacy_sources_steps_per_second": 0.91, |
|
"step": 7667 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_validation_agenda_digitale_loss": 1.3346428871154785, |
|
"eval_validation_agenda_digitale_runtime": 187.2224, |
|
"eval_validation_agenda_digitale_samples_per_second": 1.816, |
|
"eval_validation_agenda_digitale_steps_per_second": 0.908, |
|
"step": 7667 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_validation_leggepertutti_loss": 1.2033891677856445, |
|
"eval_validation_leggepertutti_runtime": 35.8133, |
|
"eval_validation_leggepertutti_samples_per_second": 1.815, |
|
"eval_validation_leggepertutti_steps_per_second": 0.921, |
|
"step": 7667 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_validation_altalexprivacy_loss": 1.1526622772216797, |
|
"eval_validation_altalexprivacy_runtime": 58.3616, |
|
"eval_validation_altalexprivacy_samples_per_second": 1.816, |
|
"eval_validation_altalexprivacy_steps_per_second": 0.908, |
|
"step": 7667 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_validation_mc4_it_loss": 1.7187703847885132, |
|
"eval_validation_mc4_it_runtime": 78.1967, |
|
"eval_validation_mc4_it_samples_per_second": 1.816, |
|
"eval_validation_mc4_it_steps_per_second": 0.908, |
|
"step": 7667 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"eval_validation_dolma_loss": 1.9250844717025757, |
|
"eval_validation_dolma_runtime": 53.9678, |
|
"eval_validation_dolma_samples_per_second": 1.816, |
|
"eval_validation_dolma_steps_per_second": 0.908, |
|
"step": 7667 |
|
} |
|
], |
|
"logging_steps": 187, |
|
"max_steps": 23720, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 2, |
|
"save_steps": 187, |
|
"total_flos": 3.215568919621062e+19, |
|
"train_batch_size": 1, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|