LexLLMv0.0.0.x.10.23_060 / trainer_state.json
andrealexroom's picture
Upload folder using huggingface_hub
f1ae7b4 verified
raw
history blame contribute delete
No virus
49.8 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.6005253374988001,
"eval_steps": 187,
"global_step": 4301,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"grad_norm": 6.75,
"learning_rate": 1e-05,
"loss": 1.5273,
"step": 1
},
{
"epoch": 0.03,
"grad_norm": 4.84375,
"learning_rate": 1e-05,
"loss": 1.4233,
"step": 187
},
{
"epoch": 0.03,
"eval_validation_loss": 0.9953275918960571,
"eval_validation_runtime": 194.4686,
"eval_validation_samples_per_second": 1.455,
"eval_validation_steps_per_second": 0.73,
"step": 187
},
{
"epoch": 0.03,
"eval_validation_privacy_sources_loss": 0.9953275918960571,
"eval_validation_privacy_sources_runtime": 194.1974,
"eval_validation_privacy_sources_samples_per_second": 1.457,
"eval_validation_privacy_sources_steps_per_second": 0.731,
"step": 187
},
{
"epoch": 0.03,
"eval_validation_agenda_digitale_loss": 1.5556422472000122,
"eval_validation_agenda_digitale_runtime": 174.2863,
"eval_validation_agenda_digitale_samples_per_second": 1.457,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 187
},
{
"epoch": 0.03,
"eval_validation_legal_articles_loss": 1.4555308818817139,
"eval_validation_legal_articles_runtime": 280.5049,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 187
},
{
"epoch": 0.03,
"eval_validation_dolma_loss": 1.8503074645996094,
"eval_validation_dolma_runtime": 111.0987,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 187
},
{
"epoch": 0.03,
"eval_validation_leggepertutti_loss": 1.3198411464691162,
"eval_validation_leggepertutti_runtime": 32.2433,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 187
},
{
"epoch": 0.03,
"eval_validation_stack_loss": 0.7054847478866577,
"eval_validation_stack_runtime": 150.1631,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.733,
"step": 187
},
{
"epoch": 0.05,
"grad_norm": 3.21875,
"learning_rate": 1e-05,
"loss": 1.36,
"step": 374
},
{
"epoch": 0.05,
"eval_validation_loss": 0.9383934140205383,
"eval_validation_runtime": 194.1055,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 374
},
{
"epoch": 0.05,
"eval_validation_privacy_sources_loss": 0.9383934140205383,
"eval_validation_privacy_sources_runtime": 194.049,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 374
},
{
"epoch": 0.05,
"eval_validation_agenda_digitale_loss": 1.5316377878189087,
"eval_validation_agenda_digitale_runtime": 174.1261,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 374
},
{
"epoch": 0.05,
"eval_validation_legal_articles_loss": 1.4261502027511597,
"eval_validation_legal_articles_runtime": 280.4336,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 374
},
{
"epoch": 0.05,
"eval_validation_dolma_loss": 1.8504927158355713,
"eval_validation_dolma_runtime": 111.0511,
"eval_validation_dolma_samples_per_second": 1.459,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 374
},
{
"epoch": 0.05,
"eval_validation_leggepertutti_loss": 1.2899781465530396,
"eval_validation_leggepertutti_runtime": 32.2352,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.745,
"step": 374
},
{
"epoch": 0.05,
"eval_validation_stack_loss": 0.6623784303665161,
"eval_validation_stack_runtime": 150.1338,
"eval_validation_stack_samples_per_second": 1.459,
"eval_validation_stack_steps_per_second": 0.733,
"step": 374
},
{
"epoch": 0.08,
"grad_norm": 2.984375,
"learning_rate": 1e-05,
"loss": 1.335,
"step": 561
},
{
"epoch": 0.08,
"eval_validation_loss": 0.9139429926872253,
"eval_validation_runtime": 194.0822,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 561
},
{
"epoch": 0.08,
"eval_validation_privacy_sources_loss": 0.9139429926872253,
"eval_validation_privacy_sources_runtime": 194.1531,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.731,
"step": 561
},
{
"epoch": 0.08,
"eval_validation_agenda_digitale_loss": 1.5203362703323364,
"eval_validation_agenda_digitale_runtime": 174.1785,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 561
},
{
"epoch": 0.08,
"eval_validation_legal_articles_loss": 1.4142487049102783,
"eval_validation_legal_articles_runtime": 280.7608,
"eval_validation_legal_articles_samples_per_second": 1.457,
"eval_validation_legal_articles_steps_per_second": 0.73,
"step": 561
},
{
"epoch": 0.08,
"eval_validation_dolma_loss": 1.8510735034942627,
"eval_validation_dolma_runtime": 111.1069,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 561
},
{
"epoch": 0.08,
"eval_validation_leggepertutti_loss": 1.2792346477508545,
"eval_validation_leggepertutti_runtime": 32.2763,
"eval_validation_leggepertutti_samples_per_second": 1.456,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 561
},
{
"epoch": 0.08,
"eval_validation_stack_loss": 0.6663106083869934,
"eval_validation_stack_runtime": 150.2829,
"eval_validation_stack_samples_per_second": 1.457,
"eval_validation_stack_steps_per_second": 0.732,
"step": 561
},
{
"epoch": 0.1,
"grad_norm": 3.34375,
"learning_rate": 1e-05,
"loss": 1.3227,
"step": 748
},
{
"epoch": 0.1,
"eval_validation_loss": 0.8906309008598328,
"eval_validation_runtime": 193.9915,
"eval_validation_samples_per_second": 1.459,
"eval_validation_steps_per_second": 0.732,
"step": 748
},
{
"epoch": 0.1,
"eval_validation_privacy_sources_loss": 0.8906309008598328,
"eval_validation_privacy_sources_runtime": 193.9118,
"eval_validation_privacy_sources_samples_per_second": 1.459,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 748
},
{
"epoch": 0.1,
"eval_validation_agenda_digitale_loss": 1.505711555480957,
"eval_validation_agenda_digitale_runtime": 174.1465,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 748
},
{
"epoch": 0.1,
"eval_validation_legal_articles_loss": 1.4007651805877686,
"eval_validation_legal_articles_runtime": 280.6207,
"eval_validation_legal_articles_samples_per_second": 1.457,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 748
},
{
"epoch": 0.1,
"eval_validation_dolma_loss": 1.8508217334747314,
"eval_validation_dolma_runtime": 111.0428,
"eval_validation_dolma_samples_per_second": 1.459,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 748
},
{
"epoch": 0.1,
"eval_validation_leggepertutti_loss": 1.2712979316711426,
"eval_validation_leggepertutti_runtime": 32.243,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 748
},
{
"epoch": 0.1,
"eval_validation_stack_loss": 0.6624295711517334,
"eval_validation_stack_runtime": 150.1684,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.733,
"step": 748
},
{
"epoch": 0.13,
"grad_norm": 3.1875,
"learning_rate": 1e-05,
"loss": 1.2894,
"step": 935
},
{
"epoch": 0.13,
"eval_validation_loss": 0.8783557415008545,
"eval_validation_runtime": 194.0651,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 935
},
{
"epoch": 0.13,
"eval_validation_privacy_sources_loss": 0.8783557415008545,
"eval_validation_privacy_sources_runtime": 194.2156,
"eval_validation_privacy_sources_samples_per_second": 1.457,
"eval_validation_privacy_sources_steps_per_second": 0.731,
"step": 935
},
{
"epoch": 0.13,
"eval_validation_agenda_digitale_loss": 1.4970660209655762,
"eval_validation_agenda_digitale_runtime": 174.2301,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 935
},
{
"epoch": 0.13,
"eval_validation_legal_articles_loss": 1.3921587467193604,
"eval_validation_legal_articles_runtime": 280.4294,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 935
},
{
"epoch": 0.13,
"eval_validation_dolma_loss": 1.851251244544983,
"eval_validation_dolma_runtime": 111.0768,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 935
},
{
"epoch": 0.13,
"eval_validation_leggepertutti_loss": 1.2646007537841797,
"eval_validation_leggepertutti_runtime": 32.2511,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 935
},
{
"epoch": 0.13,
"eval_validation_stack_loss": 0.667582631111145,
"eval_validation_stack_runtime": 150.215,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 935
},
{
"epoch": 0.16,
"grad_norm": 6.3125,
"learning_rate": 1e-05,
"loss": 1.2936,
"step": 1122
},
{
"epoch": 0.16,
"eval_validation_loss": 0.8658438920974731,
"eval_validation_runtime": 193.9819,
"eval_validation_samples_per_second": 1.459,
"eval_validation_steps_per_second": 0.732,
"step": 1122
},
{
"epoch": 0.16,
"eval_validation_privacy_sources_loss": 0.8658438920974731,
"eval_validation_privacy_sources_runtime": 193.9777,
"eval_validation_privacy_sources_samples_per_second": 1.459,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 1122
},
{
"epoch": 0.16,
"eval_validation_agenda_digitale_loss": 1.4888020753860474,
"eval_validation_agenda_digitale_runtime": 174.0686,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.73,
"step": 1122
},
{
"epoch": 0.16,
"eval_validation_legal_articles_loss": 1.384485125541687,
"eval_validation_legal_articles_runtime": 280.3377,
"eval_validation_legal_articles_samples_per_second": 1.459,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 1122
},
{
"epoch": 0.16,
"eval_validation_dolma_loss": 1.855146050453186,
"eval_validation_dolma_runtime": 110.9957,
"eval_validation_dolma_samples_per_second": 1.46,
"eval_validation_dolma_steps_per_second": 0.73,
"step": 1122
},
{
"epoch": 0.16,
"eval_validation_leggepertutti_loss": 1.2589794397354126,
"eval_validation_leggepertutti_runtime": 32.2366,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 1122
},
{
"epoch": 0.16,
"eval_validation_stack_loss": 0.6629025340080261,
"eval_validation_stack_runtime": 150.1177,
"eval_validation_stack_samples_per_second": 1.459,
"eval_validation_stack_steps_per_second": 0.733,
"step": 1122
},
{
"epoch": 0.18,
"grad_norm": 3.25,
"learning_rate": 1e-05,
"loss": 1.2703,
"step": 1309
},
{
"epoch": 0.18,
"eval_validation_loss": 0.8527970910072327,
"eval_validation_runtime": 193.9817,
"eval_validation_samples_per_second": 1.459,
"eval_validation_steps_per_second": 0.732,
"step": 1309
},
{
"epoch": 0.18,
"eval_validation_privacy_sources_loss": 0.8527970910072327,
"eval_validation_privacy_sources_runtime": 194.001,
"eval_validation_privacy_sources_samples_per_second": 1.459,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 1309
},
{
"epoch": 0.18,
"eval_validation_agenda_digitale_loss": 1.4821778535842896,
"eval_validation_agenda_digitale_runtime": 174.0669,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.73,
"step": 1309
},
{
"epoch": 0.18,
"eval_validation_legal_articles_loss": 1.3752673864364624,
"eval_validation_legal_articles_runtime": 280.3145,
"eval_validation_legal_articles_samples_per_second": 1.459,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 1309
},
{
"epoch": 0.18,
"eval_validation_dolma_loss": 1.851420283317566,
"eval_validation_dolma_runtime": 111.0747,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 1309
},
{
"epoch": 0.18,
"eval_validation_leggepertutti_loss": 1.2481449842453003,
"eval_validation_leggepertutti_runtime": 32.2435,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 1309
},
{
"epoch": 0.18,
"eval_validation_stack_loss": 0.663459062576294,
"eval_validation_stack_runtime": 150.3253,
"eval_validation_stack_samples_per_second": 1.457,
"eval_validation_stack_steps_per_second": 0.732,
"step": 1309
},
{
"epoch": 0.21,
"grad_norm": 3.3125,
"learning_rate": 1e-05,
"loss": 1.2603,
"step": 1496
},
{
"epoch": 0.21,
"eval_validation_loss": 0.8457313776016235,
"eval_validation_runtime": 194.1045,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 1496
},
{
"epoch": 0.21,
"eval_validation_privacy_sources_loss": 0.8457313776016235,
"eval_validation_privacy_sources_runtime": 194.0987,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 1496
},
{
"epoch": 0.21,
"eval_validation_agenda_digitale_loss": 1.4775303602218628,
"eval_validation_agenda_digitale_runtime": 174.2206,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 1496
},
{
"epoch": 0.21,
"eval_validation_legal_articles_loss": 1.3696094751358032,
"eval_validation_legal_articles_runtime": 280.5342,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 1496
},
{
"epoch": 0.21,
"eval_validation_dolma_loss": 1.8503979444503784,
"eval_validation_dolma_runtime": 111.072,
"eval_validation_dolma_samples_per_second": 1.459,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 1496
},
{
"epoch": 0.21,
"eval_validation_leggepertutti_loss": 1.2421447038650513,
"eval_validation_leggepertutti_runtime": 32.2684,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 1496
},
{
"epoch": 0.21,
"eval_validation_stack_loss": 0.6622874140739441,
"eval_validation_stack_runtime": 150.2083,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 1496
},
{
"epoch": 0.23,
"grad_norm": 2.78125,
"learning_rate": 1e-05,
"loss": 1.2556,
"step": 1683
},
{
"epoch": 0.23,
"eval_validation_loss": 0.8370487689971924,
"eval_validation_runtime": 194.2283,
"eval_validation_samples_per_second": 1.457,
"eval_validation_steps_per_second": 0.731,
"step": 1683
},
{
"epoch": 0.23,
"eval_validation_privacy_sources_loss": 0.8370487689971924,
"eval_validation_privacy_sources_runtime": 194.3184,
"eval_validation_privacy_sources_samples_per_second": 1.456,
"eval_validation_privacy_sources_steps_per_second": 0.731,
"step": 1683
},
{
"epoch": 0.23,
"eval_validation_agenda_digitale_loss": 1.4706999063491821,
"eval_validation_agenda_digitale_runtime": 174.3662,
"eval_validation_agenda_digitale_samples_per_second": 1.457,
"eval_validation_agenda_digitale_steps_per_second": 0.728,
"step": 1683
},
{
"epoch": 0.23,
"eval_validation_legal_articles_loss": 1.363641381263733,
"eval_validation_legal_articles_runtime": 280.656,
"eval_validation_legal_articles_samples_per_second": 1.457,
"eval_validation_legal_articles_steps_per_second": 0.73,
"step": 1683
},
{
"epoch": 0.23,
"eval_validation_dolma_loss": 1.848027229309082,
"eval_validation_dolma_runtime": 111.1824,
"eval_validation_dolma_samples_per_second": 1.457,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 1683
},
{
"epoch": 0.23,
"eval_validation_leggepertutti_loss": 1.240347146987915,
"eval_validation_leggepertutti_runtime": 32.2674,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 1683
},
{
"epoch": 0.23,
"eval_validation_stack_loss": 0.6605746746063232,
"eval_validation_stack_runtime": 150.2441,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 1683
},
{
"epoch": 0.26,
"grad_norm": 3.1875,
"learning_rate": 1e-05,
"loss": 1.25,
"step": 1870
},
{
"epoch": 0.26,
"eval_validation_loss": 0.8285319805145264,
"eval_validation_runtime": 194.0857,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 1870
},
{
"epoch": 0.26,
"eval_validation_privacy_sources_loss": 0.8285319805145264,
"eval_validation_privacy_sources_runtime": 194.1082,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 1870
},
{
"epoch": 0.26,
"eval_validation_agenda_digitale_loss": 1.467832088470459,
"eval_validation_agenda_digitale_runtime": 174.0948,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 1870
},
{
"epoch": 0.26,
"eval_validation_legal_articles_loss": 1.3606085777282715,
"eval_validation_legal_articles_runtime": 280.4529,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 1870
},
{
"epoch": 0.26,
"eval_validation_dolma_loss": 1.8478673696517944,
"eval_validation_dolma_runtime": 111.0459,
"eval_validation_dolma_samples_per_second": 1.459,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 1870
},
{
"epoch": 0.26,
"eval_validation_leggepertutti_loss": 1.2359322309494019,
"eval_validation_leggepertutti_runtime": 32.2397,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 1870
},
{
"epoch": 0.26,
"eval_validation_stack_loss": 0.6594959497451782,
"eval_validation_stack_runtime": 150.1577,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.733,
"step": 1870
},
{
"epoch": 0.29,
"grad_norm": 4.96875,
"learning_rate": 1e-05,
"loss": 1.238,
"step": 2057
},
{
"epoch": 0.29,
"eval_validation_loss": 0.8220862150192261,
"eval_validation_runtime": 194.0761,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 2057
},
{
"epoch": 0.29,
"eval_validation_privacy_sources_loss": 0.8220862150192261,
"eval_validation_privacy_sources_runtime": 194.0716,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 2057
},
{
"epoch": 0.29,
"eval_validation_agenda_digitale_loss": 1.4595245122909546,
"eval_validation_agenda_digitale_runtime": 174.1501,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 2057
},
{
"epoch": 0.29,
"eval_validation_legal_articles_loss": 1.355904221534729,
"eval_validation_legal_articles_runtime": 280.5038,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 2057
},
{
"epoch": 0.29,
"eval_validation_dolma_loss": 1.846190333366394,
"eval_validation_dolma_runtime": 111.1135,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 2057
},
{
"epoch": 0.29,
"eval_validation_leggepertutti_loss": 1.2381559610366821,
"eval_validation_leggepertutti_runtime": 32.2445,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 2057
},
{
"epoch": 0.29,
"eval_validation_stack_loss": 0.660571813583374,
"eval_validation_stack_runtime": 150.2476,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 2057
},
{
"epoch": 0.31,
"grad_norm": 9.0,
"learning_rate": 1e-05,
"loss": 1.2384,
"step": 2244
},
{
"epoch": 0.31,
"eval_validation_loss": 0.8178092241287231,
"eval_validation_runtime": 194.1251,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.731,
"step": 2244
},
{
"epoch": 0.31,
"eval_validation_privacy_sources_loss": 0.8178092241287231,
"eval_validation_privacy_sources_runtime": 194.0771,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 2244
},
{
"epoch": 0.31,
"eval_validation_agenda_digitale_loss": 1.460057258605957,
"eval_validation_agenda_digitale_runtime": 174.2114,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 2244
},
{
"epoch": 0.31,
"eval_validation_legal_articles_loss": 1.3545092344284058,
"eval_validation_legal_articles_runtime": 280.7055,
"eval_validation_legal_articles_samples_per_second": 1.457,
"eval_validation_legal_articles_steps_per_second": 0.73,
"step": 2244
},
{
"epoch": 0.31,
"eval_validation_dolma_loss": 1.8475868701934814,
"eval_validation_dolma_runtime": 111.0986,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 2244
},
{
"epoch": 0.31,
"eval_validation_leggepertutti_loss": 1.2337557077407837,
"eval_validation_leggepertutti_runtime": 32.2593,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 2244
},
{
"epoch": 0.31,
"eval_validation_stack_loss": 0.6590169072151184,
"eval_validation_stack_runtime": 150.2183,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 2244
},
{
"epoch": 0.34,
"grad_norm": 2.96875,
"learning_rate": 1e-05,
"loss": 1.2267,
"step": 2431
},
{
"epoch": 0.34,
"eval_validation_loss": 0.8118987083435059,
"eval_validation_runtime": 194.1905,
"eval_validation_samples_per_second": 1.457,
"eval_validation_steps_per_second": 0.731,
"step": 2431
},
{
"epoch": 0.34,
"eval_validation_privacy_sources_loss": 0.8118987083435059,
"eval_validation_privacy_sources_runtime": 194.1644,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.731,
"step": 2431
},
{
"epoch": 0.34,
"eval_validation_agenda_digitale_loss": 1.4531759023666382,
"eval_validation_agenda_digitale_runtime": 174.2809,
"eval_validation_agenda_digitale_samples_per_second": 1.457,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 2431
},
{
"epoch": 0.34,
"eval_validation_legal_articles_loss": 1.3473464250564575,
"eval_validation_legal_articles_runtime": 280.6295,
"eval_validation_legal_articles_samples_per_second": 1.457,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 2431
},
{
"epoch": 0.34,
"eval_validation_dolma_loss": 1.8490244150161743,
"eval_validation_dolma_runtime": 111.164,
"eval_validation_dolma_samples_per_second": 1.457,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 2431
},
{
"epoch": 0.34,
"eval_validation_leggepertutti_loss": 1.2278121709823608,
"eval_validation_leggepertutti_runtime": 32.2528,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 2431
},
{
"epoch": 0.34,
"eval_validation_stack_loss": 0.6574946641921997,
"eval_validation_stack_runtime": 150.229,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 2431
},
{
"epoch": 0.37,
"grad_norm": 7.125,
"learning_rate": 1e-05,
"loss": 1.228,
"step": 2618
},
{
"epoch": 0.37,
"eval_validation_loss": 0.8083770275115967,
"eval_validation_runtime": 194.1727,
"eval_validation_samples_per_second": 1.457,
"eval_validation_steps_per_second": 0.731,
"step": 2618
},
{
"epoch": 0.37,
"eval_validation_privacy_sources_loss": 0.8083770275115967,
"eval_validation_privacy_sources_runtime": 194.109,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 2618
},
{
"epoch": 0.37,
"eval_validation_agenda_digitale_loss": 1.4517344236373901,
"eval_validation_agenda_digitale_runtime": 174.2026,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 2618
},
{
"epoch": 0.37,
"eval_validation_legal_articles_loss": 1.3457854986190796,
"eval_validation_legal_articles_runtime": 280.5077,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 2618
},
{
"epoch": 0.37,
"eval_validation_dolma_loss": 1.8457980155944824,
"eval_validation_dolma_runtime": 111.0983,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 2618
},
{
"epoch": 0.37,
"eval_validation_leggepertutti_loss": 1.2257617712020874,
"eval_validation_leggepertutti_runtime": 32.2598,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 2618
},
{
"epoch": 0.37,
"eval_validation_stack_loss": 0.6570916175842285,
"eval_validation_stack_runtime": 150.252,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 2618
},
{
"epoch": 0.39,
"grad_norm": 2.953125,
"learning_rate": 1e-05,
"loss": 1.2256,
"step": 2805
},
{
"epoch": 0.39,
"eval_validation_loss": 0.8021377325057983,
"eval_validation_runtime": 194.2469,
"eval_validation_samples_per_second": 1.457,
"eval_validation_steps_per_second": 0.731,
"step": 2805
},
{
"epoch": 0.39,
"eval_validation_privacy_sources_loss": 0.8021377325057983,
"eval_validation_privacy_sources_runtime": 194.4649,
"eval_validation_privacy_sources_samples_per_second": 1.455,
"eval_validation_privacy_sources_steps_per_second": 0.73,
"step": 2805
},
{
"epoch": 0.39,
"eval_validation_agenda_digitale_loss": 1.449271559715271,
"eval_validation_agenda_digitale_runtime": 174.4445,
"eval_validation_agenda_digitale_samples_per_second": 1.456,
"eval_validation_agenda_digitale_steps_per_second": 0.728,
"step": 2805
},
{
"epoch": 0.39,
"eval_validation_legal_articles_loss": 1.3434243202209473,
"eval_validation_legal_articles_runtime": 281.0216,
"eval_validation_legal_articles_samples_per_second": 1.455,
"eval_validation_legal_articles_steps_per_second": 0.729,
"step": 2805
},
{
"epoch": 0.39,
"eval_validation_dolma_loss": 1.8447160720825195,
"eval_validation_dolma_runtime": 111.2369,
"eval_validation_dolma_samples_per_second": 1.456,
"eval_validation_dolma_steps_per_second": 0.728,
"step": 2805
},
{
"epoch": 0.39,
"eval_validation_leggepertutti_loss": 1.225563883781433,
"eval_validation_leggepertutti_runtime": 32.3051,
"eval_validation_leggepertutti_samples_per_second": 1.455,
"eval_validation_leggepertutti_steps_per_second": 0.743,
"step": 2805
},
{
"epoch": 0.39,
"eval_validation_stack_loss": 0.6570674180984497,
"eval_validation_stack_runtime": 150.4367,
"eval_validation_stack_samples_per_second": 1.456,
"eval_validation_stack_steps_per_second": 0.731,
"step": 2805
},
{
"epoch": 0.42,
"grad_norm": 3.28125,
"learning_rate": 1e-05,
"loss": 1.2136,
"step": 2992
},
{
"epoch": 0.42,
"eval_validation_loss": 0.8003722429275513,
"eval_validation_runtime": 194.1597,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.731,
"step": 2992
},
{
"epoch": 0.42,
"eval_validation_privacy_sources_loss": 0.8003722429275513,
"eval_validation_privacy_sources_runtime": 194.2144,
"eval_validation_privacy_sources_samples_per_second": 1.457,
"eval_validation_privacy_sources_steps_per_second": 0.731,
"step": 2992
},
{
"epoch": 0.42,
"eval_validation_agenda_digitale_loss": 1.445157766342163,
"eval_validation_agenda_digitale_runtime": 174.3593,
"eval_validation_agenda_digitale_samples_per_second": 1.457,
"eval_validation_agenda_digitale_steps_per_second": 0.728,
"step": 2992
},
{
"epoch": 0.42,
"eval_validation_legal_articles_loss": 1.340084433555603,
"eval_validation_legal_articles_runtime": 280.628,
"eval_validation_legal_articles_samples_per_second": 1.457,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 2992
},
{
"epoch": 0.42,
"eval_validation_dolma_loss": 1.8441739082336426,
"eval_validation_dolma_runtime": 111.1155,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 2992
},
{
"epoch": 0.42,
"eval_validation_leggepertutti_loss": 1.2245877981185913,
"eval_validation_leggepertutti_runtime": 32.2646,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 2992
},
{
"epoch": 0.42,
"eval_validation_stack_loss": 0.657370388507843,
"eval_validation_stack_runtime": 150.3713,
"eval_validation_stack_samples_per_second": 1.456,
"eval_validation_stack_steps_per_second": 0.732,
"step": 2992
},
{
"epoch": 0.44,
"grad_norm": 2.8125,
"learning_rate": 1e-05,
"loss": 1.2216,
"step": 3179
},
{
"epoch": 0.44,
"eval_validation_loss": 0.7953833341598511,
"eval_validation_runtime": 194.5265,
"eval_validation_samples_per_second": 1.455,
"eval_validation_steps_per_second": 0.73,
"step": 3179
},
{
"epoch": 0.44,
"eval_validation_privacy_sources_loss": 0.7953833341598511,
"eval_validation_privacy_sources_runtime": 194.6007,
"eval_validation_privacy_sources_samples_per_second": 1.454,
"eval_validation_privacy_sources_steps_per_second": 0.73,
"step": 3179
},
{
"epoch": 0.44,
"eval_validation_agenda_digitale_loss": 1.4409934282302856,
"eval_validation_agenda_digitale_runtime": 174.5993,
"eval_validation_agenda_digitale_samples_per_second": 1.455,
"eval_validation_agenda_digitale_steps_per_second": 0.727,
"step": 3179
},
{
"epoch": 0.44,
"eval_validation_legal_articles_loss": 1.3360470533370972,
"eval_validation_legal_articles_runtime": 281.1454,
"eval_validation_legal_articles_samples_per_second": 1.455,
"eval_validation_legal_articles_steps_per_second": 0.729,
"step": 3179
},
{
"epoch": 0.44,
"eval_validation_dolma_loss": 1.8454322814941406,
"eval_validation_dolma_runtime": 111.309,
"eval_validation_dolma_samples_per_second": 1.455,
"eval_validation_dolma_steps_per_second": 0.728,
"step": 3179
},
{
"epoch": 0.44,
"eval_validation_leggepertutti_loss": 1.2207506895065308,
"eval_validation_leggepertutti_runtime": 32.3094,
"eval_validation_leggepertutti_samples_per_second": 1.455,
"eval_validation_leggepertutti_steps_per_second": 0.743,
"step": 3179
},
{
"epoch": 0.44,
"eval_validation_stack_loss": 0.6579957604408264,
"eval_validation_stack_runtime": 150.3599,
"eval_validation_stack_samples_per_second": 1.457,
"eval_validation_stack_steps_per_second": 0.732,
"step": 3179
},
{
"epoch": 0.47,
"grad_norm": 3.3125,
"learning_rate": 1e-05,
"loss": 1.2183,
"step": 3366
},
{
"epoch": 0.47,
"eval_validation_loss": 0.7924418449401855,
"eval_validation_runtime": 194.1975,
"eval_validation_samples_per_second": 1.457,
"eval_validation_steps_per_second": 0.731,
"step": 3366
},
{
"epoch": 0.47,
"eval_validation_privacy_sources_loss": 0.7924418449401855,
"eval_validation_privacy_sources_runtime": 194.1952,
"eval_validation_privacy_sources_samples_per_second": 1.457,
"eval_validation_privacy_sources_steps_per_second": 0.731,
"step": 3366
},
{
"epoch": 0.47,
"eval_validation_agenda_digitale_loss": 1.4390149116516113,
"eval_validation_agenda_digitale_runtime": 174.2539,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 3366
},
{
"epoch": 0.47,
"eval_validation_legal_articles_loss": 1.3332501649856567,
"eval_validation_legal_articles_runtime": 280.6326,
"eval_validation_legal_articles_samples_per_second": 1.457,
"eval_validation_legal_articles_steps_per_second": 0.73,
"step": 3366
},
{
"epoch": 0.47,
"eval_validation_dolma_loss": 1.848328709602356,
"eval_validation_dolma_runtime": 111.0824,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 3366
},
{
"epoch": 0.47,
"eval_validation_leggepertutti_loss": 1.2147657871246338,
"eval_validation_leggepertutti_runtime": 32.2807,
"eval_validation_leggepertutti_samples_per_second": 1.456,
"eval_validation_leggepertutti_steps_per_second": 0.743,
"step": 3366
},
{
"epoch": 0.47,
"eval_validation_stack_loss": 0.6573349833488464,
"eval_validation_stack_runtime": 150.3498,
"eval_validation_stack_samples_per_second": 1.457,
"eval_validation_stack_steps_per_second": 0.732,
"step": 3366
},
{
"epoch": 0.5,
"grad_norm": 3.140625,
"learning_rate": 1e-05,
"loss": 1.217,
"step": 3553
},
{
"epoch": 0.5,
"eval_validation_loss": 0.7858894467353821,
"eval_validation_runtime": 194.4212,
"eval_validation_samples_per_second": 1.456,
"eval_validation_steps_per_second": 0.73,
"step": 3553
},
{
"epoch": 0.5,
"eval_validation_privacy_sources_loss": 0.7858894467353821,
"eval_validation_privacy_sources_runtime": 194.417,
"eval_validation_privacy_sources_samples_per_second": 1.456,
"eval_validation_privacy_sources_steps_per_second": 0.73,
"step": 3553
},
{
"epoch": 0.5,
"eval_validation_agenda_digitale_loss": 1.4353201389312744,
"eval_validation_agenda_digitale_runtime": 174.2645,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 3553
},
{
"epoch": 0.5,
"eval_validation_legal_articles_loss": 1.329630732536316,
"eval_validation_legal_articles_runtime": 280.8801,
"eval_validation_legal_articles_samples_per_second": 1.456,
"eval_validation_legal_articles_steps_per_second": 0.73,
"step": 3553
},
{
"epoch": 0.5,
"eval_validation_dolma_loss": 1.847051978111267,
"eval_validation_dolma_runtime": 111.2168,
"eval_validation_dolma_samples_per_second": 1.457,
"eval_validation_dolma_steps_per_second": 0.728,
"step": 3553
},
{
"epoch": 0.5,
"eval_validation_leggepertutti_loss": 1.2128466367721558,
"eval_validation_leggepertutti_runtime": 32.2731,
"eval_validation_leggepertutti_samples_per_second": 1.456,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 3553
},
{
"epoch": 0.5,
"eval_validation_stack_loss": 0.660595715045929,
"eval_validation_stack_runtime": 150.4122,
"eval_validation_stack_samples_per_second": 1.456,
"eval_validation_stack_steps_per_second": 0.731,
"step": 3553
},
{
"epoch": 0.52,
"grad_norm": 4.59375,
"learning_rate": 1e-05,
"loss": 1.2025,
"step": 3740
},
{
"epoch": 0.52,
"eval_validation_loss": 0.7821725606918335,
"eval_validation_runtime": 194.102,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 3740
},
{
"epoch": 0.52,
"eval_validation_privacy_sources_loss": 0.7821725606918335,
"eval_validation_privacy_sources_runtime": 194.0576,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 3740
},
{
"epoch": 0.52,
"eval_validation_agenda_digitale_loss": 1.4339957237243652,
"eval_validation_agenda_digitale_runtime": 174.1039,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 3740
},
{
"epoch": 0.52,
"eval_validation_legal_articles_loss": 1.3280164003372192,
"eval_validation_legal_articles_runtime": 280.5513,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 3740
},
{
"epoch": 0.52,
"eval_validation_dolma_loss": 1.84745454788208,
"eval_validation_dolma_runtime": 111.0532,
"eval_validation_dolma_samples_per_second": 1.459,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 3740
},
{
"epoch": 0.52,
"eval_validation_leggepertutti_loss": 1.2140834331512451,
"eval_validation_leggepertutti_runtime": 32.2501,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 3740
},
{
"epoch": 0.52,
"eval_validation_stack_loss": 0.6579498052597046,
"eval_validation_stack_runtime": 150.177,
"eval_validation_stack_samples_per_second": 1.458,
"eval_validation_stack_steps_per_second": 0.732,
"step": 3740
},
{
"epoch": 0.55,
"grad_norm": 2.90625,
"learning_rate": 1e-05,
"loss": 1.1892,
"step": 3927
},
{
"epoch": 0.55,
"eval_validation_loss": 0.778718888759613,
"eval_validation_runtime": 194.0252,
"eval_validation_samples_per_second": 1.459,
"eval_validation_steps_per_second": 0.732,
"step": 3927
},
{
"epoch": 0.55,
"eval_validation_privacy_sources_loss": 0.778718888759613,
"eval_validation_privacy_sources_runtime": 194.0094,
"eval_validation_privacy_sources_samples_per_second": 1.459,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 3927
},
{
"epoch": 0.55,
"eval_validation_agenda_digitale_loss": 1.4309070110321045,
"eval_validation_agenda_digitale_runtime": 174.153,
"eval_validation_agenda_digitale_samples_per_second": 1.458,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 3927
},
{
"epoch": 0.55,
"eval_validation_legal_articles_loss": 1.3250170946121216,
"eval_validation_legal_articles_runtime": 280.4271,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 3927
},
{
"epoch": 0.55,
"eval_validation_dolma_loss": 1.8441972732543945,
"eval_validation_dolma_runtime": 111.0278,
"eval_validation_dolma_samples_per_second": 1.459,
"eval_validation_dolma_steps_per_second": 0.73,
"step": 3927
},
{
"epoch": 0.55,
"eval_validation_leggepertutti_loss": 1.2091401815414429,
"eval_validation_leggepertutti_runtime": 32.2467,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 3927
},
{
"epoch": 0.55,
"eval_validation_stack_loss": 0.6560612916946411,
"eval_validation_stack_runtime": 150.1302,
"eval_validation_stack_samples_per_second": 1.459,
"eval_validation_stack_steps_per_second": 0.733,
"step": 3927
},
{
"epoch": 0.57,
"grad_norm": 2.890625,
"learning_rate": 1e-05,
"loss": 1.1884,
"step": 4114
},
{
"epoch": 0.57,
"eval_validation_loss": 0.775921106338501,
"eval_validation_runtime": 194.1411,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.731,
"step": 4114
},
{
"epoch": 0.57,
"eval_validation_privacy_sources_loss": 0.775921106338501,
"eval_validation_privacy_sources_runtime": 194.0466,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 4114
},
{
"epoch": 0.57,
"eval_validation_agenda_digitale_loss": 1.4286702871322632,
"eval_validation_agenda_digitale_runtime": 174.1174,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 4114
},
{
"epoch": 0.57,
"eval_validation_legal_articles_loss": 1.3244529962539673,
"eval_validation_legal_articles_runtime": 280.4889,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 4114
},
{
"epoch": 0.57,
"eval_validation_dolma_loss": 1.8429710865020752,
"eval_validation_dolma_runtime": 111.0663,
"eval_validation_dolma_samples_per_second": 1.459,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 4114
},
{
"epoch": 0.57,
"eval_validation_leggepertutti_loss": 1.2103228569030762,
"eval_validation_leggepertutti_runtime": 32.2408,
"eval_validation_leggepertutti_samples_per_second": 1.458,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 4114
},
{
"epoch": 0.57,
"eval_validation_stack_loss": 0.6574613451957703,
"eval_validation_stack_runtime": 150.2725,
"eval_validation_stack_samples_per_second": 1.457,
"eval_validation_stack_steps_per_second": 0.732,
"step": 4114
},
{
"epoch": 0.6,
"grad_norm": 3.328125,
"learning_rate": 1e-05,
"loss": 1.216,
"step": 4301
},
{
"epoch": 0.6,
"eval_validation_loss": 0.7726068496704102,
"eval_validation_runtime": 194.1083,
"eval_validation_samples_per_second": 1.458,
"eval_validation_steps_per_second": 0.732,
"step": 4301
},
{
"epoch": 0.6,
"eval_validation_privacy_sources_loss": 0.7726068496704102,
"eval_validation_privacy_sources_runtime": 194.0844,
"eval_validation_privacy_sources_samples_per_second": 1.458,
"eval_validation_privacy_sources_steps_per_second": 0.732,
"step": 4301
},
{
"epoch": 0.6,
"eval_validation_agenda_digitale_loss": 1.4294990301132202,
"eval_validation_agenda_digitale_runtime": 174.0978,
"eval_validation_agenda_digitale_samples_per_second": 1.459,
"eval_validation_agenda_digitale_steps_per_second": 0.729,
"step": 4301
},
{
"epoch": 0.6,
"eval_validation_legal_articles_loss": 1.3229315280914307,
"eval_validation_legal_articles_runtime": 280.5081,
"eval_validation_legal_articles_samples_per_second": 1.458,
"eval_validation_legal_articles_steps_per_second": 0.731,
"step": 4301
},
{
"epoch": 0.6,
"eval_validation_dolma_loss": 1.844489574432373,
"eval_validation_dolma_runtime": 111.0784,
"eval_validation_dolma_samples_per_second": 1.458,
"eval_validation_dolma_steps_per_second": 0.729,
"step": 4301
},
{
"epoch": 0.6,
"eval_validation_leggepertutti_loss": 1.2054811716079712,
"eval_validation_leggepertutti_runtime": 32.2642,
"eval_validation_leggepertutti_samples_per_second": 1.457,
"eval_validation_leggepertutti_steps_per_second": 0.744,
"step": 4301
},
{
"epoch": 0.6,
"eval_validation_stack_loss": 0.657507061958313,
"eval_validation_stack_runtime": 150.2647,
"eval_validation_stack_samples_per_second": 1.457,
"eval_validation_stack_steps_per_second": 0.732,
"step": 4301
}
],
"logging_steps": 187,
"max_steps": 14324,
"num_input_tokens_seen": 0,
"num_train_epochs": 2,
"save_steps": 187,
"total_flos": 2.4051409805295747e+19,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}