{ "best_metric": 25.1709, "best_model_checkpoint": "my-model/checkpoint-1528", "epoch": 2.0, "eval_steps": 500, "global_step": 3056, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.32722513089005234, "grad_norm": 0.9616150856018066, "learning_rate": 4.454624781849913e-05, "loss": 0.0158, "step": 500 }, { "epoch": 0.6544502617801047, "grad_norm": 2.0808584690093994, "learning_rate": 3.909249563699826e-05, "loss": 0.0223, "step": 1000 }, { "epoch": 0.981675392670157, "grad_norm": 1.145504117012024, "learning_rate": 3.3638743455497386e-05, "loss": 0.0271, "step": 1500 }, { "epoch": 1.0, "eval_loss": 5.483295917510986, "eval_rouge1": 25.1709, "eval_rouge2": 10.0024, "eval_rougeL": 21.9926, "eval_runtime": 372.8877, "eval_samples_per_second": 5.886, "eval_steps_per_second": 0.59, "step": 1528 }, { "epoch": 1.3089005235602094, "grad_norm": 3.2998411655426025, "learning_rate": 2.8184991273996508e-05, "loss": 0.0416, "step": 2000 }, { "epoch": 1.6361256544502618, "grad_norm": 1.5071967840194702, "learning_rate": 2.273123909249564e-05, "loss": 0.0513, "step": 2500 }, { "epoch": 1.9633507853403143, "grad_norm": 4.118706226348877, "learning_rate": 1.7277486910994763e-05, "loss": 0.0687, "step": 3000 }, { "epoch": 2.0, "eval_loss": 5.419973373413086, "eval_rouge1": 24.9529, "eval_rouge2": 9.9221, "eval_rougeL": 21.6944, "eval_runtime": 386.7275, "eval_samples_per_second": 5.676, "eval_steps_per_second": 0.569, "step": 3056 } ], "logging_steps": 500, "max_steps": 4584, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1.4662889498529792e+16, "train_batch_size": 10, "trial_name": null, "trial_params": null }