---
# Training run configuration: a flat mapping with one setting per line.
# NOTE(review): the per-key notes below are inferred from the key names only;
# confirm each against the code that consumes this file.

# Optimization settings.
learning_rate: 5.0e-05
nb_training_epochs: 10

# Data loading. NOTE(review): 0 workers presumably means loading happens in
# the main process -- confirm.
dataloader_nb_workers: 0
batch_size: 16

# Explicit null: no seed value is provided by this file.
seed: null

# NOTE(review): 1 presumably means no gradient accumulation -- confirm.
gradient_accumulation_steps: 1

# Metric settings.
do_metrics_in_training: false
# NOTE(review): presumably the metric watched for learning-rate
# adjustments -- confirm.
metric_to_track_lr: loss

# Checkpointing settings.
# NOTE(review): unit of the period (epochs vs. steps) is not visible
# here -- confirm.
checkpoint_period: 1
checkpoint_metric: loss
# NOTE(review): true presumably means a lower checkpoint_metric is
# better -- confirm.
minimize_checkpoint_metric: true