---
# Flat mapping of training-run settings, one key per line.
# Keys are kept in alphabetical order so regenerated files diff cleanly.
# NOTE(review): the script that consumes this file is not visible here; the
# key names suggest a text-to-image fine-tuning run — confirm against the
# consumer before relying on any individual setting's meaning.
adam_beta1: 0.9
adam_beta2: 0.999
adam_epsilon: 1.0e-08
adam_weight_decay: 0.01
cache_dir: null
caption_column: text
center_crop: true
dataset_config_name: null
dataset_name: lambdalabs/pokemon-blip-captions
gradient_accumulation_steps: 4
gradient_checkpointing: true
hub_model_id: null
hub_token: null
image_column: image
learning_rate: 1.0e-05
local_rank: -1
logging_dir: logs
lr_scheduler: constant
lr_warmup_steps: 0
max_grad_norm: 1.0
max_train_samples: null
# NOTE(review): both max_train_steps and num_train_epochs are set; which one
# actually bounds the run depends on the consumer — verify.
max_train_steps: 15000
mixed_precision: null
num_train_epochs: 72
output_dir: sd-pokemon-distil-model-loss-teacher-2
pretrained_model_name_or_path: lambdalabs/sd-pokemon-diffusers
push_to_hub: false
random_flip: true
report_to: tensorboard
resolution: 512
scale_lr: false
seed: null
train_batch_size: 1
train_data_dir: null
use_8bit_adam: false
use_ema: true