---
# Flat key/value run configuration, one setting per line.
# NOTE(review): key names suggest a VQ image-autoencoder training run for the
# `muse_vae` project; exact semantics are defined by the consuming script,
# which is not visible here -- confirm before changing values.

total_params: 5930596
image_size: 256
num_train_steps: -1
num_epochs: 10
batch_size: 1
lr: 0.0001
lr_warmup_steps: 10
lr_scheduler: cosine_with_restarts
gradient_accumulation_steps: 2000
save_results_every: 500
save_model_every: 5000
dim: 32
vq_codebook_size: 128
vq_codebook_dim: 128
seq_len: 1024
channels: 3
layers: 4
discr_layers: 4
scheduler_power: 8.0
num_cycles: 800
only_save_last_checkpoint: false
validation_image_scale: 1.0
no_center_crop: false
no_flip: false
random_crop: true
# Path values are single-quoted so drive-letter colons and backslashes are
# always read as literal characters.
dataset_save_path: 'H:/cached_datasets/INE'
clear_previous_experiments: false
max_grad_norm: null
discr_max_grad_norm: null
seed: 42
valid_frac: 0.05
use_ema: false
ema_beta: 0.995
ema_update_after_step: 1
ema_update_every: 1
apply_grad_penalty_every: 4
image_column: image
caption_column: caption
log_with: wandb
# Quoted on purpose: a bare `no` is parsed as boolean false by YAML 1.1 loaders.
mixed_precision: 'no'
use_8bit_adam: false
results_dir: 'results\Muse-v0.12_test'
logging_dir: null
resume_path: 'results\Muse-v0.12_test\vae.4515000.pt'
dataset_name: null
streaming: false
train_data_dir: 'H:/dataset'
checkpoint_limit: null
cond_drop_prob: 0.5
taming_model_path: null
taming_config_path: null
optimizer: Adam
weight_decay: 0.001
cache_path: null
no_cache: true
latest_checkpoint: true
do_not_save_config: false
use_l2_recon_loss: false
debug: false
config_path: null
validation_folder_at_end_of_epoch: 'samples/validation'
exclude_folders: null
webdataset: null
project_name: muse_vae
run_name: null
wandb_user: null
hf_split_name: train