---
# Training-run configuration: a flat mapping of option name -> value.
# Key names (project_name: muse_maskgit, vae_path, resume_path, t5_name)
# suggest a Muse / MaskGIT training run -- NOTE(review): confirm against the
# script that loads this file; the consumer is not visible from here.
#
# One entry per line: a plain scalar may not contain ": ", so packing several
# "key: value" pairs onto a single line does not parse as a mapping.
#
# Windows paths are single-quoted so the backslashes are taken literally.

total_params: 66889174
image_size: 128
num_tokens: 8192
# NOTE(review): -1 looks like a "no step limit" sentinel (num_epochs is set
# alongside it) -- confirm with the consuming script.
num_train_steps: -1
num_epochs: 20
dim: 64
channels: 4
batch_size: 1
lr: 0.0001
gradient_accumulation_steps: 100
save_results_every: 500
save_model_every: 5000
vq_codebook_size: 8192
# NOTE(review): identical to vq_codebook_size -- confirm this is intentional
# and matches the checkpoint referenced by vae_path.
vq_codebook_dim: 8192
lr_scheduler: cosine_with_restarts
lr_warmup_steps: 100
seq_len: 8192
depth: 4
dim_head: 64
heads: 8
ff_mult: 4
t5_name: t5-small
# Quoted on purpose: a bare `no` is read as boolean false by YAML 1.1 parsers.
mixed_precision: 'no'
cond_image_size: null
# Presumably several prompts separated by "|" -- verify against the consumer.
validation_prompt: 'a girl|a cat|a dog'
timesteps: 18
optimizer: Adam
only_save_last_checkpoint: false
validation_image_scale: 1.0
no_center_crop: false
no_flip: false
dataset_save_path: 'E:\cached_datasets\INE2'
clear_previous_experiments: false
max_grad_norm: null
seed: 42
valid_frac: 0.05
use_ema: false
ema_beta: 0.995
ema_update_after_step: 1
ema_update_every: 1
apply_grad_penalty_every: 4
image_column: image
caption_column: caption
log_with: wandb
use_8bit_adam: false
results_dir: 'results\Muse-v0.10'
logging_dir: null
vae_path: 'results\Muse-v0.10\vae.1456000.pt'
dataset_name: null
hf_split_name: null
streaming: false
train_data_dir: 'E:\dataset'
checkpoint_limit: null
cond_drop_prob: 0.5
scheduler_power: 1.0
num_cycles: 200
resume_path: 'results\Muse-v0.10\maskgit.143000.pt'
taming_model_path: null
taming_config_path: null
weight_decay: 0.0001
cache_path: null
no_cache: true
link: false
latest_checkpoint: true
do_not_save_config: false
use_l2_recon_loss: false
debug: false
config_path: null
attention_type: ein
random_crop: true
project_name: muse_maskgit
run_name: null
wandb_user: sygil
layers: 4
discr_layers: 4