{
  "seed": 1,
  "decoder": {
    "unets": [
      {
        "dim": 416,
        "cond_dim": 512,
        "image_embed_dim": 768,
        "channels": 3,
        "dim_mults": [1, 2, 3, 4],
        "num_resnet_blocks": 4,
        "attn_heads": 8,
        "attn_dim_head": 64,
        "sparse_attn": true
      }
    ],
    "image_sizes": [64],
    "channels": 3,
    "timesteps": 1000,
    "loss_type": "l2",
    "beta_schedule": ["cosine"],
    "learned_variance": true
  },
  "data": {
    "webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion-aesthetic/data/laion2B-en-aesthetic/{}.tar -",
    "embeddings_url": "s3://s-datasets/laion-aesthetic/ordered_embeddings/",
    "num_workers": 4,
    "batch_size": 8,
    "start_shard": 0,
    "end_shard": 5247,
    "shard_width": 5,
    "index_width": 4,
    "splits": {
      "train": 0.75,
      "val": 0.15,
      "test": 0.1
    },
    "shuffle_train": false,
    "resample_train": true,
    "preprocessing": {
      "RandomResizedCrop": {
        "size": [64, 64],
        "scale": [0.75, 1.0],
        "ratio": [1.0, 1.0]
      },
      "ToTensor": true
    }
  },
  "train": {
    "epochs": 40,
    "lr": 5e-5,
    "wd": 0.01,
    "max_grad_norm": 0.5,
    "save_every_n_samples": 200000,
    "n_sample_images": 10,
    "device": "cuda:0",
    "epoch_samples": 2000000,
    "validation_samples": 100000,
    "use_ema": true,
    "ema_beta": 0.99,
    "ema_param_or_buffer_names_no_ema": ["_dummy"],
    "save_all": false,
    "save_latest": true,
    "save_best": true,
    "unet_training_mask": [true]
  },
  "evaluate": {
    "n_evaluation_samples": 30,
    "FID": {
      "feature": 64
    },
    "LPIPS": {
      "net_type": "vgg",
      "reduction": "mean"
    }
  },
  "tracker": {
    "tracker_type": "wandb",
    "data_path": ".tracker-data",
    "verbose": true,
    "wandb_entity": "nousr_laion",
    "wandb_project": "dalle2_train_decoder"
  },
  "load": {
    "source": "wandb",
    "run_path": "nousr_laion/dalle2_train_decoder/3rrsm5gy",
    "file_path": "best.pth",
    "resume": false
  }
}