ddpm-mnist-32 / run_args.json
xkronosx's picture
Iteration 50000
48d7824 verified
{"model": "UNet", "dataset": "mnist", "save_folder": "/network/scratch/l/luca.scimeca/gfn_generated_results/train_prior_mnist_unet_0/", "load_path": "./../models/pretrained", "data_path": "/network/scratch/l/luca.scimeca/data/", "prior_training_mode": "dpm", "pretrain_models": false, "replace": false, "show_figures": false, "save_figures": true, "save_model_weights": false, "plot_batch_size": 16, "exp_name": "train_prior_mnist_unet", "channels": 1, "workers": 8, "epochs": 200000, "algo": "mle", "batch_size": 64, "test_batch_size": 16, "lr": 0.0001, "lr_logZ": 0.1, "z_weight_decay": 0, "traj_length": 200, "sampling_length": 100, "learning_cutoff": 0.1, "learn_var": false, "loss_type": "l2", "accumulate_gradient_every": 1, "detach_freq": 0.0, "back_and_forth": false, "bf_length": 50, "drift_only": false, "drift_burn_in": 1000, "mixed_precision": false, "checkpointing": true, "multi_class_index": 0, "finetune_class": [0], "class_name": "not_specified", "classifier_model": "cnn", "classifier_depth": 18, "classifier_pretrained": false, "langevin": false, "lgv_clip": 100.0, "lgv_clipping": false, "lgv_t_dim": 64, "lgv_hidden_dim": 256, "lgv_num_layers": 3, "lgv_zero_init": false, "compute_fid": false, "num_fid_samples": 50000, "lora": false, "rank": 32, "push_to_hub": 1, "notes": "", "seed": 123, "use_cuda": true, "device": "cuda", "system": "linux", "supported_datasets": ["mnist", "cifar10", "UTKFace", "CelebA"], "image_size": 32, "noise_size": 32, "num_classes": 10, "block_out_channels": [32, 64, 128, 256]}