camenduru committed on
Commit
3295322
1 Parent(s): 0523f79

thanks to advimman ❤

Browse files
Files changed (35) hide show
  1. big-lama-with-discr/config.yaml +159 -0
  2. big-lama-with-discr/models/best.ckpt +3 -0
  3. big-lama/config.yaml +157 -0
  4. big-lama/models/best.ckpt +3 -0
  5. lama-celeba-hq-pl-abl/lama-no-pl/config.yaml +122 -0
  6. lama-celeba-hq-pl-abl/lama-no-pl/models/best.ckpt +3 -0
  7. lama-celeba-hq/ lama-regular/config.yaml +123 -0
  8. lama-celeba-hq/ lama-regular/models/best.ckpt +3 -0
  9. lama-celeba-hq/lama-deep/config.yaml +123 -0
  10. lama-celeba-hq/lama-deep/models/best.ckpt +3 -0
  11. lama-celeba-hq/lama-dilated/config.yaml +127 -0
  12. lama-celeba-hq/lama-dilated/models/best.ckpt +3 -0
  13. lama-celeba-hq/lama-fourier-shallow/config.yaml +134 -0
  14. lama-celeba-hq/lama-fourier-shallow/models/best.ckpt +3 -0
  15. lama-celeba-hq/lama-fourier/config.yaml +134 -0
  16. lama-celeba-hq/lama-fourier/models/best.ckpt +3 -0
  17. lama-celeba-hq/lama_small_train_masks/config.yaml +123 -0
  18. lama-celeba-hq/lama_small_train_masks/models/best.ckpt +3 -0
  19. lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/config.yaml +130 -0
  20. lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/models/best.ckpt +3 -0
  21. lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/config.yaml +130 -0
  22. lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/models/best.ckpt +3 -0
  23. lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/config.yaml +130 -0
  24. lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/models/best.ckpt +3 -0
  25. lama-places/big-lama-regular/config.yaml +129 -0
  26. lama-places/big-lama-regular/models/best.ckpt +3 -0
  27. lama-places/lama-dilated/config.yaml +133 -0
  28. lama-places/lama-dilated/models/best.ckpt +3 -0
  29. lama-places/lama-fourier/config.yaml +142 -0
  30. lama-places/lama-fourier/models/best.ckpt +3 -0
  31. lama-places/lama-fourier/models/last.ckpt +3 -0
  32. lama-places/lama-regular/config.yaml +130 -0
  33. lama-places/lama-regular/models/best.ckpt +3 -0
  34. lama-places/lama_small_train_masks/config.yaml +130 -0
  35. lama-places/lama_small_train_masks/models/best.ckpt +3 -0
big-lama-with-discr/config.yaml ADDED
@@ -0,0 +1,159 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: b18_ffc075_batch8x15
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ depth_pl:
25
+ weight: 0
26
+ use_features: true
27
+ optimizers:
28
+ generator:
29
+ kind: adam
30
+ lr: 0.001
31
+ discriminator:
32
+ kind: adam
33
+ lr: 0.0001
34
+ visualizer:
35
+ key_order:
36
+ - image
37
+ - predicted_image
38
+ - discr_output_fake
39
+ - discr_output_real
40
+ - inpainted
41
+ rescale_keys:
42
+ - discr_output_fake
43
+ - discr_output_real
44
+ kind: directory
45
+ outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-04-30_14-41-12_train_simple_pix2pix2_gap_sdpl_novgg_large_b18_ffc075_batch8x15/samples
46
+ location:
47
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_large
48
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
49
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
50
+ data:
51
+ batch_size: 15
52
+ val_batch_size: 2
53
+ num_workers: 3
54
+ train:
55
+ indir: ${location.data_root_dir}/train
56
+ out_size: 256
57
+ mask_gen_kwargs:
58
+ irregular_proba: 1
59
+ irregular_kwargs:
60
+ max_angle: 4
61
+ max_len: 200
62
+ max_width: 100
63
+ max_times: 5
64
+ min_times: 1
65
+ box_proba: 1
66
+ box_kwargs:
67
+ margin: 10
68
+ bbox_min_size: 30
69
+ bbox_max_size: 150
70
+ max_times: 3
71
+ min_times: 1
72
+ segm_proba: 0
73
+ segm_kwargs:
74
+ confidence_threshold: 0.5
75
+ max_object_area: 0.5
76
+ min_mask_area: 0.07
77
+ downsample_levels: 6
78
+ num_variants_per_mask: 1
79
+ rigidness_mode: 1
80
+ max_foreground_coverage: 0.3
81
+ max_foreground_intersection: 0.7
82
+ max_mask_intersection: 0.1
83
+ max_hidden_area: 0.1
84
+ max_scale_change: 0.25
85
+ horizontal_flip: true
86
+ max_vertical_shift: 0.2
87
+ position_shuffle: true
88
+ transform_variant: distortions
89
+ dataloader_kwargs:
90
+ batch_size: ${data.batch_size}
91
+ shuffle: true
92
+ num_workers: ${data.num_workers}
93
+ val:
94
+ indir: ${location.data_root_dir}/val
95
+ img_suffix: .png
96
+ dataloader_kwargs:
97
+ batch_size: ${data.val_batch_size}
98
+ shuffle: false
99
+ num_workers: ${data.num_workers}
100
+ visual_test:
101
+ indir: ${location.data_root_dir}/korean_test
102
+ img_suffix: _input.png
103
+ pad_out_to_modulo: 32
104
+ dataloader_kwargs:
105
+ batch_size: 1
106
+ shuffle: false
107
+ num_workers: ${data.num_workers}
108
+ generator:
109
+ kind: ffc_resnet
110
+ input_nc: 4
111
+ output_nc: 3
112
+ ngf: 64
113
+ n_downsampling: 3
114
+ n_blocks: 18
115
+ add_out_act: sigmoid
116
+ init_conv_kwargs:
117
+ ratio_gin: 0
118
+ ratio_gout: 0
119
+ enable_lfu: false
120
+ downsample_conv_kwargs:
121
+ ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
122
+ ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
123
+ enable_lfu: false
124
+ resnet_conv_kwargs:
125
+ ratio_gin: 0.75
126
+ ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
127
+ enable_lfu: false
128
+ discriminator:
129
+ kind: pix2pixhd_nlayer
130
+ input_nc: 3
131
+ ndf: 64
132
+ n_layers: 4
133
+ evaluator:
134
+ kind: default
135
+ inpainted_key: inpainted
136
+ integral_kind: ssim_fid100_f1
137
+ trainer:
138
+ kwargs:
139
+ gpus: -1
140
+ accelerator: ddp
141
+ max_epochs: 200
142
+ gradient_clip_val: 1
143
+ log_gpu_memory: None
144
+ limit_train_batches: 25000
145
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
146
+ log_every_n_steps: 1000
147
+ precision: 32
148
+ terminate_on_nan: false
149
+ check_val_every_n_epoch: 1
150
+ num_sanity_val_steps: 8
151
+ limit_val_batches: 1000
152
+ replace_sampler_ddp: false
153
+ checkpoint_kwargs:
154
+ verbose: true
155
+ save_top_k: 5
156
+ save_last: true
157
+ period: 1
158
+ monitor: val_ssim_fid100_f1_total_mean
159
+ mode: max
big-lama-with-discr/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0806dc98a99c09561f5e45542ded1126a7ea9eeb91858a468d92c63a0054a550
3
+ size 532770031
big-lama/config.yaml ADDED
@@ -0,0 +1,157 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: b18_ffc075_batch8x15
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ resnet_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+
25
+ optimizers:
26
+ generator:
27
+ kind: adam
28
+ lr: 0.001
29
+ discriminator:
30
+ kind: adam
31
+ lr: 0.0001
32
+ visualizer:
33
+ key_order:
34
+ - image
35
+ - predicted_image
36
+ - discr_output_fake
37
+ - discr_output_real
38
+ - inpainted
39
+ rescale_keys:
40
+ - discr_output_fake
41
+ - discr_output_real
42
+ kind: directory
43
+ outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-04-30_14-41-12_train_simple_pix2pix2_gap_sdpl_novgg_large_b18_ffc075_batch8x15/samples
44
+ location:
45
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_large
46
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
47
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
48
+ data:
49
+ batch_size: 15
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 3
69
+ min_times: 1
70
+ segm_proba: 0
71
+ segm_kwargs:
72
+ confidence_threshold: 0.5
73
+ max_object_area: 0.5
74
+ min_mask_area: 0.07
75
+ downsample_levels: 6
76
+ num_variants_per_mask: 1
77
+ rigidness_mode: 1
78
+ max_foreground_coverage: 0.3
79
+ max_foreground_intersection: 0.7
80
+ max_mask_intersection: 0.1
81
+ max_hidden_area: 0.1
82
+ max_scale_change: 0.25
83
+ horizontal_flip: true
84
+ max_vertical_shift: 0.2
85
+ position_shuffle: true
86
+ transform_variant: distortions
87
+ dataloader_kwargs:
88
+ batch_size: ${data.batch_size}
89
+ shuffle: true
90
+ num_workers: ${data.num_workers}
91
+ val:
92
+ indir: ${location.data_root_dir}/val
93
+ img_suffix: .png
94
+ dataloader_kwargs:
95
+ batch_size: ${data.val_batch_size}
96
+ shuffle: false
97
+ num_workers: ${data.num_workers}
98
+ visual_test:
99
+ indir: ${location.data_root_dir}/korean_test
100
+ img_suffix: _input.png
101
+ pad_out_to_modulo: 32
102
+ dataloader_kwargs:
103
+ batch_size: 1
104
+ shuffle: false
105
+ num_workers: ${data.num_workers}
106
+ generator:
107
+ kind: ffc_resnet
108
+ input_nc: 4
109
+ output_nc: 3
110
+ ngf: 64
111
+ n_downsampling: 3
112
+ n_blocks: 18
113
+ add_out_act: sigmoid
114
+ init_conv_kwargs:
115
+ ratio_gin: 0
116
+ ratio_gout: 0
117
+ enable_lfu: false
118
+ downsample_conv_kwargs:
119
+ ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
120
+ ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
121
+ enable_lfu: false
122
+ resnet_conv_kwargs:
123
+ ratio_gin: 0.75
124
+ ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
125
+ enable_lfu: false
126
+ discriminator:
127
+ kind: pix2pixhd_nlayer
128
+ input_nc: 3
129
+ ndf: 64
130
+ n_layers: 4
131
+ evaluator:
132
+ kind: default
133
+ inpainted_key: inpainted
134
+ integral_kind: ssim_fid100_f1
135
+ trainer:
136
+ kwargs:
137
+ gpus: -1
138
+ accelerator: ddp
139
+ max_epochs: 200
140
+ gradient_clip_val: 1
141
+ log_gpu_memory: None
142
+ limit_train_batches: 25000
143
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
144
+ log_every_n_steps: 1000
145
+ precision: 32
146
+ terminate_on_nan: false
147
+ check_val_every_n_epoch: 1
148
+ num_sanity_val_steps: 8
149
+ limit_val_batches: 1000
150
+ replace_sampler_ddp: false
151
+ checkpoint_kwargs:
152
+ verbose: true
153
+ save_top_k: 5
154
+ save_last: true
155
+ period: 1
156
+ monitor: val_ssim_fid100_f1_total_mean
157
+ mode: max
big-lama/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fccb7adffd53ec0974ee5503c3731c2c2f1e7e07856fd9228cdcc0b46fd5d423
3
+ size 410046389
lama-celeba-hq-pl-abl/lama-no-pl/config.yaml ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: swu_celeba_bs30
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 0
23
+ optimizers:
24
+ generator:
25
+ kind: adam
26
+ lr: 0.001
27
+ discriminator:
28
+ kind: adam
29
+ lr: 0.0001
30
+ visualizer:
31
+ key_order:
32
+ - image
33
+ - predicted_image
34
+ - discr_output_fake
35
+ - discr_output_real
36
+ - inpainted
37
+ rescale_keys:
38
+ - discr_output_fake
39
+ - discr_output_real
40
+ kind: directory
41
+ outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_16-02-59_train_ablv2_work_no_segmpl_swu_celeba_bs30/samples
42
+ location:
43
+ data_root_dir: ${env:HOME}/CelebA-HQ
44
+ out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
45
+ tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
46
+ pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
47
+ data:
48
+ batch_size: 5
49
+ val_batch_size: 2
50
+ num_workers: 3
51
+ train:
52
+ indir: ${location.data_root_dir}/train_256
53
+ out_size: 256
54
+ mask_gen_kwargs:
55
+ irregular_proba: 1
56
+ irregular_kwargs:
57
+ max_angle: 4
58
+ max_len: 200
59
+ max_width: 100
60
+ max_times: 5
61
+ min_times: 1
62
+ box_proba: 1
63
+ box_kwargs:
64
+ margin: 10
65
+ bbox_min_size: 30
66
+ bbox_max_size: 150
67
+ max_times: 4
68
+ min_times: 1
69
+ segm_proba: 0
70
+ transform_variant: no_augs
71
+ dataloader_kwargs:
72
+ batch_size: ${data.batch_size}
73
+ shuffle: true
74
+ num_workers: ${data.num_workers}
75
+ val:
76
+ indir: ${location.data_root_dir}/val_256
77
+ img_suffix: .png
78
+ dataloader_kwargs:
79
+ batch_size: ${data.val_batch_size}
80
+ shuffle: false
81
+ num_workers: ${data.num_workers}
82
+ visual_test: null
83
+ generator:
84
+ kind: pix2pixhd_global
85
+ input_nc: 4
86
+ output_nc: 3
87
+ ngf: 64
88
+ n_downsampling: 3
89
+ n_blocks: 9
90
+ conv_kind: default
91
+ add_out_act: sigmoid
92
+ discriminator:
93
+ kind: pix2pixhd_nlayer
94
+ input_nc: 3
95
+ ndf: 64
96
+ n_layers: 4
97
+ evaluator:
98
+ kind: default
99
+ inpainted_key: inpainted
100
+ integral_kind: ssim_fid100_f1
101
+ trainer:
102
+ kwargs:
103
+ gpus: -1
104
+ distributed_backend: ddp
105
+ max_epochs: 40
106
+ gradient_clip_val: 1
107
+ log_gpu_memory: None
108
+ limit_train_batches: 25000
109
+ val_check_interval: 2600
110
+ log_save_interval: 250
111
+ precision: 32
112
+ terminate_on_nan: false
113
+ check_val_every_n_epoch: 1
114
+ num_sanity_val_steps: 8
115
+ replace_sampler_ddp: false
116
+ checkpoint_kwargs:
117
+ verbose: true
118
+ save_top_k: 5
119
+ save_last: true
120
+ period: 1
121
+ monitor: val_ssim_fid100_f1_total_mean
122
+ mode: max
lama-celeba-hq-pl-abl/lama-no-pl/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66b111ddcbf7253685b16ceeb291210381c5a9f9f3310efd6275b90e95d67cb9
3
+ size 388001399
lama-celeba-hq/ lama-regular/config.yaml ADDED
@@ -0,0 +1,123 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: swu_celeba_bs30
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_16-00-45_train_ablv2_work_swu_celeba_bs30/samples
43
+ location:
44
+ data_root_dir: ${env:HOME}/CelebA-HQ
45
+ out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
46
+ tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
47
+ pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
48
+ data:
49
+ batch_size: 5
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train_256
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 4
69
+ min_times: 1
70
+ segm_proba: 0
71
+ transform_variant: no_augs
72
+ dataloader_kwargs:
73
+ batch_size: ${data.batch_size}
74
+ shuffle: true
75
+ num_workers: ${data.num_workers}
76
+ val:
77
+ indir: ${location.data_root_dir}/val_256
78
+ img_suffix: .png
79
+ dataloader_kwargs:
80
+ batch_size: ${data.val_batch_size}
81
+ shuffle: false
82
+ num_workers: ${data.num_workers}
83
+ visual_test: null
84
+ generator:
85
+ kind: pix2pixhd_global
86
+ input_nc: 4
87
+ output_nc: 3
88
+ ngf: 64
89
+ n_downsampling: 3
90
+ n_blocks: 9
91
+ conv_kind: default
92
+ add_out_act: sigmoid
93
+ discriminator:
94
+ kind: pix2pixhd_nlayer
95
+ input_nc: 3
96
+ ndf: 64
97
+ n_layers: 4
98
+ evaluator:
99
+ kind: default
100
+ inpainted_key: inpainted
101
+ integral_kind: ssim_fid100_f1
102
+ trainer:
103
+ kwargs:
104
+ gpus: -1
105
+ distributed_backend: ddp
106
+ max_epochs: 40
107
+ gradient_clip_val: 1
108
+ log_gpu_memory: None
109
+ limit_train_batches: 25000
110
+ val_check_interval: 2600
111
+ log_save_interval: 250
112
+ precision: 32
113
+ terminate_on_nan: false
114
+ check_val_every_n_epoch: 1
115
+ num_sanity_val_steps: 8
116
+ replace_sampler_ddp: false
117
+ checkpoint_kwargs:
118
+ verbose: true
119
+ save_top_k: 5
120
+ save_last: true
121
+ period: 1
122
+ monitor: val_ssim_fid100_f1_total_mean
123
+ mode: max
lama-celeba-hq/ lama-regular/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5641c7655a82749e22c0a392c80dd94d7266ae0f63fbaf6b2a96671ac2d0e918
3
+ size 388009385
lama-celeba-hq/lama-deep/config.yaml ADDED
@@ -0,0 +1,123 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: swu_celeba_bs30_b15
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-06-11_18-11-09_train_ablv2_work_swu_celeba_bs30_b15/samples
43
+ location:
44
+ data_root_dir: ${env:HOME}/CelebA-HQ
45
+ out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
46
+ tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
47
+ pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
48
+ data:
49
+ batch_size: 5
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train_256
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 4
69
+ min_times: 1
70
+ segm_proba: 0
71
+ transform_variant: no_augs
72
+ dataloader_kwargs:
73
+ batch_size: ${data.batch_size}
74
+ shuffle: true
75
+ num_workers: ${data.num_workers}
76
+ val:
77
+ indir: ${location.data_root_dir}/val_256
78
+ img_suffix: .png
79
+ dataloader_kwargs:
80
+ batch_size: ${data.val_batch_size}
81
+ shuffle: false
82
+ num_workers: ${data.num_workers}
83
+ visual_test: null
84
+ generator:
85
+ kind: pix2pixhd_global
86
+ input_nc: 4
87
+ output_nc: 3
88
+ ngf: 64
89
+ n_downsampling: 3
90
+ n_blocks: 15
91
+ conv_kind: default
92
+ add_out_act: sigmoid
93
+ discriminator:
94
+ kind: pix2pixhd_nlayer
95
+ input_nc: 3
96
+ ndf: 64
97
+ n_layers: 4
98
+ evaluator:
99
+ kind: default
100
+ inpainted_key: inpainted
101
+ integral_kind: ssim_fid100_f1
102
+ trainer:
103
+ kwargs:
104
+ gpus: -1
105
+ distributed_backend: ddp
106
+ max_epochs: 40
107
+ gradient_clip_val: 1
108
+ log_gpu_memory: None
109
+ limit_train_batches: 25000
110
+ val_check_interval: 2600
111
+ log_save_interval: 250
112
+ precision: 32
113
+ terminate_on_nan: false
114
+ check_val_every_n_epoch: 1
115
+ num_sanity_val_steps: 8
116
+ replace_sampler_ddp: false
117
+ checkpoint_kwargs:
118
+ verbose: true
119
+ save_top_k: 5
120
+ save_last: true
121
+ period: 1
122
+ monitor: val_ssim_fid100_f1_total_mean
123
+ mode: max
lama-celeba-hq/lama-deep/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec02f080ef3adf6395a111efc061dd2d869ab78fe014c6f4431e61a8a448332e
3
+ size 501258959
lama-celeba-hq/lama-dilated/config.yaml ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: swu_celeba_bs30
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_00-49-10_train_final_md_swu_celeba_bs30/samples
43
+ location:
44
+ data_root_dir: ${env:HOME}/CelebA-HQ
45
+ out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
46
+ tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
47
+ pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
48
+ data:
49
+ batch_size: 5
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train_256
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 4
69
+ min_times: 1
70
+ segm_proba: 0
71
+ transform_variant: no_augs
72
+ dataloader_kwargs:
73
+ batch_size: ${data.batch_size}
74
+ shuffle: true
75
+ num_workers: ${data.num_workers}
76
+ val:
77
+ indir: ${location.data_root_dir}/val_256
78
+ img_suffix: .png
79
+ dataloader_kwargs:
80
+ batch_size: ${data.val_batch_size}
81
+ shuffle: false
82
+ num_workers: ${data.num_workers}
83
+ visual_test: null
84
+ generator:
85
+ kind: pix2pixhd_multidilated
86
+ input_nc: 4
87
+ output_nc: 3
88
+ ngf: 64
89
+ n_downsampling: 3
90
+ n_blocks: 9
91
+ conv_kind: default
92
+ add_out_act: sigmoid
93
+ multidilation_kwargs:
94
+ comb_mode: cat_in
95
+ dilation_num: 4
96
+ discriminator:
97
+ kind: pix2pixhd_nlayer
98
+ input_nc: 3
99
+ ndf: 64
100
+ n_layers: 4
101
+ evaluator:
102
+ kind: default
103
+ inpainted_key: inpainted
104
+ integral_kind: ssim_fid100_f1
105
+ trainer:
106
+ kwargs:
107
+ gpus: -1
108
+ distributed_backend: ddp
109
+ max_epochs: 40
110
+ gradient_clip_val: 1
111
+ log_gpu_memory: None
112
+ limit_train_batches: 25000
113
+ val_check_interval: 2600
114
+ log_save_interval: 250
115
+ precision: 32
116
+ terminate_on_nan: false
117
+ check_val_every_n_epoch: 1
118
+ num_sanity_val_steps: 8
119
+ replace_sampler_ddp: false
120
+ benchmark: true
121
+ checkpoint_kwargs:
122
+ verbose: true
123
+ save_top_k: 5
124
+ save_last: true
125
+ period: 1
126
+ monitor: val_ssim_fid100_f1_total_mean
127
+ mode: max
lama-celeba-hq/lama-dilated/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c71a0e8195c0944c27b5e2ba785c6e7fe2bef32da68bd1a46ee2b1c36f425476
3
+ size 388160827
lama-celeba-hq/lama-fourier-shallow/config.yaml ADDED
@@ -0,0 +1,134 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: swu_celeba_bs30_b6
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-06-11_18-21-08_train_ablv2_work_ffc075_swu_celeba_bs30_b6/samples
43
+ location:
44
+ data_root_dir: ${env:HOME}/CelebA-HQ
45
+ out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
46
+ tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
47
+ pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
48
+ data:
49
+ batch_size: 6
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train_256
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 4
69
+ min_times: 1
70
+ segm_proba: 0
71
+ transform_variant: no_augs
72
+ dataloader_kwargs:
73
+ batch_size: ${data.batch_size}
74
+ shuffle: true
75
+ num_workers: ${data.num_workers}
76
+ val:
77
+ indir: ${location.data_root_dir}/val_256
78
+ img_suffix: .png
79
+ dataloader_kwargs:
80
+ batch_size: ${data.val_batch_size}
81
+ shuffle: false
82
+ num_workers: ${data.num_workers}
83
+ visual_test: null
84
+ generator:
85
+ kind: ffc_resnet
86
+ input_nc: 4
87
+ output_nc: 3
88
+ ngf: 64
89
+ n_downsampling: 3
90
+ n_blocks: 6
91
+ add_out_act: sigmoid
92
+ init_conv_kwargs:
93
+ ratio_gin: 0
94
+ ratio_gout: 0
95
+ enable_lfu: false
96
+ downsample_conv_kwargs:
97
+ ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
98
+ ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
99
+ enable_lfu: false
100
+ resnet_conv_kwargs:
101
+ ratio_gin: 0.75
102
+ ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
103
+ enable_lfu: false
104
+ discriminator:
105
+ kind: pix2pixhd_nlayer
106
+ input_nc: 3
107
+ ndf: 64
108
+ n_layers: 4
109
+ evaluator:
110
+ kind: default
111
+ inpainted_key: inpainted
112
+ integral_kind: ssim_fid100_f1
113
+ trainer:
114
+ kwargs:
115
+ gpus: -1
116
+ distributed_backend: ddp
117
+ max_epochs: 40
118
+ gradient_clip_val: 1
119
+ log_gpu_memory: None
120
+ limit_train_batches: 25000
121
+ val_check_interval: 2600
122
+ log_save_interval: 250
123
+ precision: 32
124
+ terminate_on_nan: false
125
+ check_val_every_n_epoch: 1
126
+ num_sanity_val_steps: 8
127
+ replace_sampler_ddp: false
128
+ checkpoint_kwargs:
129
+ verbose: true
130
+ save_top_k: 5
131
+ save_last: true
132
+ period: 1
133
+ monitor: val_ssim_fid100_f1_total_mean
134
+ mode: max
lama-celeba-hq/lama-fourier-shallow/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ba34746ca7e365c56429317e64c6ff964ecb1217b0599c735a76118197cbb06
3
+ size 281772850
lama-celeba-hq/lama-fourier/config.yaml ADDED
@@ -0,0 +1,134 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: swu_celeba_bs30
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_00-40-44_train_ablv2_work_ffc075_swu_celeba_bs30/samples
43
+ location:
44
+ data_root_dir: ${env:HOME}/CelebA-HQ
45
+ out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
46
+ tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
47
+ pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
48
+ data:
49
+ batch_size: 5
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train_256
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 4
69
+ min_times: 1
70
+ segm_proba: 0
71
+ transform_variant: no_augs
72
+ dataloader_kwargs:
73
+ batch_size: ${data.batch_size}
74
+ shuffle: true
75
+ num_workers: ${data.num_workers}
76
+ val:
77
+ indir: ${location.data_root_dir}/val_256
78
+ img_suffix: .png
79
+ dataloader_kwargs:
80
+ batch_size: ${data.val_batch_size}
81
+ shuffle: false
82
+ num_workers: ${data.num_workers}
83
+ visual_test: null
84
+ generator:
85
+ kind: ffc_resnet
86
+ input_nc: 4
87
+ output_nc: 3
88
+ ngf: 64
89
+ n_downsampling: 3
90
+ n_blocks: 9
91
+ add_out_act: sigmoid
92
+ init_conv_kwargs:
93
+ ratio_gin: 0
94
+ ratio_gout: 0
95
+ enable_lfu: false
96
+ downsample_conv_kwargs:
97
+ ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
98
+ ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
99
+ enable_lfu: false
100
+ resnet_conv_kwargs:
101
+ ratio_gin: 0.75
102
+ ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
103
+ enable_lfu: false
104
+ discriminator:
105
+ kind: pix2pixhd_nlayer
106
+ input_nc: 3
107
+ ndf: 64
108
+ n_layers: 4
109
+ evaluator:
110
+ kind: default
111
+ inpainted_key: inpainted
112
+ integral_kind: ssim_fid100_f1
113
+ trainer:
114
+ kwargs:
115
+ gpus: -1
116
+ distributed_backend: ddp
117
+ max_epochs: 40
118
+ gradient_clip_val: 1
119
+ log_gpu_memory: None
120
+ limit_train_batches: 25000
121
+ val_check_interval: 2600
122
+ log_save_interval: 250
123
+ precision: 32
124
+ terminate_on_nan: false
125
+ check_val_every_n_epoch: 1
126
+ num_sanity_val_steps: 8
127
+ replace_sampler_ddp: false
128
+ checkpoint_kwargs:
129
+ verbose: true
130
+ save_top_k: 5
131
+ save_last: true
132
+ period: 1
133
+ monitor: val_ssim_fid100_f1_total_mean
134
+ mode: max
lama-celeba-hq/lama-fourier/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3060742ea7464288d7d5fa8e83c940ddbd359ba1640f79135759da9c8c81f281
3
+ size 313953334
lama-celeba-hq/lama_small_train_masks/config.yaml ADDED
@@ -0,0 +1,123 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: swu_celeba_bs30
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ segm_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_16-02-59_train_ablv2_work_small_holes_swu_celeba_bs30/samples
43
+ location:
44
+ data_root_dir: ${env:HOME}/CelebA-HQ
45
+ out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
46
+ tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
47
+ pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
48
+ data:
49
+ batch_size: 5
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train_256
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 4
69
+ min_times: 1
70
+ segm_proba: 0
71
+ transform_variant: no_augs
72
+ dataloader_kwargs:
73
+ batch_size: ${data.batch_size}
74
+ shuffle: true
75
+ num_workers: ${data.num_workers}
76
+ val:
77
+ indir: ${location.data_root_dir}/val_256
78
+ img_suffix: .png
79
+ dataloader_kwargs:
80
+ batch_size: ${data.val_batch_size}
81
+ shuffle: false
82
+ num_workers: ${data.num_workers}
83
+ visual_test: null
84
+ generator:
85
+ kind: pix2pixhd_global
86
+ input_nc: 4
87
+ output_nc: 3
88
+ ngf: 64
89
+ n_downsampling: 3
90
+ n_blocks: 9
91
+ conv_kind: default
92
+ add_out_act: sigmoid
93
+ discriminator:
94
+ kind: pix2pixhd_nlayer
95
+ input_nc: 3
96
+ ndf: 64
97
+ n_layers: 4
98
+ evaluator:
99
+ kind: default
100
+ inpainted_key: inpainted
101
+ integral_kind: ssim_fid100_f1
102
+ trainer:
103
+ kwargs:
104
+ gpus: -1
105
+ distributed_backend: ddp
106
+ max_epochs: 40
107
+ gradient_clip_val: 1
108
+ log_gpu_memory: None
109
+ limit_train_batches: 25000
110
+ val_check_interval: 2600
111
+ log_save_interval: 250
112
+ precision: 32
113
+ terminate_on_nan: false
114
+ check_val_every_n_epoch: 1
115
+ num_sanity_val_steps: 8
116
+ replace_sampler_ddp: false
117
+ checkpoint_kwargs:
118
+ verbose: true
119
+ save_top_k: 5
120
+ save_last: true
121
+ period: 1
122
+ monitor: val_ssim_fid100_f1_total_mean
123
+ mode: max
lama-celeba-hq/lama_small_train_masks/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e84c94a80cdbd6fb1315dffbf418cd421fb2e4f16ee260bd6d455fa2ff1a1ef6
3
+ size 388009574
lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/config.yaml ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ location:
2
+ data_root_dir: /home/${env:USER}/inpainting_data_root_final
3
+ out_root_dir: /home/${env:USER}/inpainting/experiments
4
+ tb_dir: /home/${env:USER}/inpainting/tb_logs
5
+ data:
6
+ batch_size: 10
7
+ val_batch_size: 2
8
+ num_workers: 3
9
+ train:
10
+ indir: ${location.data_root_dir}/train
11
+ out_size: 256
12
+ mask_gen_kwargs:
13
+ irregular_proba: 1
14
+ irregular_kwargs:
15
+ max_angle: 4
16
+ max_len: 200
17
+ max_width: 100
18
+ max_times: 5
19
+ min_times: 1
20
+ box_proba: 1
21
+ box_kwargs:
22
+ margin: 10
23
+ bbox_min_size: 30
24
+ bbox_max_size: 150
25
+ max_times: 4
26
+ min_times: 1
27
+ segm_proba: 0
28
+ transform_variant: distortions
29
+ dataloader_kwargs:
30
+ batch_size: ${data.batch_size}
31
+ shuffle: true
32
+ num_workers: ${data.num_workers}
33
+ val:
34
+ indir: ${location.data_root_dir}/val
35
+ img_suffix: .png
36
+ dataloader_kwargs:
37
+ batch_size: ${data.val_batch_size}
38
+ shuffle: false
39
+ num_workers: ${data.num_workers}
40
+ visual_test:
41
+ indir: ${location.data_root_dir}/korean_test
42
+ img_suffix: _input.png
43
+ pad_out_to_modulo: 32
44
+ dataloader_kwargs:
45
+ batch_size: 1
46
+ shuffle: false
47
+ num_workers: ${data.num_workers}
48
+ generator:
49
+ kind: pix2pixhd_global
50
+ input_nc: 4
51
+ output_nc: 3
52
+ ngf: 64
53
+ n_downsampling: 3
54
+ n_blocks: 9
55
+ conv_kind: default
56
+ add_out_act: sigmoid
57
+ discriminator:
58
+ kind: pix2pixhd_nlayer
59
+ input_nc: 3
60
+ ndf: 64
61
+ n_layers: 4
62
+ visualizer:
63
+ kind: directory
64
+ outdir: /home/${env:USER}/inpainting/experiments/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/samples
65
+ key_order:
66
+ - image
67
+ - predicted_image
68
+ - discr_output_fake
69
+ - discr_output_real
70
+ - inpainted
71
+ rescale_keys:
72
+ - discr_output_fake
73
+ - discr_output_real
74
+ evaluator:
75
+ kind: default
76
+ inpainted_key: inpainted
77
+ integral_kind: ssim_fid100_f1
78
+ trainer:
79
+ kwargs:
80
+ gpus: -1
81
+ accelerator: ddp
82
+ max_epochs: 40
83
+ gradient_clip_val: 1
84
+ log_gpu_memory: None
85
+ limit_train_batches: 25000
86
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
87
+ log_every_n_steps: 250
88
+ precision: 32
89
+ terminate_on_nan: false
90
+ check_val_every_n_epoch: 1
91
+ num_sanity_val_steps: 8
92
+ replace_sampler_ddp: false
93
+ checkpoint_kwargs:
94
+ verbose: true
95
+ save_top_k: 5
96
+ save_last: true
97
+ period: 1
98
+ monitor: val_ssim_fid100_f1_total_mean
99
+ mode: max
100
+ run_title: csirpl03_fixed
101
+ training_model:
102
+ kind: default
103
+ visualize_each_iters: 1000
104
+ concat_mask: true
105
+ store_discr_outputs_for_vis: true
106
+ losses:
107
+ l1:
108
+ weight_missing: 0
109
+ weight_known: 10
110
+ perceptual:
111
+ weight: 0
112
+ adversarial:
113
+ kind: r1
114
+ weight: 10
115
+ gp_coef: 0.001
116
+ mask_as_fake_target: true
117
+ allow_scale_mask: true
118
+ feature_matching:
119
+ weight: 100
120
+ segm_pl:
121
+ weight: 0.3
122
+ arch_encoder: resnet50
123
+ imagenet_weights: true
124
+ optimizers:
125
+ generator:
126
+ kind: adam
127
+ lr: 0.001
128
+ discriminator:
129
+ kind: adam
130
+ lr: 0.0001
lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5bcc70055960584b05717e0f4c4aa11fa2e17165f930d38966497a7829144c7
3
+ size 388032511
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/config.yaml ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ location:
2
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
3
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
4
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
5
+ data:
6
+ batch_size: 10
7
+ val_batch_size: 2
8
+ num_workers: 3
9
+ train:
10
+ indir: ${location.data_root_dir}/train
11
+ out_size: 256
12
+ mask_gen_kwargs:
13
+ irregular_proba: 1
14
+ irregular_kwargs:
15
+ max_angle: 4
16
+ max_len: 200
17
+ max_width: 100
18
+ max_times: 5
19
+ min_times: 1
20
+ box_proba: 1
21
+ box_kwargs:
22
+ margin: 10
23
+ bbox_min_size: 30
24
+ bbox_max_size: 150
25
+ max_times: 4
26
+ min_times: 1
27
+ segm_proba: 0
28
+ transform_variant: distortions
29
+ dataloader_kwargs:
30
+ batch_size: ${data.batch_size}
31
+ shuffle: true
32
+ num_workers: ${data.num_workers}
33
+ val:
34
+ indir: ${location.data_root_dir}/val
35
+ img_suffix: .png
36
+ dataloader_kwargs:
37
+ batch_size: ${data.val_batch_size}
38
+ shuffle: false
39
+ num_workers: ${data.num_workers}
40
+ visual_test:
41
+ indir: ${location.data_root_dir}/korean_test
42
+ img_suffix: _input.png
43
+ pad_out_to_modulo: 32
44
+ dataloader_kwargs:
45
+ batch_size: 1
46
+ shuffle: false
47
+ num_workers: ${data.num_workers}
48
+ generator:
49
+ kind: pix2pixhd_global
50
+ input_nc: 4
51
+ output_nc: 3
52
+ ngf: 64
53
+ n_downsampling: 3
54
+ n_blocks: 9
55
+ conv_kind: default
56
+ add_out_act: sigmoid
57
+ discriminator:
58
+ kind: pix2pixhd_nlayer
59
+ input_nc: 3
60
+ ndf: 64
61
+ n_layers: 4
62
+ visualizer:
63
+ kind: directory
64
+ outdir: /group-volume/User-Driven-Content-Generation/e.logacheva/inpainting/experiments/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/samples
65
+ key_order:
66
+ - image
67
+ - predicted_image
68
+ - discr_output_fake
69
+ - discr_output_real
70
+ - inpainted
71
+ rescale_keys:
72
+ - discr_output_fake
73
+ - discr_output_real
74
+ evaluator:
75
+ kind: default
76
+ inpainted_key: inpainted
77
+ integral_kind: ssim_fid100_f1
78
+ trainer:
79
+ kwargs:
80
+ gpus: -1
81
+ accelerator: ddp
82
+ max_epochs: 40
83
+ gradient_clip_val: 1
84
+ log_gpu_memory: None
85
+ limit_train_batches: 25000
86
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
87
+ log_every_n_steps: 250
88
+ precision: 32
89
+ terminate_on_nan: false
90
+ check_val_every_n_epoch: 1
91
+ num_sanity_val_steps: 8
92
+ replace_sampler_ddp: false
93
+ benchmark: true
94
+ checkpoint_kwargs:
95
+ verbose: true
96
+ save_top_k: 5
97
+ save_last: true
98
+ period: 1
99
+ monitor: val_ssim_fid100_f1_total_mean
100
+ mode: max
101
+ run_title: csdilirpl1_new
102
+ training_model:
103
+ kind: default
104
+ visualize_each_iters: 1000
105
+ concat_mask: true
106
+ store_discr_outputs_for_vis: true
107
+ losses:
108
+ l1:
109
+ weight_missing: 0
110
+ weight_known: 10
111
+ perceptual:
112
+ weight: 0
113
+ adversarial:
114
+ kind: r1
115
+ weight: 10
116
+ gp_coef: 0.001
117
+ mask_as_fake_target: true
118
+ allow_scale_mask: true
119
+ feature_matching:
120
+ weight: 100
121
+ segm_pl:
122
+ weight: 1
123
+ imagenet_weights: true
124
+ optimizers:
125
+ generator:
126
+ kind: adam
127
+ lr: 0.001
128
+ discriminator:
129
+ kind: adam
130
+ lr: 0.0001
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e5f5fc644afefa2ecfddb232b1c397d87bd490fd34f1b2d94c8d44b94fad292
3
+ size 388032365
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/config.yaml ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ location:
2
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
3
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
4
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
5
+ data:
6
+ batch_size: 10
7
+ val_batch_size: 2
8
+ num_workers: 3
9
+ train:
10
+ indir: ${location.data_root_dir}/train
11
+ out_size: 256
12
+ mask_gen_kwargs:
13
+ irregular_proba: 1
14
+ irregular_kwargs:
15
+ max_angle: 4
16
+ max_len: 200
17
+ max_width: 100
18
+ max_times: 5
19
+ min_times: 1
20
+ box_proba: 1
21
+ box_kwargs:
22
+ margin: 10
23
+ bbox_min_size: 30
24
+ bbox_max_size: 150
25
+ max_times: 4
26
+ min_times: 1
27
+ segm_proba: 0
28
+ transform_variant: distortions
29
+ dataloader_kwargs:
30
+ batch_size: ${data.batch_size}
31
+ shuffle: true
32
+ num_workers: ${data.num_workers}
33
+ val:
34
+ indir: ${location.data_root_dir}/val
35
+ img_suffix: .png
36
+ dataloader_kwargs:
37
+ batch_size: ${data.val_batch_size}
38
+ shuffle: false
39
+ num_workers: ${data.num_workers}
40
+ visual_test:
41
+ indir: ${location.data_root_dir}/korean_test
42
+ img_suffix: _input.png
43
+ pad_out_to_modulo: 32
44
+ dataloader_kwargs:
45
+ batch_size: 1
46
+ shuffle: false
47
+ num_workers: ${data.num_workers}
48
+ generator:
49
+ kind: pix2pixhd_global
50
+ input_nc: 4
51
+ output_nc: 3
52
+ ngf: 64
53
+ n_downsampling: 3
54
+ n_blocks: 9
55
+ conv_kind: default
56
+ add_out_act: sigmoid
57
+ discriminator:
58
+ kind: pix2pixhd_nlayer
59
+ input_nc: 3
60
+ ndf: 64
61
+ n_layers: 4
62
+ visualizer:
63
+ kind: directory
64
+ outdir: /group-volume/User-Driven-Content-Generation/e.logacheva/inpainting/experiments/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/samples
65
+ key_order:
66
+ - image
67
+ - predicted_image
68
+ - discr_output_fake
69
+ - discr_output_real
70
+ - inpainted
71
+ rescale_keys:
72
+ - discr_output_fake
73
+ - discr_output_real
74
+ evaluator:
75
+ kind: default
76
+ inpainted_key: inpainted
77
+ integral_kind: ssim_fid100_f1
78
+ trainer:
79
+ kwargs:
80
+ gpus: -1
81
+ accelerator: ddp
82
+ max_epochs: 40
83
+ gradient_clip_val: 1
84
+ log_gpu_memory: None
85
+ limit_train_batches: 25000
86
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
87
+ log_every_n_steps: 250
88
+ precision: 32
89
+ terminate_on_nan: false
90
+ check_val_every_n_epoch: 1
91
+ num_sanity_val_steps: 8
92
+ replace_sampler_ddp: false
93
+ checkpoint_kwargs:
94
+ verbose: true
95
+ save_top_k: 5
96
+ save_last: true
97
+ period: 1
98
+ monitor: val_ssim_fid100_f1_total_mean
99
+ mode: max
100
+ run_title: l2_vgg003_new
101
+ training_model:
102
+ kind: default
103
+ visualize_each_iters: 1000
104
+ concat_mask: true
105
+ store_discr_outputs_for_vis: true
106
+ losses:
107
+ l1:
108
+ weight_missing: 0
109
+ weight_known: 10
110
+ perceptual:
111
+ weight: 0.03
112
+ kwargs:
113
+ metric: l2
114
+ adversarial:
115
+ kind: r1
116
+ weight: 10
117
+ gp_coef: 0.001
118
+ mask_as_fake_target: true
119
+ allow_scale_mask: true
120
+ feature_matching:
121
+ weight: 100
122
+ segm_pl:
123
+ weight: 0
124
+ optimizers:
125
+ generator:
126
+ kind: adam
127
+ lr: 0.001
128
+ discriminator:
129
+ kind: adam
130
+ lr: 0.0001
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e66fd161b99155ae00b001ba3d727d2b468805529852f6f798ae348f1b2fb9e1
3
+ size 388025416
lama-places/big-lama-regular/config.yaml ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ location:
2
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
3
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
4
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
5
+ data:
6
+ batch_size: 5
7
+ val_batch_size: 2
8
+ num_workers: 3
9
+ train:
10
+ indir: ${location.data_root_dir}/train
11
+ out_size: 256
12
+ mask_gen_kwargs:
13
+ irregular_proba: 1
14
+ irregular_kwargs:
15
+ max_angle: 4
16
+ max_len: 200
17
+ max_width: 100
18
+ max_times: 5
19
+ min_times: 1
20
+ box_proba: 1
21
+ box_kwargs:
22
+ margin: 10
23
+ bbox_min_size: 30
24
+ bbox_max_size: 150
25
+ max_times: 4
26
+ min_times: 1
27
+ segm_proba: 0
28
+ transform_variant: distortions
29
+ dataloader_kwargs:
30
+ batch_size: ${data.batch_size}
31
+ shuffle: true
32
+ num_workers: ${data.num_workers}
33
+ val:
34
+ indir: ${location.data_root_dir}/val
35
+ img_suffix: .png
36
+ dataloader_kwargs:
37
+ batch_size: ${data.val_batch_size}
38
+ shuffle: false
39
+ num_workers: ${data.num_workers}
40
+ visual_test:
41
+ indir: ${location.data_root_dir}/korean_test
42
+ img_suffix: _input.png
43
+ pad_out_to_modulo: 32
44
+ dataloader_kwargs:
45
+ batch_size: 1
46
+ shuffle: false
47
+ num_workers: ${data.num_workers}
48
+ generator:
49
+ kind: pix2pixhd_global
50
+ input_nc: 4
51
+ output_nc: 3
52
+ ngf: 64
53
+ n_downsampling: 3
54
+ n_blocks: 15
55
+ conv_kind: default
56
+ add_out_act: sigmoid
57
+ discriminator:
58
+ kind: pix2pixhd_nlayer
59
+ input_nc: 3
60
+ ndf: 64
61
+ n_layers: 4
62
+ visualizer:
63
+ kind: directory
64
+ outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-06-11_13-21-15_train_ablv2_work_rebuttal-b15/samples
65
+ key_order:
66
+ - image
67
+ - predicted_image
68
+ - discr_output_fake
69
+ - discr_output_real
70
+ - inpainted
71
+ rescale_keys:
72
+ - discr_output_fake
73
+ - discr_output_real
74
+ evaluator:
75
+ kind: default
76
+ inpainted_key: inpainted
77
+ integral_kind: ssim_fid100_f1
78
+ trainer:
79
+ kwargs:
80
+ gpus: -1
81
+ accelerator: ddp
82
+ max_epochs: 40
83
+ gradient_clip_val: 1
84
+ log_gpu_memory: None
85
+ limit_train_batches: 25000
86
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
87
+ log_every_n_steps: 250
88
+ precision: 32
89
+ terminate_on_nan: false
90
+ check_val_every_n_epoch: 1
91
+ num_sanity_val_steps: 8
92
+ replace_sampler_ddp: false
93
+ checkpoint_kwargs:
94
+ verbose: true
95
+ save_top_k: 5
96
+ save_last: true
97
+ period: 1
98
+ monitor: val_ssim_fid100_f1_total_mean
99
+ mode: max
100
+ run_title: rebuttal-b15
101
+ training_model:
102
+ kind: default
103
+ visualize_each_iters: 1000
104
+ concat_mask: true
105
+ store_discr_outputs_for_vis: true
106
+ losses:
107
+ l1:
108
+ weight_missing: 0
109
+ weight_known: 10
110
+ perceptual:
111
+ weight: 0
112
+ adversarial:
113
+ kind: r1
114
+ weight: 10
115
+ gp_coef: 0.001
116
+ mask_as_fake_target: true
117
+ allow_scale_mask: true
118
+ feature_matching:
119
+ weight: 100
120
+ resnet_pl:
121
+ weight: 30
122
+ weights_path: ${env:TORCH_HOME}
123
+ optimizers:
124
+ generator:
125
+ kind: adam
126
+ lr: 0.001
127
+ discriminator:
128
+ kind: adam
129
+ lr: 0.0001
lama-places/big-lama-regular/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40886923da4741b8c5fa25264371c0fca6ebc1b680e4744ae94714f2c26a8e11
3
+ size 501445597
lama-places/lama-dilated/config.yaml ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ location:
2
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
3
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
4
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
5
+ data:
6
+ batch_size: 10
7
+ val_batch_size: 2
8
+ num_workers: 3
9
+ train:
10
+ indir: ${location.data_root_dir}/train
11
+ out_size: 256
12
+ mask_gen_kwargs:
13
+ irregular_proba: 1
14
+ irregular_kwargs:
15
+ max_angle: 4
16
+ max_len: 200
17
+ max_width: 100
18
+ max_times: 5
19
+ min_times: 1
20
+ box_proba: 1
21
+ box_kwargs:
22
+ margin: 10
23
+ bbox_min_size: 30
24
+ bbox_max_size: 150
25
+ max_times: 4
26
+ min_times: 1
27
+ segm_proba: 0
28
+ transform_variant: distortions
29
+ dataloader_kwargs:
30
+ batch_size: ${data.batch_size}
31
+ shuffle: true
32
+ num_workers: ${data.num_workers}
33
+ val:
34
+ indir: ${location.data_root_dir}/val
35
+ img_suffix: .png
36
+ dataloader_kwargs:
37
+ batch_size: ${data.val_batch_size}
38
+ shuffle: false
39
+ num_workers: ${data.num_workers}
40
+ visual_test:
41
+ indir: ${location.data_root_dir}/korean_test
42
+ img_suffix: _input.png
43
+ pad_out_to_modulo: 32
44
+ dataloader_kwargs:
45
+ batch_size: 1
46
+ shuffle: false
47
+ num_workers: ${data.num_workers}
48
+ generator:
49
+ kind: pix2pixhd_multidilated
50
+ input_nc: 4
51
+ output_nc: 3
52
+ ngf: 64
53
+ n_downsampling: 3
54
+ n_blocks: 9
55
+ conv_kind: default
56
+ add_out_act: sigmoid
57
+ multidilation_kwargs:
58
+ comb_mode: cat_in
59
+ dilation_num: 4
60
+ discriminator:
61
+ kind: pix2pixhd_nlayer
62
+ input_nc: 3
63
+ ndf: 64
64
+ n_layers: 4
65
+ visualizer:
66
+ kind: directory
67
+ outdir: /group-volume/User-Driven-Content-Generation/e.logacheva/inpainting/experiments/e.logacheva_2021-09-23_11-53-00_train_ablv2_work_md_new/samples
68
+ key_order:
69
+ - image
70
+ - predicted_image
71
+ - discr_output_fake
72
+ - discr_output_real
73
+ - inpainted
74
+ rescale_keys:
75
+ - discr_output_fake
76
+ - discr_output_real
77
+ evaluator:
78
+ kind: default
79
+ inpainted_key: inpainted
80
+ integral_kind: ssim_fid100_f1
81
+ trainer:
82
+ kwargs:
83
+ gpus: -1
84
+ accelerator: ddp
85
+ max_epochs: 40
86
+ gradient_clip_val: 1
87
+ log_gpu_memory: None
88
+ limit_train_batches: 25000
89
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
90
+ log_every_n_steps: 250
91
+ precision: 32
92
+ terminate_on_nan: false
93
+ check_val_every_n_epoch: 1
94
+ num_sanity_val_steps: 8
95
+ replace_sampler_ddp: false
96
+ benchmark: true
97
+ checkpoint_kwargs:
98
+ verbose: true
99
+ save_top_k: 5
100
+ save_last: true
101
+ period: 1
102
+ monitor: val_ssim_fid100_f1_total_mean
103
+ mode: max
104
+ run_title: new
105
+ training_model:
106
+ kind: default
107
+ visualize_each_iters: 1000
108
+ concat_mask: true
109
+ store_discr_outputs_for_vis: true
110
+ losses:
111
+ l1:
112
+ weight_missing: 0
113
+ weight_known: 10
114
+ perceptual:
115
+ weight: 0
116
+ adversarial:
117
+ kind: r1
118
+ weight: 10
119
+ gp_coef: 0.001
120
+ mask_as_fake_target: true
121
+ allow_scale_mask: true
122
+ feature_matching:
123
+ weight: 100
124
+ segm_pl:
125
+ weight: 30
126
+ weights_path: ${env:TORCH_HOME}
127
+ optimizers:
128
+ generator:
129
+ kind: adam
130
+ lr: 0.001
131
+ discriminator:
132
+ kind: adam
133
+ lr: 0.0001
lama-places/lama-dilated/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e09dfa9ab3c74149a4ee5db115f23904acc6349f55f16972d11aea903c9496a0
3
+ size 388184818
lama-places/lama-fourier/config.yaml ADDED
@@ -0,0 +1,142 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: resume
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ resnet_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: dummy_lol
43
+
44
+ location:
45
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
46
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
47
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
48
+ data:
49
+ batch_size: 10
50
+ val_batch_size: 2
51
+ num_workers: 3
52
+ train:
53
+ indir: ${location.data_root_dir}/train
54
+ out_size: 256
55
+ mask_gen_kwargs:
56
+ irregular_proba: 1
57
+ irregular_kwargs:
58
+ max_angle: 4
59
+ max_len: 200
60
+ max_width: 100
61
+ max_times: 5
62
+ min_times: 1
63
+ box_proba: 1
64
+ box_kwargs:
65
+ margin: 10
66
+ bbox_min_size: 30
67
+ bbox_max_size: 150
68
+ max_times: 4
69
+ min_times: 1
70
+ segm_proba: 0
71
+ transform_variant: distortions
72
+ dataloader_kwargs:
73
+ batch_size: ${data.batch_size}
74
+ shuffle: true
75
+ num_workers: ${data.num_workers}
76
+ val:
77
+ indir: ${location.data_root_dir}/val
78
+ img_suffix: .png
79
+ dataloader_kwargs:
80
+ batch_size: ${data.val_batch_size}
81
+ shuffle: false
82
+ num_workers: ${data.num_workers}
83
+ visual_test:
84
+ indir: ${location.data_root_dir}/korean_test
85
+ img_suffix: _input.png
86
+ pad_out_to_modulo: 32
87
+ dataloader_kwargs:
88
+ batch_size: 1
89
+ shuffle: false
90
+ num_workers: ${data.num_workers}
91
+ generator:
92
+ kind: ffc_resnet
93
+ input_nc: 4
94
+ output_nc: 3
95
+ ngf: 64
96
+ n_downsampling: 3
97
+ n_blocks: 9
98
+ add_out_act: sigmoid
99
+ init_conv_kwargs:
100
+ ratio_gin: 0
101
+ ratio_gout: 0
102
+ enable_lfu: false
103
+ downsample_conv_kwargs:
104
+ ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
105
+ ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
106
+ enable_lfu: false
107
+ resnet_conv_kwargs:
108
+ ratio_gin: 0.75
109
+ ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
110
+ enable_lfu: false
111
+ discriminator:
112
+ kind: pix2pixhd_nlayer
113
+ input_nc: 3
114
+ ndf: 64
115
+ n_layers: 4
116
+ evaluator:
117
+ kind: default
118
+ inpainted_key: inpainted
119
+ integral_kind: ssim_fid100_f1
120
+ trainer:
121
+ kwargs:
122
+ gpus: -1
123
+ distributed_backend: ddp
124
+ max_epochs: 40
125
+ gradient_clip_val: 1
126
+ log_gpu_memory: None
127
+ limit_train_batches: 25000
128
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
129
+ log_save_interval: 250
130
+ precision: 32
131
+ terminate_on_nan: false
132
+ check_val_every_n_epoch: 1
133
+ num_sanity_val_steps: 8
134
+ replace_sampler_ddp: false
135
+ resume_from_checkpoint: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-04_13-48-33_train_ablv2_work_ffc075_/models/last.ckpt
136
+ checkpoint_kwargs:
137
+ verbose: true
138
+ save_top_k: 5
139
+ save_last: true
140
+ period: 1
141
+ monitor: val_ssim_fid100_f1_total_mean
142
+ mode: max
lama-places/lama-fourier/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2456284b604786a88a38549432ddf2e73a5911f9868ea692b5122e89a5f1f54
3
+ size 313967681
lama-places/lama-fourier/models/last.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2456284b604786a88a38549432ddf2e73a5911f9868ea692b5122e89a5f1f54
3
+ size 313967681
lama-places/lama-regular/config.yaml ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: resume
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ resnet_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-05_17-08-35_train_ablv2_work_resume/samples
43
+ location:
44
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
45
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
46
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
47
+ data:
48
+ batch_size: 10
49
+ val_batch_size: 2
50
+ num_workers: 3
51
+ train:
52
+ indir: ${location.data_root_dir}/train
53
+ out_size: 256
54
+ mask_gen_kwargs:
55
+ irregular_proba: 1
56
+ irregular_kwargs:
57
+ max_angle: 4
58
+ max_len: 200
59
+ max_width: 100
60
+ max_times: 5
61
+ min_times: 1
62
+ box_proba: 1
63
+ box_kwargs:
64
+ margin: 10
65
+ bbox_min_size: 30
66
+ bbox_max_size: 150
67
+ max_times: 4
68
+ min_times: 1
69
+ segm_proba: 0
70
+ transform_variant: distortions
71
+ dataloader_kwargs:
72
+ batch_size: ${data.batch_size}
73
+ shuffle: true
74
+ num_workers: ${data.num_workers}
75
+ val:
76
+ indir: ${location.data_root_dir}/val
77
+ img_suffix: .png
78
+ dataloader_kwargs:
79
+ batch_size: ${data.val_batch_size}
80
+ shuffle: false
81
+ num_workers: ${data.num_workers}
82
+ visual_test:
83
+ indir: ${location.data_root_dir}/korean_test
84
+ img_suffix: _input.png
85
+ pad_out_to_modulo: 32
86
+ dataloader_kwargs:
87
+ batch_size: 1
88
+ shuffle: false
89
+ num_workers: ${data.num_workers}
90
+ generator:
91
+ kind: pix2pixhd_global
92
+ input_nc: 4
93
+ output_nc: 3
94
+ ngf: 64
95
+ n_downsampling: 3
96
+ n_blocks: 9
97
+ conv_kind: default
98
+ add_out_act: sigmoid
99
+ discriminator:
100
+ kind: pix2pixhd_nlayer
101
+ input_nc: 3
102
+ ndf: 64
103
+ n_layers: 4
104
+ evaluator:
105
+ kind: default
106
+ inpainted_key: inpainted
107
+ integral_kind: ssim_fid100_f1
108
+ trainer:
109
+ kwargs:
110
+ gpus: -1
111
+ distributed_backend: ddp
112
+ max_epochs: 40
113
+ gradient_clip_val: 1
114
+ log_gpu_memory: None
115
+ limit_train_batches: 25000
116
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
117
+ log_save_interval: 250
118
+ precision: 32
119
+ terminate_on_nan: false
120
+ check_val_every_n_epoch: 1
121
+ num_sanity_val_steps: 8
122
+ replace_sampler_ddp: false
123
+ resume_from_checkpoint: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-04_13-44-49_train_ablv2_work_/models/last.ckpt
124
+ checkpoint_kwargs:
125
+ verbose: true
126
+ save_top_k: 5
127
+ save_last: true
128
+ period: 1
129
+ monitor: val_ssim_fid100_f1_total_mean
130
+ mode: max
lama-places/lama-regular/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acb3a3693e0c0f363d4ee1a0d22aeb1dd7dcda6c84cb442d8d479131ff0b14b5
3
+ size 388021609
lama-places/lama_small_train_masks/config.yaml ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_title: resume
2
+ training_model:
3
+ kind: default
4
+ visualize_each_iters: 1000
5
+ concat_mask: true
6
+ store_discr_outputs_for_vis: true
7
+ losses:
8
+ l1:
9
+ weight_missing: 0
10
+ weight_known: 10
11
+ perceptual:
12
+ weight: 0
13
+ adversarial:
14
+ kind: r1
15
+ weight: 10
16
+ gp_coef: 0.001
17
+ mask_as_fake_target: true
18
+ allow_scale_mask: true
19
+ feature_matching:
20
+ weight: 100
21
+ resnet_pl:
22
+ weight: 30
23
+ weights_path: ${env:TORCH_HOME}
24
+ optimizers:
25
+ generator:
26
+ kind: adam
27
+ lr: 0.001
28
+ discriminator:
29
+ kind: adam
30
+ lr: 0.0001
31
+ visualizer:
32
+ key_order:
33
+ - image
34
+ - predicted_image
35
+ - discr_output_fake
36
+ - discr_output_real
37
+ - inpainted
38
+ rescale_keys:
39
+ - discr_output_fake
40
+ - discr_output_real
41
+ kind: directory
42
+ outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-05_17-04-06_train_ablv2_work_small_holes_resume/samples
43
+ location:
44
+ data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
45
+ out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
46
+ tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
47
+ data:
48
+ batch_size: 10
49
+ val_batch_size: 2
50
+ num_workers: 3
51
+ train:
52
+ indir: ${location.data_root_dir}/train
53
+ out_size: 256
54
+ mask_gen_kwargs:
55
+ irregular_proba: 1
56
+ irregular_kwargs:
57
+ max_angle: 4
58
+ max_len: 80
59
+ max_width: 40
60
+ max_times: 12
61
+ min_times: 4
62
+ box_proba: 1
63
+ box_kwargs:
64
+ margin: 0
65
+ bbox_min_size: 30
66
+ bbox_max_size: 128
67
+ max_times: 1
68
+ min_times: 1
69
+ segm_proba: 0
70
+ transform_variant: default
71
+ dataloader_kwargs:
72
+ batch_size: ${data.batch_size}
73
+ shuffle: true
74
+ num_workers: ${data.num_workers}
75
+ val:
76
+ indir: ${location.data_root_dir}/val
77
+ img_suffix: .png
78
+ dataloader_kwargs:
79
+ batch_size: ${data.val_batch_size}
80
+ shuffle: false
81
+ num_workers: ${data.num_workers}
82
+ visual_test:
83
+ indir: ${location.data_root_dir}/korean_test
84
+ img_suffix: _input.png
85
+ pad_out_to_modulo: 32
86
+ dataloader_kwargs:
87
+ batch_size: 1
88
+ shuffle: false
89
+ num_workers: ${data.num_workers}
90
+ generator:
91
+ kind: pix2pixhd_global
92
+ input_nc: 4
93
+ output_nc: 3
94
+ ngf: 64
95
+ n_downsampling: 3
96
+ n_blocks: 9
97
+ conv_kind: default
98
+ add_out_act: sigmoid
99
+ discriminator:
100
+ kind: pix2pixhd_nlayer
101
+ input_nc: 3
102
+ ndf: 64
103
+ n_layers: 4
104
+ evaluator:
105
+ kind: default
106
+ inpainted_key: inpainted
107
+ integral_kind: ssim_fid100_f1
108
+ trainer:
109
+ kwargs:
110
+ gpus: -1
111
+ distributed_backend: ddp
112
+ max_epochs: 40
113
+ gradient_clip_val: 1
114
+ log_gpu_memory: None
115
+ limit_train_batches: 25000
116
+ val_check_interval: ${trainer.kwargs.limit_train_batches}
117
+ log_save_interval: 250
118
+ precision: 32
119
+ terminate_on_nan: false
120
+ check_val_every_n_epoch: 1
121
+ num_sanity_val_steps: 8
122
+ replace_sampler_ddp: false
123
+ resume_from_checkpoint: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-04_15-09-38_train_ablv2_work_small_holes_/models/last.ckpt
124
+ checkpoint_kwargs:
125
+ verbose: true
126
+ save_top_k: 5
127
+ save_last: true
128
+ period: 1
129
+ monitor: val_ssim_fid100_f1_total_mean
130
+ mode: max
lama-places/lama_small_train_masks/models/best.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6423c4d504c5f135557b316ee6574983424a6078d591d332c97d243f46195e20
3
+ size 388021609