HReynaud committed on
Commit
9d095b0
1 Parent(s): dd15266

upload weights

Browse files
1SCM_v2/config.yaml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ unets:
2
+ unet1:
3
+ dim: 64
4
+ num_resnet_blocks: 2
5
+ dim_mults:
6
+ - 1
7
+ - 2
8
+ - 4
9
+ max_text_len: 1
10
+ layer_attns: false
11
+ layer_cross_attns:
12
+ - false
13
+ - false
14
+ - true
15
+ cond_images_channels: 3
16
+ attend_at_middle: false
17
+ imagen:
18
+ condition_on_text: true
19
+ image_sizes:
20
+ - 112
21
+ text_embed_dim: 1
22
+ num_sample_steps: 64
23
+ temporal_downsample_factor:
24
+ - 1
25
+ lowres_sample_noise_level: 0.2
26
+ sigma_min: 0.002
27
+ sigma_max: 80
28
+ sigma_data: 0.25
29
+ rho: 7
30
+ P_mean: -1.2
31
+ P_std: 1.2
32
+ S_churn: 160
33
+ S_tmin: 0.05
34
+ S_tmax: 50
35
+ S_noise: 1.003
36
+ trainer:
37
+ split_batches: false
38
+ lr: 0.0005
39
+ dl_tuple_output_keywords_names:
40
+ - images
41
+ - text_embeds
42
+ - cond_images
43
+ dataset:
44
+ data_path: /path/to/EchoNet-Dynamic
45
+ deactivate_cache: false
46
+ fps: 8
47
+ duration: 2.0
48
+ grayscale: false
49
+ dataloader:
50
+ batch_size: 8
51
+ num_workers: 8
52
+ wandb:
53
+ project: EchoDiffusion
54
+ # entity: your-login
55
+ checkpoint:
56
+ path: /path/to/checkpoints
57
+ batch_size: 4
58
+ cond_scale: 5.0
59
+ save_every_x_it: 5000
1SCM_v2/merged.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:724eb5f0580198979f174dd41ee3747ee8c8cc73ebcbdff973f7682ab00b1e74
3
+ size 300968361
2SCM_v6/config.yaml ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ unets:
2
+ unet1:
3
+ dim: 64
4
+ num_resnet_blocks: 2
5
+ dim_mults:
6
+ - 1
7
+ - 2
8
+ - 4
9
+ max_text_len: 1
10
+ layer_attns: false
11
+ layer_cross_attns:
12
+ - false
13
+ - false
14
+ - true
15
+ cond_images_channels: 3
16
+ unet2:
17
+ dim: 64
18
+ num_resnet_blocks: 2
19
+ dim_mults:
20
+ - 1
21
+ - 2
22
+ - 4
23
+ max_text_len: 1
24
+ layer_attns: false
25
+ layer_cross_attns:
26
+ - false
27
+ - false
28
+ - true
29
+ memory_efficient: true
30
+ cond_images_channels: 3
31
+ imagen:
32
+ elucidated: true
33
+ condition_on_text: true
34
+ image_sizes:
35
+ - 56
36
+ - 112
37
+ text_embed_dim: 1
38
+ num_sample_steps:
39
+ - 32
40
+ - 64
41
+ random_crop_sizes:
42
+ - null
43
+ - 56
44
+ temporal_downsample_factor:
45
+ - 4
46
+ - 1
47
+ sigma_min: 0.002
48
+ sigma_max: 80
49
+ sigma_data: 0.25
50
+ rho: 7
51
+ P_mean: -1.2
52
+ P_std: 1.2
53
+ S_churn:
54
+ - 80
55
+ - 160
56
+ S_tmin: 0.05
57
+ S_tmax: 50
58
+ S_noise: 1.003
59
+ resize_mode: trilinear
60
+ trainer:
61
+ split_batches: false
62
+ lr: 0.0005
63
+ dl_tuple_output_keywords_names:
64
+ - images
65
+ - text_embeds
66
+ - cond_images
67
+ dataset:
68
+ data_path: /path/to/EchoNet-Dynamic
69
+ deactivate_cache: false
70
+ fps: 32
71
+ duration: 2.0
72
+ grayscale: false
73
+ dataloader:
74
+ batch_size: 8
75
+ num_workers: 8
76
+ wandb:
77
+ project: EchoDiffusion
78
+ # entity: your-login
79
+ checkpoint:
80
+ path: /path/to/checkpoints
81
+ batch_size: 4
82
+ cond_scale: 5.0
83
+ save_every_x_it: 5000
2SCM_v6/merged.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daf9c964854734145651c69540e8befdad3ed741b8cefa4ca85fd11cf6d2f353
3
+ size 755800751
4SCM_v2/config.yaml ADDED
@@ -0,0 +1,119 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ unets:
2
+ unet1:
3
+ dim: 64
4
+ num_resnet_blocks: 2
5
+ dim_mults:
6
+ - 1
7
+ - 2
8
+ - 4
9
+ max_text_len: 1
10
+ layer_attns: false
11
+ layer_cross_attns:
12
+ - false
13
+ - false
14
+ - true
15
+ cond_images_channels: 3
16
+ unet2:
17
+ dim: 64
18
+ num_resnet_blocks: 2
19
+ dim_mults:
20
+ - 1
21
+ - 2
22
+ - 4
23
+ max_text_len: 1
24
+ layer_attns: false
25
+ layer_cross_attns:
26
+ - false
27
+ - false
28
+ - true
29
+ memory_efficient: true
30
+ cond_images_channels: 3
31
+ unet3:
32
+ dim: 64
33
+ num_resnet_blocks: 2
34
+ dim_mults:
35
+ - 1
36
+ - 2
37
+ - 4
38
+ max_text_len: 1
39
+ layer_attns: false
40
+ layer_cross_attns:
41
+ - false
42
+ - false
43
+ - true
44
+ memory_efficient: true
45
+ cond_images_channels: 3
46
+ unet4:
47
+ dim: 64
48
+ num_resnet_blocks: 2
49
+ dim_mults:
50
+ - 1
51
+ - 2
52
+ - 4
53
+ max_text_len: 1
54
+ layer_attns: false
55
+ layer_cross_attns: false
56
+ cond_images_channels: 3
57
+ attend_at_middle: false
58
+ imagen:
59
+ condition_on_text: true
60
+ image_sizes:
61
+ - 56
62
+ - 56
63
+ - 56
64
+ - 112
65
+ text_embed_dim: 1
66
+ num_sample_steps:
67
+ - 32
68
+ - 32
69
+ - 32
70
+ - 64
71
+ random_crop_sizes:
72
+ - null
73
+ - null
74
+ - null
75
+ - 56
76
+ temporal_downsample_factor:
77
+ - 4
78
+ - 2
79
+ - 1
80
+ - 1
81
+ lowres_sample_noise_level: 0.2
82
+ sigma_min: 0.002
83
+ sigma_max: 80
84
+ sigma_data: 0.25
85
+ rho: 7
86
+ P_mean: -1.2
87
+ P_std: 1.2
88
+ S_churn:
89
+ - 40
90
+ - 80
91
+ - 160
92
+ - 160
93
+ S_tmin: 0.05
94
+ S_tmax: 50
95
+ S_noise: 1.003
96
+ trainer:
97
+ split_batches: false
98
+ lr: 0.0005
99
+ dl_tuple_output_keywords_names:
100
+ - images
101
+ - text_embeds
102
+ - cond_images
103
+ dataset:
104
+ data_path: /path/to/EchoNet-Dynamic
105
+ deactivate_cache: false
106
+ fps: 32
107
+ duration: 2.0
108
+ grayscale: false
109
+ dataloader:
110
+ batch_size: 8
111
+ num_workers: 8
112
+ wandb:
113
+ project: EchoDiffusion
114
+ # entity: your-login
115
+ checkpoint:
116
+ path: /path/to/checkpoints
117
+ batch_size: 4
118
+ cond_scale: 5.0
119
+ save_every_x_it: 5000
4SCM_v2/merged.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:906f18d1665c69a69f3f65c201d08b63c2557a60ffdac700fec84d2b29c6774e
3
+ size 1523781649
README.md CHANGED
@@ -1,3 +1,18 @@
1
  ---
2
  license: gpl-2.0
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: gpl-2.0
3
  ---
4
+
5
+ This repository contains the three models described in *Feature-Conditioned Cascaded Video Diffusion Models for Precise Echocardiogram Synthesis* by Hadrien Reynaud, Mengyun Qiao, Mischa Dombrowski, Thomas Day, Reza Razavi, Alberto Gomez, Paul Leeson and Bernhard Kainz (2023).
6
+
7
+ To see all the details, refer to the corresponding github repository: [https://github.com/HReynaud/EchoDiffusion](https://github.com/HReynaud/EchoDiffusion).
8
+
9
+ The available models are:
10
+ - 1SCM: Single Stage Cascade Model
11
+ - 2SCM: Two Stage Cascade Model
12
+ - 4SCM: Four Stage Cascade Model
13
+
14
+ All weight files contain the weights of all the diffusion models in the cascade.
15
+ To see a demo of the 1SCM, head to [https://huggingface.co/spaces/HReynaud/echocardiogram-video-diffusion](https://huggingface.co/spaces/HReynaud/echocardiogram-video-diffusion).
16
+
17
+ In each model folder, you will find:
18
+ - `config.yaml`: the configuration file associated with the model. It contains the hyperparameters of the model.