Epoch 0
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitignore +2 -0
- checkpoint-1000/optimizer.bin +3 -0
- checkpoint-1000/random_states_0.pkl +3 -0
- checkpoint-1000/scaler.pt +3 -0
- checkpoint-1000/scheduler.bin +3 -0
- checkpoint-1000/unet/config.json +60 -0
- checkpoint-1000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-1000/unet_ema/config.json +67 -0
- checkpoint-1000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-1500/optimizer.bin +3 -0
- checkpoint-1500/random_states_0.pkl +3 -0
- checkpoint-1500/scaler.pt +3 -0
- checkpoint-1500/scheduler.bin +3 -0
- checkpoint-1500/unet/config.json +60 -0
- checkpoint-1500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-1500/unet_ema/config.json +67 -0
- checkpoint-1500/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-2000/optimizer.bin +3 -0
- checkpoint-2000/random_states_0.pkl +3 -0
- checkpoint-2000/scaler.pt +3 -0
- checkpoint-2000/scheduler.bin +3 -0
- checkpoint-2000/unet/config.json +60 -0
- checkpoint-2000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-2000/unet_ema/config.json +67 -0
- checkpoint-2000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-2500/optimizer.bin +3 -0
- checkpoint-2500/random_states_0.pkl +3 -0
- checkpoint-2500/scaler.pt +3 -0
- checkpoint-2500/scheduler.bin +3 -0
- checkpoint-2500/unet/config.json +60 -0
- checkpoint-2500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-2500/unet_ema/config.json +67 -0
- checkpoint-2500/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-3000/optimizer.bin +3 -0
- checkpoint-3000/random_states_0.pkl +3 -0
- checkpoint-3000/scaler.pt +3 -0
- checkpoint-3000/scheduler.bin +3 -0
- checkpoint-3000/unet/config.json +60 -0
- checkpoint-3000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-3000/unet_ema/config.json +67 -0
- checkpoint-3000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-500/optimizer.bin +3 -0
- checkpoint-500/random_states_0.pkl +3 -0
- checkpoint-500/scaler.pt +3 -0
- checkpoint-500/scheduler.bin +3 -0
- checkpoint-500/unet/config.json +60 -0
- checkpoint-500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-500/unet_ema/config.json +67 -0
- checkpoint-500/unet_ema/diffusion_pytorch_model.bin +3 -0
- model_index.json +12 -0
.gitignore
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
step_*
|
2 |
+
epoch_*
|
checkpoint-1000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a77936f971d8d2ea1acd4422d4db8c237425dbc060d925dd62900f4163bd96a9
|
3 |
+
size 73251413
|
checkpoint-1000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de63daf99e1e85577a98eb464946bfdf57af9cf3d994a1890c117f900500e031
|
3 |
+
size 14663
|
checkpoint-1000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68cff80b680ddf6e7abbef98b5f336b97f9b5963e2209307f639383870e8cc71
|
3 |
+
size 557
|
checkpoint-1000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7223915606ffeb4740373e378fc6ee25a8063899d81b73e9d9630a18bf386915
|
3 |
+
size 563
|
checkpoint-1000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-1000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0477eb3c3da58436fe7693878f450a3e69f7433db4b6d64148040d747932e0a4
|
3 |
+
size 36621969
|
checkpoint-1000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 1000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-1000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fc32e94b6f9c420a0f6bedd1b118084b0245e5eb2a629bb0a42890f0fcb290e
|
3 |
+
size 36616081
|
checkpoint-1500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:388a25582110c6010f1d4b7fbda1d958a222789efcac65af04579d360123fe67
|
3 |
+
size 73251413
|
checkpoint-1500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86ed5ce96de2e3c8754ac07d03c8821c114ad84b467e60f3b26e38ffa8f2f3a6
|
3 |
+
size 14663
|
checkpoint-1500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:203a72d6c29f42a0e2964fdddc8d7a98df1eccee78fea9de0fa416613390f5c6
|
3 |
+
size 557
|
checkpoint-1500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1bc53d21d5be22242495d40019e29e447be310bc47a92764b1589cb8c4e4483
|
3 |
+
size 563
|
checkpoint-1500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-1500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8add4a43c1a1db5684f0d2cd55111c1913da47423f7cee6b3a20332752863cf
|
3 |
+
size 36621969
|
checkpoint-1500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 1500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-1500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e74396c9b33addec059b775ab45cd1cf68977d48595193d5f5bc1050374b3c83
|
3 |
+
size 36616081
|
checkpoint-2000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa19110b484d3e8835f8af390579d747dc676c6d6fb88470b470a9868d876067
|
3 |
+
size 73251413
|
checkpoint-2000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e9469ece6dcdb0453cef4fc90f3a4c75c62f81cee97472304b775164a5bcc11
|
3 |
+
size 14663
|
checkpoint-2000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd2de9749828adacdf103bf6e9592702bb7067a2c1df27dd62ab38c1eb8c070f
|
3 |
+
size 557
|
checkpoint-2000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cc6a2e9846582647ba829a5cab5e19379ab6169fd378876d9a2c2b5a948f3fb
|
3 |
+
size 563
|
checkpoint-2000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-2000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f031e9cc3237b6887c68efab79a28c90b749773e6666cdddc8c8baed3252c5c5
|
3 |
+
size 36621969
|
checkpoint-2000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 2000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-2000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87774ed9e33e0d376e35fce7d12b616f01f6f11465633254672a6d003395b9ce
|
3 |
+
size 36616081
|
checkpoint-2500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33a5906232d8b5340b2798a2386d794822167bb0c50067a05cf640f19fe5fab1
|
3 |
+
size 73251413
|
checkpoint-2500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50c0cb8597bad2e92fd83ebd2e3f8b2a93db3b2c2a08002c5904d457e207a498
|
3 |
+
size 14663
|
checkpoint-2500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fbcebc8f5487b0c117b5dd47f2ea304af3eebf408d297118d9307e1223927e1
|
3 |
+
size 557
|
checkpoint-2500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdee5d0999ddc7c72ad066f56b8124a7730e2bdf658fa2439ba19b02cd9f42a4
|
3 |
+
size 563
|
checkpoint-2500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-2500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82129e54faee0789504b93182c5be5e4e3b420b5abbb9f06be442fcef356877b
|
3 |
+
size 36621969
|
checkpoint-2500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 2500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-2500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2e218d62ccfb426d69e9fd9cd48f1039f86bd27f0fc5ecd18c4ccb3983ea5b0
|
3 |
+
size 36616081
|
checkpoint-3000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f56cda5f86ba292b1597f9730a62f9cb225895fb8d7a29067a761a00df701ba
|
3 |
+
size 73251413
|
checkpoint-3000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3068affad1a930678c6735175ca5d3dfa0984dc67a3962b2497b204ebeb3ef5
|
3 |
+
size 14663
|
checkpoint-3000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb1f9398b77268202e8e1465734a63d123b1ef11c27f20f2473677e9883a6869
|
3 |
+
size 557
|
checkpoint-3000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c7d765e228e9ca3b9dccd3fd0195cdbf25c24ea82c4bcf3f3ac6bd257583232
|
3 |
+
size 563
|
checkpoint-3000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-3000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad5eb4c3197ea5ddf0ab55d38cb1e20a8ca3aebf01cb5df5dd940a75bcf2b167
|
3 |
+
size 36621969
|
checkpoint-3000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 3000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-3000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:676b476c0f696e91d8fe7792584f22e2b6d430837768412307a6aacb2b29c576
|
3 |
+
size 36616081
|
checkpoint-500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56d7698aa7b35cbea9ce99010e5f33918567c9e960274198f4228d9fa0fc4aa9
|
3 |
+
size 73251413
|
checkpoint-500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77af94b4d3fc305349206cfc5301339c4d0593d60b943db6d53a25e2d2f57af9
|
3 |
+
size 14663
|
checkpoint-500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3f196a54202bb4ba1220e8c59f42f9cda0702d68ea83147d814c2fb2f36b8f2
|
3 |
+
size 557
|
checkpoint-500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1eedad58536ac188d101845e13deb36e3aca8514e3298625b0fb265ebd7ea7a
|
3 |
+
size 563
|
checkpoint-500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:506c50a28416c82c4ed9476e0dfeda6135694134ec4e0ea046aba0b7b719d743
|
3 |
+
size 36621969
|
checkpoint-500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58d7b1b09e4b5d30175b767403b8ec619ef8d23ef4938369b4a7de08166e68ce
|
3 |
+
size 36616081
|
model_index.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "LayoutDDPMPipeline",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"scheduler": [
|
5 |
+
"diffusers",
|
6 |
+
"DDPMScheduler"
|
7 |
+
],
|
8 |
+
"unet": [
|
9 |
+
"diffusers",
|
10 |
+
"UNet2DConditionModel"
|
11 |
+
]
|
12 |
+
}
|