diff --git a/checkpoint-120000/optimizer.bin b/checkpoint-120000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac312bc6b6e58fcf082c842526793cee577b727d --- /dev/null +++ b/checkpoint-120000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4de4d7d6105ef49ae239ffcfb1fc365c86bdc872ac6190886fe6e4fc3613913 +size 6876841811 diff --git a/checkpoint-120000/random_states_0.pkl b/checkpoint-120000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..344d30037e061e112442b1cc712ff26701c27a57 --- /dev/null +++ b/checkpoint-120000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56cb28312d5f1e130321b558bae7822868c4783bbe4ef7342ec69c8f1d573fbd +size 14599 diff --git a/checkpoint-120000/scheduler.bin b/checkpoint-120000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..2eba023d6a44bc35d3b3e890a9a0d97f18affaba --- /dev/null +++ b/checkpoint-120000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db79196ccb783459ff3eff62483504671e8bd4c7f9ef2ec1f0c6dfef6da7df35 +size 563 diff --git a/checkpoint-120000/unet/config.json b/checkpoint-120000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-120000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-120000/unet/diffusion_pytorch_model.safetensors b/checkpoint-120000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d1ae8344549d5c11d058a0dff85cd469edd662d --- /dev/null +++ b/checkpoint-120000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97629b2a6602ae8759ff78a23c0190ac39fcd5296fffc1ad064905f298943dd +size 3438213624 diff --git a/checkpoint-150000/optimizer.bin b/checkpoint-150000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..c4a3057bb1d0d344a7ac9e8b8907137137143238 --- /dev/null +++ b/checkpoint-150000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b22ca2addfc23189331c9d9172236e257930ef6650f3e725781c77ba41db561c +size 6876841811 diff --git a/checkpoint-150000/random_states_0.pkl b/checkpoint-150000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c30d544e09ca042830a21efb2bb23968a3855188 --- /dev/null +++ b/checkpoint-150000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab02b4e2e19a2d5e71c374280050f4b8121ec2477279be4c6062e9396567d1d +size 14599 diff --git a/checkpoint-150000/scheduler.bin b/checkpoint-150000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d1dd14c3369e47c395c061eb20fe2358b4eeaac --- /dev/null +++ b/checkpoint-150000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03276cadfacf9ce73fff537820baa908221049cfce1b29e2f023191ed7d524e +size 563 diff --git a/checkpoint-150000/unet/config.json b/checkpoint-150000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-150000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-150000/unet/diffusion_pytorch_model.safetensors b/checkpoint-150000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..520953c5ca006ff67c5b1dad52bd9949c15fa049 --- /dev/null +++ b/checkpoint-150000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef30ef2209a38a8e91598f9419017f2a3c2b5024e09691eff52cc189060410aa +size 3438213624 diff --git a/checkpoint-180000/optimizer.bin b/checkpoint-180000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..28aa8f00f00bd34b3f553e5e67dc0f9dea875ef5 --- /dev/null +++ b/checkpoint-180000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c26ee751e83d7ac65186553683c4130bbdee45c687a0ec321fb42a5a1413f3f +size 6876841811 diff --git a/checkpoint-180000/random_states_0.pkl b/checkpoint-180000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..fe307bdb32378c1f722dcb7a5f1c15fdb1707ac2 --- /dev/null +++ b/checkpoint-180000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:982926dc7ba4365322950073305a310b74a179514481b56e930da5f023a23827 +size 14599 diff --git a/checkpoint-180000/scheduler.bin b/checkpoint-180000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..318e4094dc340988dae1cf2935be77bc8aefcc18 --- /dev/null +++ b/checkpoint-180000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee9d9f25e581737fcb1e7f46dfbee0df90021e5b2c4692dd2996e88e2a4a323 +size 563 diff --git a/checkpoint-180000/unet/config.json b/checkpoint-180000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-180000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-180000/unet/diffusion_pytorch_model.safetensors b/checkpoint-180000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..109bb60e230f1c42ea1e4d64b2cc4d971ba345bf --- /dev/null +++ b/checkpoint-180000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffabc13af6fe111b01b1725970e15e3c9300697dd0c4888997338a425859546 +size 3438213624 diff --git a/checkpoint-210000/optimizer.bin b/checkpoint-210000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..46514e7b62f0d18c91e02fe5ad23615a19a4b233 --- /dev/null +++ b/checkpoint-210000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d642e3e0d0ec5363a5e167226257cb31be62ecd47da08e8554857227b69e7393 +size 6876841811 diff --git a/checkpoint-210000/random_states_0.pkl b/checkpoint-210000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..9ede59f67285948d23d5fc72b4f283a61ce5bb14 --- /dev/null +++ b/checkpoint-210000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:165aa162eb3d486b971f4f6369e4b73701f08367028d6e6b9ef59be151144d65 +size 14599 diff --git a/checkpoint-210000/scheduler.bin b/checkpoint-210000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..be3072a7dcab423e5a6844490bb42d27c29fa61e --- /dev/null +++ b/checkpoint-210000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:279b134570854f65e35c3a2519f09ee9b6ebef47ef1bd7765b8d27b76a0e16a4 +size 563 diff --git a/checkpoint-210000/unet/config.json b/checkpoint-210000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-210000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-210000/unet/diffusion_pytorch_model.safetensors b/checkpoint-210000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..007f258208cadd7ef7d4dc11319b3fef96f09efd --- /dev/null +++ b/checkpoint-210000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100270c75114d5ea6130c857290250f1f6ba2cb59012589cb1f831c9cdcec16c +size 3438213624 diff --git a/checkpoint-240000/optimizer.bin b/checkpoint-240000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..a7f88c0e377fc5f5e4685c5af9b5d94e4d8807b4 --- /dev/null +++ b/checkpoint-240000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca73f930c918ebf15521145eed27644ca13f6baa103474b2f5a8b94fdc303e0 +size 6876841811 diff --git a/checkpoint-240000/random_states_0.pkl b/checkpoint-240000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a56ebe353955fea1aa1e8b1bab874176312280ca --- /dev/null +++ b/checkpoint-240000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac09614e25c3ca2054ca8b014440f3dcb6ea6faee49f71e5acceb5984dcf34f8 +size 14599 diff --git a/checkpoint-240000/scheduler.bin b/checkpoint-240000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..501cad3edca1a5dc34098a1e6109df562ceed4ce --- /dev/null +++ b/checkpoint-240000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:570f92a6d849ca8c7083bc7c9000e4641474c77dba3e2e546601d2eaa8390a02 +size 563 diff --git a/checkpoint-240000/unet/config.json b/checkpoint-240000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-240000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-240000/unet/diffusion_pytorch_model.safetensors b/checkpoint-240000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c41e5ba9da4705329efa3bd296d93a5ec46562c --- /dev/null +++ b/checkpoint-240000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbafc55d3fa24d2d7885da80ec23be6a849c62b3c04b25fa74daa60b37669489 +size 3438213624 diff --git a/checkpoint-270000/optimizer.bin b/checkpoint-270000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..82a631150f2ac934982d364eb24f93cb8b757369 --- /dev/null +++ b/checkpoint-270000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359dc4a62e2d010991ca5a735411d8d94d31a37c0a5851f0ca2686f191ff2339 +size 6876841811 diff --git a/checkpoint-270000/random_states_0.pkl b/checkpoint-270000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..9ef55ebbf0dd788ba82f5d84529585335f05a042 --- /dev/null +++ b/checkpoint-270000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae3637653c0e62a39a91b66b014967bfe54ab847922774663e7f399e519f3d9 +size 14599 diff --git a/checkpoint-270000/scheduler.bin b/checkpoint-270000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..c852978733c7b22b18f1508ca7fb18249d306780 --- /dev/null +++ b/checkpoint-270000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8917bcb80dfa8bf628446a89b18b16b04b25ea9d50d3de5d65aae40273aa282b +size 563 diff --git a/checkpoint-270000/unet/config.json b/checkpoint-270000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-270000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-270000/unet/diffusion_pytorch_model.safetensors b/checkpoint-270000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d7a5741530e747e1d70797f1884e5a4f745e6a9a --- /dev/null +++ b/checkpoint-270000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68a5fcbe914479a1a208f59ac21d342c7a493c6ec128c72c9a3c16fc02489f0 +size 3438213624 diff --git a/checkpoint-30000/optimizer.bin b/checkpoint-30000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..70b2bc0cfed9c956b0a03e86f62f75a073dcd02d --- /dev/null +++ b/checkpoint-30000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c64a530884af1feb4129197e0fcdfb058eb5f8763e13261a8eb36d597f0f636 +size 6876841811 diff --git a/checkpoint-30000/random_states_0.pkl b/checkpoint-30000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0d1a1a28c03564bce6e363175aa7c2c7e1252ccd --- /dev/null +++ b/checkpoint-30000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:187101d5c73a033a42577b157a6cbad2b00ee7257d5bee2f0acd96c92a5a86ce +size 14599 diff --git a/checkpoint-30000/scheduler.bin b/checkpoint-30000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..942af45453a36b8e1c669b95f8b8643963d217fa --- /dev/null +++ b/checkpoint-30000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31cccaa8c27dbc041ed70da0594aee04359be4f1878b6d9ca03fcd1b8eb819f4 +size 563 diff --git a/checkpoint-30000/unet/config.json b/checkpoint-30000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-30000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-30000/unet/diffusion_pytorch_model.safetensors b/checkpoint-30000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7280037077bd70285c972c5d05fb5b9d6f978e3a --- /dev/null +++ b/checkpoint-30000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a0a0d515c404b69ded80afad086dad656df5d84ec714dcc22e52d65b9a65a5 +size 3438213624 diff --git a/checkpoint-300000/optimizer.bin b/checkpoint-300000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..5aa3cf0d224b01b221b325ef8372432c55c0815a --- /dev/null +++ b/checkpoint-300000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b5215e8cd5e5f9cf1e7080334666d5e918527adfe6a3f91152bfd77f5ae850 +size 6876841811 diff --git a/checkpoint-300000/random_states_0.pkl b/checkpoint-300000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..23cf2fe5d483743c10d4a3ff6464abd9a7c44b15 --- /dev/null +++ b/checkpoint-300000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21823413484314b467301157cb75bc86f5656c5eeaab6ec4afe2156c738568b +size 14599 diff --git a/checkpoint-300000/scheduler.bin b/checkpoint-300000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..d55855248498b5e9adc57796e4f33353dc5223ab --- /dev/null +++ b/checkpoint-300000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f1e2317888ed71fb8af112371e08364f85393a736a5d73210d87b0d090394ef +size 563 diff --git a/checkpoint-300000/unet/config.json b/checkpoint-300000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-300000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-300000/unet/diffusion_pytorch_model.safetensors b/checkpoint-300000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d61e9c35f9e9006ab06619f3f5cbbf4a150c3cfd --- /dev/null +++ b/checkpoint-300000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6742d235c25ecaad87810f00f7dd58a18a9209ae6925e073e63465d46e7d6c15 +size 3438213624 diff --git a/checkpoint-60000/optimizer.bin b/checkpoint-60000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..c16126876e5102ae33bb2f46e35fcc5f2c37505d --- /dev/null +++ b/checkpoint-60000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9dbdb287d08d5e2351d920478287bed276a0b3a9f6fd7f2781fb72de078fe5 +size 6876841811 diff --git a/checkpoint-60000/random_states_0.pkl b/checkpoint-60000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..9d66d9a27a17b03d620278deeac203b2574ca8a4 --- /dev/null +++ b/checkpoint-60000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8884ac4f9e1e4ee190d85e2a542f466b7e1e762f10eb8132938ee59176fc5f84 +size 14599 diff --git a/checkpoint-60000/scheduler.bin b/checkpoint-60000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..3033938c7e44e6a1e4fc753eec81d5ee2a4db0de --- /dev/null +++ b/checkpoint-60000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b5e103328555ea5469e73fddb0f9f1ceb827ff21f8b9ee76cc50fbe1a231db +size 563 diff --git a/checkpoint-60000/unet/config.json b/checkpoint-60000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-60000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-60000/unet/diffusion_pytorch_model.safetensors b/checkpoint-60000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6bb5353d7e923b91f56c2de27a68a2b8000dfdf0 --- /dev/null +++ b/checkpoint-60000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c69053db033d9a60dcd1e562a00776a573cc484e6b47bfec459a5d479e4ab38 +size 3438213624 diff --git a/checkpoint-90000/optimizer.bin b/checkpoint-90000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..10f9e0668de82f0044dfae23cc1c92b9f0935f60 --- /dev/null +++ b/checkpoint-90000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289347f34ff33d870ded1a693030e1e549354c8ce149abdb20d44218c10bdade +size 6876841811 diff --git a/checkpoint-90000/random_states_0.pkl b/checkpoint-90000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0c0556dcaf2254c6b3ca7ad165659465467ce7c8 --- /dev/null +++ b/checkpoint-90000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beabc57ba78c5f5f575a6dbef95964c431245f971a33721c23e2183a796f8a77 +size 14599 diff --git a/checkpoint-90000/scheduler.bin b/checkpoint-90000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..e04def315cc5fed60ff7c64f52511f0c4c96a736 --- /dev/null +++ b/checkpoint-90000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9778701b5bb648a2128fd0375ace83370d1fb400dfb73319e419b8831f7d9a7a +size 563 diff --git a/checkpoint-90000/unet/config.json b/checkpoint-90000/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0eb05dd5d134ed55aab553fdcbc03ba9c0be269 --- /dev/null +++ b/checkpoint-90000/unet/config.json @@ -0,0 +1,68 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.24.0", + "_name_or_path": "riffusion/riffusion-model-v1", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "conv_out_kernel": 3, + "cross_attention_dim": 768, + "cross_attention_norm": null, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 8, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_out_scale_factor": 1.0, + "resnet_skip_time_act": false, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 32, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-90000/unet/diffusion_pytorch_model.safetensors b/checkpoint-90000/unet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd878c981bd7695d3a18e25d58165e8198975bbb --- /dev/null +++ b/checkpoint-90000/unet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d111e0b16ebe270d5cebfbf57d88fd92801cac5f13c1ba4dd4edc39198508dc1 +size 3438213624 diff --git a/unet/diffusion_pytorch_model.safetensors b/unet/diffusion_pytorch_model.safetensors index ebfe19f1e1295ad3784be73452bf525d9e19bfda..d61e9c35f9e9006ab06619f3f5cbbf4a150c3cfd 100644 --- a/unet/diffusion_pytorch_model.safetensors +++ b/unet/diffusion_pytorch_model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:257cbdcade13ae968ef000347d90c96ed275fb2b4f28fbed0c4080a45dcb6329 +oid sha256:6742d235c25ecaad87810f00f7dd58a18a9209ae6925e073e63465d46e7d6c15 size 3438213624