diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0cd258f48f64b24e208210dfa1e3b3313b8b485c --- /dev/null +++ b/README.md @@ -0,0 +1,53 @@ +--- +license: creativeml-openrail-m +library_name: diffusers +tags: +- stable-diffusion +- stable-diffusion-diffusers +- text-to-image +- diffusers +- controlnet +- diffusers-training +base_model: runwayml/stable-diffusion-v1-5 +inference: true +--- + + + + +# controlnet-louistichelman/controlnet_streetview_seg_bins_safety_simple + +These are controlnet weights trained on runwayml/stable-diffusion-v1-5 with a new type of conditioning. +You can find some example images below. + +prompt: A realistic and safe-looking google streetview image taken in the USA. +![images_0)](./images_0.png) +prompt: A realistic and dangerous-looking google streetview image taken in the USA. +![images_1)](./images_1.png) +prompt: A realistic and google streetview image taken in Israel. +![images_2)](./images_2.png) +prompt: A realistic and google streetview image taken in Japan. +![images_3)](./images_3.png) +prompt: A realistic and safe-looking google streetview image taken in Mexico. +![images_4)](./images_4.png) +prompt: A realistic and dangerous-looking google streetview image taken in Mexico. 
+![images_5)](./images_5.png) + + + +## Intended uses & limitations + +#### How to use + +```python +# TODO: add an example code snippet for running this diffusion pipeline +``` + +#### Limitations and bias + +[TODO: provide examples of latent issues and potential remediations] + +## Training details + +[TODO: describe the data used to train the model] \ No newline at end of file diff --git a/checkpoint-10000/controlnet/config.json b/checkpoint-10000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-10000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors 
b/checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08b5e139d55807f513099b6797ec6c30828424fc --- /dev/null +++ b/checkpoint-10000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45631202cb107894653fccfbef977d6a6fc5fc23ec95fc04b07f41c06a298d19 +size 1445157120 diff --git a/checkpoint-10000/optimizer.bin b/checkpoint-10000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b8cdcea39a8dde10e2feace51b0add5e02c1128 --- /dev/null +++ b/checkpoint-10000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e445474c9729ae1238d95107313052095b686b806bfda16fbab6f6a58b82d56 +size 2890518478 diff --git a/checkpoint-10000/random_states_0.pkl b/checkpoint-10000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..16ec37da7c72d3f633e4c53319571786a8abd87e --- /dev/null +++ b/checkpoint-10000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f874f5153612302c35f941acfb86b21724c19f694b2ac1ced9462c152c08e1ef +size 14344 diff --git a/checkpoint-10000/scheduler.bin b/checkpoint-10000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..404dfd6422eb26d29b37d4327709c308ac4d1907 --- /dev/null +++ b/checkpoint-10000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d31ad9a5150e341b638f838a47b3cb3db0d48efa493bcc8d1f8bf787b2c8cee3 +size 1000 diff --git a/checkpoint-15000/controlnet/config.json b/checkpoint-15000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-15000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + 
"addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-15000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-15000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2666d15f9ece4857c3e1b5f91808253bdc5661c6 --- /dev/null +++ b/checkpoint-15000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b87b4d309dcc6d4f44efebe0b4ee3d47dd5f29827d1ce1ba20f2ad3529bf503 +size 1445157120 diff --git a/checkpoint-15000/optimizer.bin b/checkpoint-15000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..06faf40df2af82df888648c1384c4f5d6c574f76 --- /dev/null +++ b/checkpoint-15000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:5acc7bd73c668b22b6a56f22b4ad799e03101f99cd49bfe382b701a354887089 +size 2890518478 diff --git a/checkpoint-15000/random_states_0.pkl b/checkpoint-15000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..746a2d31588e61b7341b285a904f50611eb7da75 --- /dev/null +++ b/checkpoint-15000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458adf2f28fe49d0d25c1fb8894fba0c7713144f2f734284fdd43ebf75cb4559 +size 14408 diff --git a/checkpoint-15000/scheduler.bin b/checkpoint-15000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b446f749a0637774df7577a25badd8627d7bdcf --- /dev/null +++ b/checkpoint-15000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f8cb1c00499c9a11be98e1d3df14acb1c3f608844e19988fc0598608b723e0 +size 1000 diff --git a/checkpoint-20000/controlnet/config.json b/checkpoint-20000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-20000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + 
"mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-20000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-20000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eac5fccec48fca9e987ec6afee53a01de075ac3e --- /dev/null +++ b/checkpoint-20000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b82d2db14ba5585925fd5abe1b89babda53de5231b0f8d20aefe4e5690e45b +size 1445157120 diff --git a/checkpoint-20000/optimizer.bin b/checkpoint-20000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..721bcf6f8bea2dd66375cac4b4b2a0ac49fde863 --- /dev/null +++ b/checkpoint-20000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b53c5aff705d0240663566685d590f7c69de3f989aa49c4d510da17b673f73c +size 2890518478 diff --git a/checkpoint-20000/random_states_0.pkl b/checkpoint-20000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a0518c7028f165925dec84fa63123793048b2302 --- /dev/null +++ b/checkpoint-20000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb08a605d3f29e5acea53e7afdfc21d83f6a260ae9d8d25aab846766526d31d +size 14344 diff --git a/checkpoint-20000/scheduler.bin b/checkpoint-20000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..86c15d06a20918c0bcdf8341881c0f1294ac62e3 --- /dev/null +++ b/checkpoint-20000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:51e0d744a95b954d01691d43399197ed4341f27678cc9bb35b811a7c14d85702 +size 1000 diff --git a/checkpoint-25000/controlnet/config.json b/checkpoint-25000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-25000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-25000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-25000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ffc81991f104108b16b94e9f2b91b69887e1da2 --- /dev/null +++ b/checkpoint-25000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:225be6aafcd9bca7e0099ee8dc60f579095888793431b1323a9739574cf07c73 +size 1445157120 diff --git a/checkpoint-25000/optimizer.bin b/checkpoint-25000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..32a4e277b54f8e1c0730012b7cd84953737c6b57 --- /dev/null +++ b/checkpoint-25000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f04e8c4901d1a1ef434e660094180b95d6e6450f3460d64bae243a3fee4b83 +size 2890518478 diff --git a/checkpoint-25000/random_states_0.pkl b/checkpoint-25000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0a189d3373e1bb48711906438acb4ca366f21cdf --- /dev/null +++ b/checkpoint-25000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:811235d8f5012159715e7d2be928f754807f020ad90b38cde1c40c37655fb85b +size 14344 diff --git a/checkpoint-25000/scheduler.bin b/checkpoint-25000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..41bec17875142463bc9b16c71d2054658885748b --- /dev/null +++ b/checkpoint-25000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d095dfcbafb08fe578bbdae5202ad1cb8a6b5023afa619ce1ad50ba348cc0a86 +size 1000 diff --git a/checkpoint-30000/controlnet/config.json b/checkpoint-30000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-30000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 
96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-30000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-30000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..82179b316eea4f4afe18b61c7fb0f175364850d1 --- /dev/null +++ b/checkpoint-30000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a8186d6998d575fbe43bd999afbc6d2a92e44b9006daf316900bd6ab11c398 +size 1445157120 diff --git a/checkpoint-30000/optimizer.bin b/checkpoint-30000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..098562848686fe47b9d7bb55397ad030f100e4b8 --- /dev/null +++ b/checkpoint-30000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3427437c0a4a91764e97c6285a0c8370eea7453b76d98fd04de75400570d61 +size 2890518478 diff --git a/checkpoint-30000/random_states_0.pkl b/checkpoint-30000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..f2f86f9689aba8e6525b89a327a3667b7e5d08f2 --- /dev/null +++ b/checkpoint-30000/random_states_0.pkl @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:cd4fdfb012794b425a931e378aa1584c8a39c93f33309e573ec30314f5298014 +size 14344 diff --git a/checkpoint-30000/scheduler.bin b/checkpoint-30000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..bde8eae1ab025bf0923b7b48a874ee145b65f99f --- /dev/null +++ b/checkpoint-30000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4f7eab2bd1edeecc4557a33bfb3d0be4e8a4fa29560d5219a021898f3b612eb +size 1000 diff --git a/checkpoint-35000/controlnet/config.json b/checkpoint-35000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-35000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": 
false, + "use_linear_projection": false +} diff --git a/checkpoint-35000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-35000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6fa90ce759e834babd6252ccf7d4e6375acfd33a --- /dev/null +++ b/checkpoint-35000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f1c7797504f176ec09f6d07191bf31fe1582a2cd3e30c3b80b6524b3ac48ee5 +size 1445157120 diff --git a/checkpoint-35000/optimizer.bin b/checkpoint-35000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..988ddf5999ab4bb3f62bff821a8af06572ae194c --- /dev/null +++ b/checkpoint-35000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31289fa3373a86e5d2ee2ecc25af596ae674a5d1bcc4c59e74dbc1a43dd20334 +size 2890518478 diff --git a/checkpoint-35000/random_states_0.pkl b/checkpoint-35000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..d0d86fbd842ff568574cc3843c423c2848c3a960 --- /dev/null +++ b/checkpoint-35000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f728f0249c6cd4fa7e589aa0128624ebbef00340eaf245e30e060a86fb8d08fd +size 14344 diff --git a/checkpoint-35000/scheduler.bin b/checkpoint-35000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..33c27e6931111993f5114531046b734968d011be --- /dev/null +++ b/checkpoint-35000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c651a22b64e15483287791d87b3d753e1c4331309e2bf9a4cd33d9bf2df0e79a +size 1000 diff --git a/checkpoint-40000/controlnet/config.json b/checkpoint-40000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-40000/controlnet/config.json @@ -0,0 +1,51 @@ 
+{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-40000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-40000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..80e432e1def5a411bc07ce61eaa3aa79fa195343 --- /dev/null +++ b/checkpoint-40000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:952b4e384aec4483c2039d89b3ef28f6ff738bfb9699fff372c3d1723eb95056 +size 1445157120 diff --git a/checkpoint-40000/optimizer.bin b/checkpoint-40000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..71b06238ac4a3113cc8e29560cbd047fb9a70e3f --- /dev/null +++ b/checkpoint-40000/optimizer.bin @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:66195d4543cd883ce1a6a3e57fed430d8d48c2bc0f5af005ce40525fb7db11cf +size 2890518478 diff --git a/checkpoint-40000/random_states_0.pkl b/checkpoint-40000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..05260b94b447b28ae3d3a02abb5e3340e4960d9c --- /dev/null +++ b/checkpoint-40000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7691d48b943d15ebfd786352b178f2d931b8ce9c7d1a62fc06431c6b017aae6c +size 14408 diff --git a/checkpoint-40000/scheduler.bin b/checkpoint-40000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..6dffcd00bd74d2df525dd6d7257097ae5660f00d --- /dev/null +++ b/checkpoint-40000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3545acd782fef9a3052d35e8588ad863cba8df6191a8d8b91634d123b7bb20e +size 1000 diff --git a/checkpoint-45000/controlnet/config.json b/checkpoint-45000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-45000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + 
"in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-45000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-45000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3d9600cb8a12594f2597d98809d5981513e4807 --- /dev/null +++ b/checkpoint-45000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a73bb6da6be64983c725f28560d851d79614ca9377f309445f9811b8c6dd97 +size 1445157120 diff --git a/checkpoint-45000/optimizer.bin b/checkpoint-45000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..fba7dd29aa8ca997adaebc21237722054d10b420 --- /dev/null +++ b/checkpoint-45000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49d5bf881e97fc622ebf5a5a25ba700310594d57effa5aa5dfa2bb99c1ed9ea +size 2890518478 diff --git a/checkpoint-45000/random_states_0.pkl b/checkpoint-45000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..ecc89deef9c81f5e901bd747f4c6363dffd10301 --- /dev/null +++ b/checkpoint-45000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657c60169d81d3a57b254ad5864d0aeff5b21cbed5bbb56f0dd10cd048bbe5b3 +size 14344 diff --git a/checkpoint-45000/scheduler.bin b/checkpoint-45000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..0abb898216aee28281ab9b5e41dc7e0c4e848e6b --- /dev/null +++ b/checkpoint-45000/scheduler.bin @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:bb5bf84762fc90d32709f3ec06b0a2d5c831d3803eb5e15dbed5d07a9f75493c +size 1000 diff --git a/checkpoint-5000/controlnet/config.json b/checkpoint-5000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/checkpoint-5000/controlnet/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9e70d30cac0299169c1fbb1f492423985694700d --- /dev/null +++ b/checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da14bfbc87ef10e359b90db80bbbbbe170af33105b98dddf6d950b6a41949e5e +size 1445157120 diff --git a/checkpoint-5000/optimizer.bin b/checkpoint-5000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..78a4e65b98213f70d53e24fcaf1e8f725d8f4592 --- /dev/null +++ b/checkpoint-5000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4cf5618acbf2e6af5a67f5d005ea02cc729b49bfd7c769ae7e12d7cd032824 +size 2890518478 diff --git a/checkpoint-5000/random_states_0.pkl b/checkpoint-5000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..3363af9e302026280c3aa738610ed84a3b940fc2 --- /dev/null +++ b/checkpoint-5000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dfe8c7d581342d6641c515e28e9d6b6d195b8287be0214750de180d1667f8da +size 14344 diff --git a/checkpoint-5000/scheduler.bin b/checkpoint-5000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..976a27de201da5488bc7b42ce6d3ddff38320cae --- /dev/null +++ b/checkpoint-5000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920333155b08e76154b89a85170c320833074db7b84649a9cfe79fd10b6bf2d9 +size 1000 diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd576a944645f4041ed3f35cdd72f3195187e229 --- /dev/null +++ b/config.json @@ -0,0 +1,51 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.29.0.dev0", + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + 
"cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": 1, + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/diffusion_pytorch_model.safetensors b/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50f28002d57b8d437ac28d1e09e99e9f8b762fb1 --- /dev/null +++ b/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36d26b758da841125340d3d6aa289da6332251ec7ec98c557a0e722fff25ecf +size 1445157120 diff --git a/image_control.png b/image_control.png new file mode 100644 index 0000000000000000000000000000000000000000..413964fe5df00247dcde089cbeb30600ceeda368 Binary files /dev/null and b/image_control.png differ diff --git a/images_0.png b/images_0.png new file mode 100644 index 0000000000000000000000000000000000000000..a89af3943810f0748e6b811250bda41b14e3c522 Binary files /dev/null and b/images_0.png differ diff --git a/images_1.png b/images_1.png new file mode 100644 index 0000000000000000000000000000000000000000..9a4ee64ba9142529d7020a90bcc8e3cb288cb9ef Binary files /dev/null and b/images_1.png differ diff --git a/images_2.png b/images_2.png new file mode 100644 index 0000000000000000000000000000000000000000..c8d536a5e3a31572ee4d3d12c2af356f55d55950 Binary files /dev/null and b/images_2.png differ diff 
--git a/images_3.png b/images_3.png new file mode 100644 index 0000000000000000000000000000000000000000..1b9b601d9efa0032dba4095ddf1fd5b07057cbf7 Binary files /dev/null and b/images_3.png differ diff --git a/images_4.png b/images_4.png new file mode 100644 index 0000000000000000000000000000000000000000..ca7ff8a03cee3884dd2a620b76d0d007bdc90e0c Binary files /dev/null and b/images_4.png differ diff --git a/images_5.png b/images_5.png new file mode 100644 index 0000000000000000000000000000000000000000..8852c2a3f2864051e149d171ffb62a16e7cd9fc5 Binary files /dev/null and b/images_5.png differ