diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..dad60b4a1f88f4de5bd65ea12f26fc9f6eeed088 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +images_0.png filter=lfs diff=lfs merge=lfs -text +images_1.png filter=lfs diff=lfs merge=lfs -text +images_2.png filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8b1ef7631ba48bc729dac474c714daf07c7c8e4f --- /dev/null +++ b/README.md @@ -0,0 +1,47 @@ +--- +license: openrail++ +library_name: diffusers +tags: +- stable-diffusion-xl +- stable-diffusion-xl-diffusers +- text-to-image +- diffusers +- controlnet +- diffusers-training +base_model: stabilityai/stable-diffusion-xl-base-1.0 +inference: true +--- + + + + +# controlnet-cld07/sd3ep_output + +These are controlnet weights trained on stabilityai/stable-diffusion-xl-base-1.0 with new type of conditioning. +You can find some example images below. + +prompt: a baby with black hair +![images_0)](./images_0.png) +prompt: a man with glasses +![images_1)](./images_1.png) +prompt: a woman smiling +![images_2)](./images_2.png) + + + +## Intended uses & limitations + +#### How to use + +```python +# TODO: add an example code snippet for running this diffusion pipeline +``` + +#### Limitations and bias + +[TODO: provide examples of latent issues and potential remediations] + +## Training details + +[TODO: describe the data used to train the model] \ No newline at end of file diff --git a/checkpoint-12000/controlnet/config.json b/checkpoint-12000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-12000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-12000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-12000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5da4dcc93dd1183d7599d18275cc0f3b0f04d98 --- /dev/null +++ b/checkpoint-12000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ba1033a301d2d79d986d186e09ed3ebf2f731dba91bb90ff4abe79d5b56c17 +size 5004167864 diff --git a/checkpoint-12000/optimizer.bin b/checkpoint-12000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..64c0097c86534feaf094c9dc2c02692c05daca42 --- /dev/null +++ b/checkpoint-12000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c005ee82bf9d6fb8cec7b13e12b4f68ef1e407ee91bb7b9e87be9e789b6a85e2 +size 10008840997 diff --git a/checkpoint-12000/random_states_0.pkl b/checkpoint-12000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..44b3308c9aee6560e09f701151b52976d9412a99 --- /dev/null +++ b/checkpoint-12000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b3f5403a975dc0686f325ec5a384c0961c64b54f6821d5aed527ea2aeb89af +size 14599 diff --git a/checkpoint-12000/scaler.pt b/checkpoint-12000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae5a342bd933b8ae0fc4bbe4175a5005e1f40290 --- /dev/null +++ b/checkpoint-12000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a61fa205a26ba2985bf4e0e515406104e0b0e5d6ebd86749ac9477a519632ca +size 557 diff --git a/checkpoint-12000/scheduler.bin b/checkpoint-12000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6243fe8b64a7112d637d0f1a8abdad6968fc7e8 --- /dev/null +++ b/checkpoint-12000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9855aba5ac021cfcebb517ce8e7c056e6a3e01548a489078133809249c0000db +size 563 diff --git a/checkpoint-15000/controlnet/config.json b/checkpoint-15000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-15000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-15000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-15000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e09c8a429040c56e36a5ba7fb12d862f7ce3d3d --- /dev/null +++ b/checkpoint-15000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35d2423b08b9076517597d851ff6476c27ad30bf867abac6695917e6d0b988b +size 5004167864 diff --git a/checkpoint-15000/optimizer.bin b/checkpoint-15000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..581a231647fab018147ba183093aaa6a6aec0a2c --- /dev/null +++ b/checkpoint-15000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf319654e8d7f098bb2c45e068dfa3569e10a8afcd227ffe4f25c074d189e64 +size 10008840997 diff --git a/checkpoint-15000/random_states_0.pkl b/checkpoint-15000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..b9a4b87096fea4261aeb4cc6c8475e24e5625d54 --- /dev/null +++ b/checkpoint-15000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2284039d849aa5efabe7489903a9477acc2a5ed4ff509179abee6e81e07459 +size 14599 diff --git a/checkpoint-15000/scaler.pt b/checkpoint-15000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..29312d48fe0c2715d29a9441129c714a6ea8e195 --- /dev/null +++ b/checkpoint-15000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb33b1da2125feaa501f6acf7c67409ff703b0320e8e55bf616863891dd3346 +size 557 diff --git a/checkpoint-15000/scheduler.bin b/checkpoint-15000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e0498a72c22a040ef520f0478bb4dabde66f3e8 --- /dev/null +++ b/checkpoint-15000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c8f230c5668e90ef511def579b79e44de9d3b35808be0f4dc30dd690dd88396 +size 563 diff --git a/checkpoint-18000/controlnet/config.json b/checkpoint-18000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-18000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-18000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-18000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c6aa4713f2ad635246e193ac530d97b4fa1e684 --- /dev/null +++ b/checkpoint-18000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06859cf92b170368f9bba8e9d26a193971d1f231ce594c3ce1b3038e47f9c28b +size 5004167864 diff --git a/checkpoint-18000/optimizer.bin b/checkpoint-18000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..8df0bebfd30ff04a3039ae75599e706ca35658f1 --- /dev/null +++ b/checkpoint-18000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b3ed5708bf691e0494813a3906448a2642025769cbd24baf08649aadd89eb4 +size 10008840997 diff --git a/checkpoint-18000/random_states_0.pkl b/checkpoint-18000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..ee9446f3809bd1c6473ca683cffe3f6997f01397 --- /dev/null +++ b/checkpoint-18000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb1c9d9fd211af43fa83ba450985e9e59e3c0decc733a93632a82dd8aa059a4 +size 14599 diff --git a/checkpoint-18000/scaler.pt b/checkpoint-18000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..17d61ff93819cbe3594bc4408e2867ce2acfd220 --- /dev/null +++ b/checkpoint-18000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7d5fbe54d973b1b835eeb6a35c1f93bc3dcba3bfd4282bf5a13169af034c31 +size 557 diff --git a/checkpoint-18000/scheduler.bin b/checkpoint-18000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c78cffe1bfd1c9430f4e2e7ecacdd68cfebc8a4 --- /dev/null +++ b/checkpoint-18000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a81cc678ca117e8d93df67c5439b52214da903413ecbe7e0b2e7472e33033f +size 563 diff --git a/checkpoint-21000/controlnet/config.json b/checkpoint-21000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-21000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-21000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-21000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..71454e4b7bcd8c202e01dd1d6b9f0a4696896517 --- /dev/null +++ b/checkpoint-21000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ebbf4c771d516728fa9441ddd5d1e0abad9d6e6601c0c6b5a32f7a7b8467116 +size 5004167864 diff --git a/checkpoint-21000/optimizer.bin b/checkpoint-21000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b18a4f3a3e2f20cdd48f894e5eae9a5ea228960 --- /dev/null +++ b/checkpoint-21000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c94ab9ea0ba4f39012c08d967dfa457b158ed29dacb8d5ad9c1c1232799ca4 +size 10008840997 diff --git a/checkpoint-21000/random_states_0.pkl b/checkpoint-21000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..c9b2797b29f1bb6775d5cc16dbc1eb7b75dfcd3d --- /dev/null +++ b/checkpoint-21000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0c84b6c6a8b43d51882770c2eb3d11b72c8ea4ffcb2c86221d4c641ae37225 +size 14599 diff --git a/checkpoint-21000/scaler.pt b/checkpoint-21000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ee6fc1c25629d139087d2cf550a72037e75adb --- /dev/null +++ b/checkpoint-21000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d92f7ff116c055ac3535701c7ed50562c852881f5945b2285173e280936154 +size 557 diff --git a/checkpoint-21000/scheduler.bin b/checkpoint-21000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..806fe8f8827252998428f2caa4519367ecc27081 --- /dev/null +++ b/checkpoint-21000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f1bb82c106f03d1adf8e8fa1d7d4e15d7220f161ef1a57135b14efa7607386 +size 563 diff --git a/checkpoint-24000/controlnet/config.json b/checkpoint-24000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-24000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-24000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-24000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d85e5ae1c5f32ac77c6aff962047fe465feaa9d --- /dev/null +++ b/checkpoint-24000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e60c6cdad770111fb25ae9f04f683eb136e128027954f5ab1ef2283f7b5f7d0e +size 5004167864 diff --git a/checkpoint-24000/optimizer.bin b/checkpoint-24000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..f76f7479713dc4c0b678f4d2682773b0b9778c08 --- /dev/null +++ b/checkpoint-24000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f99455101a3418c1e6c20b740ef40ebd401d4402b0989377439b6781b039e83 +size 10008840997 diff --git a/checkpoint-24000/random_states_0.pkl b/checkpoint-24000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..84a5708d22d4403eb0a5a1b760f67736e02a7f2f --- /dev/null +++ b/checkpoint-24000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee30133bc5e9bb5cc5a207751eb3628db32bfa94b6061d5c25f5c5318a8b16d5 +size 14599 diff --git a/checkpoint-24000/scaler.pt b/checkpoint-24000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bc4af419b96442b5d4914292b7cc8c1a130fc23 --- /dev/null +++ b/checkpoint-24000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e448f3ad3e626597b0d1fdea51b974fc1a4a0c1203311e81c0820e5a37d35db7 +size 557 diff --git a/checkpoint-24000/scheduler.bin b/checkpoint-24000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..07d420d771111d4309b4c039c048ae61e551a547 --- /dev/null +++ b/checkpoint-24000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d4a74f3c1185f38f8a73a6e302e0645e4be711eb8e0e482c475f2ad0093672 +size 563 diff --git a/checkpoint-27000/controlnet/config.json b/checkpoint-27000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-27000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-27000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-27000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0746a6230cf3d3fedde65ff226298aa76a780000 --- /dev/null +++ b/checkpoint-27000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64cd102e22669bb2c44c8f1fb00f7d1942e090ffdb3223e8ad0abe5eb55b669 +size 5004167864 diff --git a/checkpoint-27000/optimizer.bin b/checkpoint-27000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..57d9e9dcc97d28448a3aaabb4533802ef1b4d2a9 --- /dev/null +++ b/checkpoint-27000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca75507111de2a61b8d602965a1e29750fe425570d946daf36d77bc8e6473fbe +size 10008840997 diff --git a/checkpoint-27000/random_states_0.pkl b/checkpoint-27000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..7c1a235fce71549f80623e519b255f8d191857ed --- /dev/null +++ b/checkpoint-27000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f942eef0d7466b6189384bc78dce4f362e8d84d26a703f57378c63793765d185 +size 14599 diff --git a/checkpoint-27000/scaler.pt b/checkpoint-27000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f13a0d55db9cd26115644d1f72cff9ab546063ac --- /dev/null +++ b/checkpoint-27000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3789c1d68fdc4bd86444622d1909f758d6e05318dbbb156b6ef20dbb61560383 +size 557 diff --git a/checkpoint-27000/scheduler.bin b/checkpoint-27000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..42c375eaf05d6b129a8e7b2ded10d38c0ee3aaff --- /dev/null +++ b/checkpoint-27000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:addd1999ffe5da315bded19c591d78a81576e422d3588e78f530eb4a9f50e0b9 +size 563 diff --git a/checkpoint-3000/controlnet/config.json b/checkpoint-3000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-3000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..149caf3ae75c7792d03449614757b7bb0d492690 --- /dev/null +++ b/checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40be5bd8ff1b5e630921ece41c2cd02caafdeb22b9a5b40a7fc8b358e563a6e9 +size 5004167864 diff --git a/checkpoint-3000/optimizer.bin b/checkpoint-3000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..660fd595f921cb1d1162d6ff5878e736e723fd90 --- /dev/null +++ b/checkpoint-3000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8658895c0c4451c4ccb9dada99855b23effe52d1ec4aae62182ce8b353f63b52 +size 10008840997 diff --git a/checkpoint-3000/random_states_0.pkl b/checkpoint-3000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..849afa8986b4e90c91dc808ab39f66a7af8a5ba2 --- /dev/null +++ b/checkpoint-3000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e361dda8a471a9752db230d2b3d76af21805f3ec40939a068a3463a562ab209c +size 14599 diff --git a/checkpoint-3000/scaler.pt b/checkpoint-3000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2888c9ddc2c30e6b47ce0e6abcc8e2d1303aab00 --- /dev/null +++ b/checkpoint-3000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb1f9398b77268202e8e1465734a63d123b1ef11c27f20f2473677e9883a6869 +size 557 diff --git a/checkpoint-3000/scheduler.bin b/checkpoint-3000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b6eaa6a5a88bbc1e19c9479751f75698e848c9d --- /dev/null +++ b/checkpoint-3000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d6ec0338061ab706b1805a9e2966ca126b26619cd90bb73133127681b9de370 +size 563 diff --git a/checkpoint-30000/controlnet/config.json b/checkpoint-30000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-30000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-30000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-30000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c2ec87b94d40a6560958f473ed1ed24a4c83644 --- /dev/null +++ b/checkpoint-30000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbf0414ff0914c3d395e772f516b76e8b0f43fe9408906ae7e7068aaebaa9c7 +size 5004167864 diff --git a/checkpoint-30000/optimizer.bin b/checkpoint-30000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ae2ebfc865e4187c9c31bbd7222630aa6ec9054 --- /dev/null +++ b/checkpoint-30000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2aca05edfe1cdf7f2a2f21b1e980187ad8276e6d14cbeebca6c9aaa45e70a47 +size 10008840997 diff --git a/checkpoint-30000/random_states_0.pkl b/checkpoint-30000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..393e6c1dc373e64040cf28f8e391e6e58573ebaa --- /dev/null +++ b/checkpoint-30000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdcd0140be104849590684482f0b921f3b86b30de4365d69231cba9b3fe189d7 +size 14599 diff --git a/checkpoint-30000/scaler.pt b/checkpoint-30000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..744f23bfce3bfea3832c25c47f14bfd36d256d64 --- /dev/null +++ b/checkpoint-30000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efb54b61e3444dfa52fbdcd9ab900d311b5e5031b20203a577b1583f65903190 +size 557 diff --git a/checkpoint-30000/scheduler.bin b/checkpoint-30000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..13a22ca9aca0f5e7d1865338eff6d17af5fd569f --- /dev/null +++ b/checkpoint-30000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e413f00c8696f8d849f51c390d8fa9ef8d93fd61b9bfab3401aa0e2a1f917546 +size 563 diff --git a/checkpoint-33000/controlnet/config.json b/checkpoint-33000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-33000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-33000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-33000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c86e392ce2c1ec2a1abb264614858c310d3b307 --- /dev/null +++ b/checkpoint-33000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939e3984726a5f0d3169053b2313ced0f587e1441392016d8bc431d2100155c4 +size 5004167864 diff --git a/checkpoint-33000/optimizer.bin b/checkpoint-33000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b77bf7cf526ce267bee9bc49e42a5cd4395e1fa --- /dev/null +++ b/checkpoint-33000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c35687e709736edb654db6b1bf7f5f7b634481a88d2fd198ea6740c2e18468 +size 10008840997 diff --git a/checkpoint-33000/random_states_0.pkl b/checkpoint-33000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..d49d8047e1d7ca0b5b4cc4eb8022ee43ba2b5fe0 --- /dev/null +++ b/checkpoint-33000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b535bf7f61e100946d3b7b4991beff7626efd78bb6b339956280860edf8d64da +size 14599 diff --git a/checkpoint-33000/scaler.pt b/checkpoint-33000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b617e8b17bca7799855be430b0c9e873633c8910 --- /dev/null +++ b/checkpoint-33000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b099f99d271d1d70668795bcbebf8f9154e435b3dd48069de26ea325e86d2c +size 557 diff --git a/checkpoint-33000/scheduler.bin b/checkpoint-33000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c064632a49c1fe919982422237d3baf8017aaa1 --- /dev/null +++ b/checkpoint-33000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4470ab8d5b7a351fad407ea1f7c385256c0d9161c97ccf5a66c870418a02b6 +size 563 diff --git a/checkpoint-36000/controlnet/config.json b/checkpoint-36000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-36000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-36000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-36000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2926d88ed62139bf7c5c66dc012ea641cf1a7fc --- /dev/null +++ b/checkpoint-36000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f399ff251b03a9defc381330958ad6087f945e8bb048a5ddd1a0568cf0c3bfe +size 5004167864 diff --git a/checkpoint-36000/optimizer.bin b/checkpoint-36000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b9d088a80925056d184849fc595032c29192fd9 --- /dev/null +++ b/checkpoint-36000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8b5919e9ee85528dfbd0a8511b3d5f8d2f70c6b05a3ed01da1be00cc7133d2d +size 10008840997 diff --git a/checkpoint-36000/random_states_0.pkl b/checkpoint-36000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a6b872480ce0e1d0055ed1bf8580c8ce67b1fd3d --- /dev/null +++ b/checkpoint-36000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2a5614b63a3425ef769e5949993a2f48d4433d150d17de50d3e3ba2a343730c +size 14599 diff --git a/checkpoint-36000/scaler.pt b/checkpoint-36000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ef70604e1b6cb2ab8ec631b2462e888ad4c224d --- /dev/null +++ b/checkpoint-36000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a28b19c09e76c25d28dc38360bd5d2ba720e7de3c61edaf40cb4d69852aa9ec0 +size 557 diff --git a/checkpoint-36000/scheduler.bin b/checkpoint-36000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..3afb9df9c6daefc6ddcd6c32f813058ac55a3eca --- /dev/null +++ b/checkpoint-36000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4edcf308a08e9dcb4dedb915da98d3140ca83391b2be28ea2c9d16a49ff81c50 +size 563 diff --git a/checkpoint-6000/controlnet/config.json b/checkpoint-6000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-6000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-6000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-6000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1afb91208e5d5c56aa4ef1fe451aed4351343399 --- /dev/null +++ b/checkpoint-6000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acaf4774775a42bb4fdae861c826024b635807a0818cfa8b45a70a0bb3faeb83 +size 5004167864 diff --git a/checkpoint-6000/optimizer.bin b/checkpoint-6000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..69ada658cc74ef9fb93d7169ed8164e29e7cba45 --- /dev/null +++ b/checkpoint-6000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65203a8185b634ceea7853f980e151524502578cdf35b559fbbbc7b5488711ab +size 10008840997 diff --git a/checkpoint-6000/random_states_0.pkl b/checkpoint-6000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0d2acc228a6c3994ddb37a7d7cb4114dd31091fd --- /dev/null +++ b/checkpoint-6000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c1c6f7e064c8200fccac9ad3f6a7b7dc6e871c4056fa4b9ea847b8581bc36d +size 14599 diff --git a/checkpoint-6000/scaler.pt b/checkpoint-6000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fd17ac3026715d5a68d70922df4742631319059 --- /dev/null +++ b/checkpoint-6000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a00ef97fc41c0d653df466126d855f16646dd10726d3ac99a23f55ca70ec19a +size 557 diff --git a/checkpoint-6000/scheduler.bin b/checkpoint-6000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..7413abefc4f8286274da3243afd962fa1696fff1 --- /dev/null +++ b/checkpoint-6000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0df2dffc0559ef6134e0571ccfecb406ec3a612efe566ae6f1c62bcf1ab353 +size 563 diff --git a/checkpoint-9000/controlnet/config.json b/checkpoint-9000/controlnet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/checkpoint-9000/controlnet/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/checkpoint-9000/controlnet/diffusion_pytorch_model.safetensors b/checkpoint-9000/controlnet/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..558c52138077adcdab712b39f27f91b505b5bba3 --- /dev/null +++ b/checkpoint-9000/controlnet/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce65d7313efa21eefdd90ae218227ce37d30970aa3ac5ae377c3266ef087d9e +size 5004167864 diff --git a/checkpoint-9000/optimizer.bin b/checkpoint-9000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c2ff31c881280acb34cbb33d16011a1b409f89c --- /dev/null +++ b/checkpoint-9000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3d6ac9b3ba3335e8c2011b88516be1b662a1154f25e78f0e8087cac2875a37 +size 10008840997 diff --git a/checkpoint-9000/random_states_0.pkl b/checkpoint-9000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..a8ffabe1b786f7ced5a19d5ba9a927593d133197 --- /dev/null +++ b/checkpoint-9000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24b1e895c71c638d2a0b0a010fddd50866ca3a8c6de64fb0abf286879be2b62 +size 14599 diff --git a/checkpoint-9000/scaler.pt b/checkpoint-9000/scaler.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7306b1b0e5b21e2fec7bb12b5a46cc7b66591f --- /dev/null +++ b/checkpoint-9000/scaler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be7a7b56cfc3e79d33648a4c49d4f11c6593d8d653b129207b2e38f2684a284 +size 557 diff --git a/checkpoint-9000/scheduler.bin b/checkpoint-9000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..441f03705c86ea73ba155600524d371b9ec283e5 --- /dev/null +++ b/checkpoint-9000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c13d19a790c3b70de0c58d8be6eda53cbc852819b276ffcfe81fcb4f0bbdb79a +size 563 diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..040c087b669e780e6231ca7ba37885da8d59ce81 --- /dev/null +++ b/config.json @@ -0,0 +1,57 @@ +{ + "_class_name": "ControlNetModel", + "_diffusers_version": "0.28.0.dev0", + "act_fn": "silu", + "addition_embed_type": "text_time", + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": 256, + "attention_head_dim": [ + 5, + 10, + 20 + ], + "block_out_channels": [ + 320, + 640, + 1280 + ], + "class_embed_type": null, + "conditioning_channels": 3, + "conditioning_embedding_out_channels": [ + 16, + 32, + 96, + 256 + ], + "controlnet_conditioning_channel_order": "rgb", + "cross_attention_dim": 2048, + "down_block_types": [ + "DownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D" + ], + "downsample_padding": 1, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "global_pool_conditions": false, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "projection_class_embeddings_input_dim": 2816, + "resnet_time_scale_shift": "default", + "transformer_layers_per_block": [ + 1, + 2, + 10 + ], + "upcast_attention": null, + "use_linear_projection": true +} diff --git a/diffusion_pytorch_model.safetensors b/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1eec3d2e8a5b96dcee07a780fb6b5da856a11448 --- /dev/null +++ b/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d1b0c94aaf41b11d295c3bbbb497b5bda3488e1bba6c25c755e384371feb24 +size 5004167864 diff --git a/image_control.png b/image_control.png new file mode 100644 index 0000000000000000000000000000000000000000..33d93418c5aef8abaa0f465299cd50f821dc9169 Binary files /dev/null and b/image_control.png differ diff --git a/images_0.png b/images_0.png new file mode 100644 index 0000000000000000000000000000000000000000..9377192f78a084b78410b26b1fd872a0b811380a --- /dev/null +++ b/images_0.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739743064eac67bf0193986bc093c9d12c7500245933cc0e9e5d81267b255c82 +size 1335369 diff --git a/images_1.png b/images_1.png new file mode 100644 index 0000000000000000000000000000000000000000..8dce56d44139dc4d556aad2771a5492733867390 --- /dev/null +++ b/images_1.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd602bb2c8c8a388807a175f3977626b4f5cdf3561a60efb5f7c9c743c3d5bb +size 1653772 diff --git a/images_2.png b/images_2.png new file mode 100644 index 0000000000000000000000000000000000000000..0fa208889e7e0e91dca48f51a61f6328b4e1da6a --- /dev/null +++ b/images_2.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf22f333e438d7d1e00dd73febe7248cfdee090c477409d513985d106b20f30 +size 1615477