Wawaworker
/

mzskgl

Model card Files Files and versions Community

Upload folder using huggingface_hub

by Wawaworker - opened Jun 24

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+824

-0

Files changed (16) hide show

mzskgl2024-06-24_02-29-11-save-600-60-0.safetensors +3 -0
mzskgl2024-06-24_02-29-11-save-600-60-0.yaml +100 -0
mzskgl2024-06-24_02-38-29-save-900-90-0.safetensors +3 -0
mzskgl2024-06-24_02-38-29-save-900-90-0.yaml +100 -0
mzskgl2024-06-24_02-47-42-save-1200-120-0.safetensors +3 -0
mzskgl2024-06-24_02-47-42-save-1200-120-0.yaml +100 -0
mzskgl2024-06-24_02-56-58-save-1500-150-0.safetensors +3 -0
mzskgl2024-06-24_02-56-58-save-1500-150-0.yaml +100 -0
mzskgl2024-06-24_03-06-22-save-1800-180-0.safetensors +3 -0
mzskgl2024-06-24_03-06-22-save-1800-180-0.yaml +100 -0
mzskgl2024-06-24_03-15-46-save-2100-210-0.safetensors +3 -0
mzskgl2024-06-24_03-15-46-save-2100-210-0.yaml +100 -0
mzskgl2024-06-24_03-25-20-save-2400-240-0.safetensors +3 -0
mzskgl2024-06-24_03-25-20-save-2400-240-0.yaml +100 -0
mzskgl2024-06-24_03-34-48-save-2700-270-0.safetensors +3 -0
mzskgl2024-06-24_03-34-48-save-2700-270-0.yaml +100 -0

mzskgl2024-06-24_02-29-11-save-600-60-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cce3f1afd34f234baef1579da0b333dc63dd21e54203868bed18bd783aade099
+size 6938084280

mzskgl2024-06-24_02-29-11-save-600-60-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_02-38-29-save-900-90-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ea7e3309fe5847da177e5025d3cdcac241a824672d6ea5c47d34d210d17a560
+size 6938084280

mzskgl2024-06-24_02-38-29-save-900-90-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_02-47-42-save-1200-120-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dea325dfe6f0610f4e6949466df12c17509ff77cdb04fd91e02697bdb668fece
+size 6938084280

mzskgl2024-06-24_02-47-42-save-1200-120-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_02-56-58-save-1500-150-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:50469766da2b4f0c76c5d8598e65066527bc30a640387f75f33c8a521e2aa9f6
+size 6938084280

mzskgl2024-06-24_02-56-58-save-1500-150-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_03-06-22-save-1800-180-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00955de218f8b61a33382f1e7f985416460202a47acf59d39c2d6d53d288ac9e
+size 6938084280

mzskgl2024-06-24_03-06-22-save-1800-180-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_03-15-46-save-2100-210-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:374993cfc22f950689cafd335775daa4fb144f07ae3cf6361e2ac9fbbc843e00
+size 6938084280

mzskgl2024-06-24_03-15-46-save-2100-210-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_03-25-20-save-2400-240-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:402be8fa858d554acaa1253e283235a305eeb7ad4288a11341a7c6e6169e4048
+size 6938084280

mzskgl2024-06-24_03-25-20-save-2400-240-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_03-34-48-save-2700-270-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5b56777a15824e01c0634ac8c4daf783635af5e2cb9b1604e857c19306c9674
+size 6938084280

mzskgl2024-06-24_03-34-48-save-2700-270-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine