Wawaworker
/

dvdyrmchn

Model card Files Files and versions Community

Upload folder using huggingface_hub

by Wawaworker - opened Jun 24, 2024

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+927

-0

Files changed (18) hide show

mzskgl2024-06-24_21-33-44-save-300-30-0.safetensors +3 -0
mzskgl2024-06-24_21-33-44-save-300-30-0.yaml +100 -0
mzskgl2024-06-24_21-42-56-save-600-60-0.safetensors +3 -0
mzskgl2024-06-24_21-42-56-save-600-60-0.yaml +100 -0
mzskgl2024-06-24_21-52-15-save-900-90-0.safetensors +3 -0
mzskgl2024-06-24_21-52-15-save-900-90-0.yaml +100 -0
mzskgl2024-06-24_22-01-37-save-1200-120-0.safetensors +3 -0
mzskgl2024-06-24_22-01-37-save-1200-120-0.yaml +100 -0
mzskgl2024-06-24_22-10-56-save-1500-150-0.safetensors +3 -0
mzskgl2024-06-24_22-10-56-save-1500-150-0.yaml +100 -0
mzskgl2024-06-24_22-20-12-save-1800-180-0.safetensors +3 -0
mzskgl2024-06-24_22-20-12-save-1800-180-0.yaml +100 -0
mzskgl2024-06-24_22-29-23-save-2100-210-0.safetensors +3 -0
mzskgl2024-06-24_22-29-23-save-2100-210-0.yaml +100 -0
mzskgl2024-06-24_22-38-38-save-2400-240-0.safetensors +3 -0
mzskgl2024-06-24_22-38-38-save-2400-240-0.yaml +100 -0
mzskgl2024-06-24_22-47-50-save-2700-270-0.safetensors +3 -0
mzskgl2024-06-24_22-47-50-save-2700-270-0.yaml +100 -0

mzskgl2024-06-24_21-33-44-save-300-30-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a0fc6fb3923eae2d77b435f4c52ef7ed91c9c23a35ba695cff3cbe4abce7a6f5
+size 6938084280

mzskgl2024-06-24_21-33-44-save-300-30-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_21-42-56-save-600-60-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:058645e129daa0e81ce5ff83a83b6861cac8da6f2a1709bd3ea20a138733265c
+size 6938084280

mzskgl2024-06-24_21-42-56-save-600-60-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_21-52-15-save-900-90-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fedb136dd88ec58c3d6776f938a8455d49b2c693cf1a2f0d5a39aaa3f5318ec3
+size 6938084280

mzskgl2024-06-24_21-52-15-save-900-90-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_22-01-37-save-1200-120-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a87da1c058165fd4af7d987fbe49a506924c74a3887ee136518350036592aba5
+size 6938084280

mzskgl2024-06-24_22-01-37-save-1200-120-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_22-10-56-save-1500-150-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c588020c29d282cef98736cdeac2340e9a3da61d715ee93b6229cdac8283837
+size 6938084280

mzskgl2024-06-24_22-10-56-save-1500-150-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_22-20-12-save-1800-180-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:82168c7125ca6e14ffbecd87859399c5cd8c0bcca94b1701404946057165bd98
+size 6938084280

mzskgl2024-06-24_22-20-12-save-1800-180-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_22-29-23-save-2100-210-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0a6957ea129fa35e53a9be049c89a35421864c87c7f16bf754fc24d352f32488
+size 6938084280

mzskgl2024-06-24_22-29-23-save-2100-210-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_22-38-38-save-2400-240-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c76eed47da78ad977e0aed229b10c8960528e9a680a717438fb5537979cadcb0
+size 6938084280

mzskgl2024-06-24_22-38-38-save-2400-240-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine

mzskgl2024-06-24_22-47-50-save-2700-270-0.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e147cd4d72525e0a601345aa5b63495350b1bfda78ff35c7acf08693fa328b9
+size 6938084280

mzskgl2024-06-24_22-47-50-save-2700-270-0.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine