Upload folder using huggingface_hub

#1
by Wawaworker - opened
mzskgl2024-06-24_21-33-44-save-300-30-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0fc6fb3923eae2d77b435f4c52ef7ed91c9c23a35ba695cff3cbe4abce7a6f5
3
+ size 6938084280
mzskgl2024-06-24_21-33-44-save-300-30-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_21-42-56-save-600-60-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:058645e129daa0e81ce5ff83a83b6861cac8da6f2a1709bd3ea20a138733265c
3
+ size 6938084280
mzskgl2024-06-24_21-42-56-save-600-60-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_21-52-15-save-900-90-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fedb136dd88ec58c3d6776f938a8455d49b2c693cf1a2f0d5a39aaa3f5318ec3
3
+ size 6938084280
mzskgl2024-06-24_21-52-15-save-900-90-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_22-01-37-save-1200-120-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a87da1c058165fd4af7d987fbe49a506924c74a3887ee136518350036592aba5
3
+ size 6938084280
mzskgl2024-06-24_22-01-37-save-1200-120-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_22-10-56-save-1500-150-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c588020c29d282cef98736cdeac2340e9a3da61d715ee93b6229cdac8283837
3
+ size 6938084280
mzskgl2024-06-24_22-10-56-save-1500-150-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_22-20-12-save-1800-180-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82168c7125ca6e14ffbecd87859399c5cd8c0bcca94b1701404946057165bd98
3
+ size 6938084280
mzskgl2024-06-24_22-20-12-save-1800-180-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_22-29-23-save-2100-210-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a6957ea129fa35e53a9be049c89a35421864c87c7f16bf754fc24d352f32488
3
+ size 6938084280
mzskgl2024-06-24_22-29-23-save-2100-210-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_22-38-38-save-2400-240-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c76eed47da78ad977e0aed229b10c8960528e9a680a717438fb5537979cadcb0
3
+ size 6938084280
mzskgl2024-06-24_22-38-38-save-2400-240-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine
mzskgl2024-06-24_22-47-50-save-2700-270-0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e147cd4d72525e0a601345aa5b63495350b1bfda78ff35c7acf08693fa328b9
3
+ size 6938084280
mzskgl2024-06-24_22-47-50-save-2700-270-0.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ params:
3
+ conditioner_config:
4
+ params:
5
+ emb_models:
6
+ - input_key: txt
7
+ is_trainable: false
8
+ params:
9
+ layer: hidden
10
+ layer_idx: 11
11
+ target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
12
+ - input_key: txt
13
+ is_trainable: false
14
+ params:
15
+ always_return_pooled: true
16
+ arch: ViT-bigG-14
17
+ freeze: true
18
+ layer: penultimate
19
+ legacy: false
20
+ version: laion2b_s39b_b160k
21
+ target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
22
+ - input_key: original_size_as_tuple
23
+ is_trainable: false
24
+ params:
25
+ outdim: 256
26
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
27
+ - input_key: crop_coords_top_left
28
+ is_trainable: false
29
+ params:
30
+ outdim: 256
31
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
32
+ - input_key: target_size_as_tuple
33
+ is_trainable: false
34
+ params:
35
+ outdim: 256
36
+ target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
37
+ target: sgm.modules.GeneralConditioner
38
+ denoiser_config:
39
+ params:
40
+ discretization_config:
41
+ target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
42
+ num_idx: 1000
43
+ scaling_config:
44
+ target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
45
+ weighting_config:
46
+ target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
47
+ target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
48
+ disable_first_stage_autocast: true
49
+ first_stage_config:
50
+ params:
51
+ ddconfig:
52
+ attn_resolutions: []
53
+ attn_type: vanilla-xformers
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ double_z: true
61
+ dropout: 0.0
62
+ in_channels: 3
63
+ num_res_blocks: 2
64
+ out_ch: 3
65
+ resolution: 256
66
+ z_channels: 4
67
+ embed_dim: 4
68
+ lossconfig:
69
+ target: torch.nn.Identity
70
+ monitor: val/rec_loss
71
+ target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
72
+ network_config:
73
+ params:
74
+ adm_in_channels: 2816
75
+ attention_resolutions:
76
+ - 4
77
+ - 2
78
+ channel_mult:
79
+ - 1
80
+ - 2
81
+ - 4
82
+ context_dim: 2048
83
+ in_channels: 4
84
+ legacy: false
85
+ model_channels: 320
86
+ num_classes: sequential
87
+ num_head_channels: 64
88
+ num_res_blocks: 2
89
+ out_channels: 4
90
+ spatial_transformer_attn_type: softmax-xformers
91
+ transformer_depth:
92
+ - 1
93
+ - 2
94
+ - 10
95
+ use_checkpoint: true
96
+ use_linear_in_transformer: true
97
+ use_spatial_transformer: true
98
+ target: sgm.modules.diffusionmodules.openaimodel.UNetModel
99
+ scale_factor: 0.13025
100
+ target: sgm.models.diffusion.DiffusionEngine