Epoch 3
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint-10500/optimizer.bin +3 -0
- checkpoint-10500/random_states_0.pkl +3 -0
- checkpoint-10500/scaler.pt +3 -0
- checkpoint-10500/scheduler.bin +3 -0
- checkpoint-10500/unet/config.json +60 -0
- checkpoint-10500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-10500/unet_ema/config.json +67 -0
- checkpoint-10500/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-11000/optimizer.bin +3 -0
- checkpoint-11000/random_states_0.pkl +3 -0
- checkpoint-11000/scaler.pt +3 -0
- checkpoint-11000/scheduler.bin +3 -0
- checkpoint-11000/unet/config.json +60 -0
- checkpoint-11000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-11000/unet_ema/config.json +67 -0
- checkpoint-11000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-11500/optimizer.bin +3 -0
- checkpoint-11500/random_states_0.pkl +3 -0
- checkpoint-11500/scaler.pt +3 -0
- checkpoint-11500/scheduler.bin +3 -0
- checkpoint-11500/unet/config.json +60 -0
- checkpoint-11500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-11500/unet_ema/config.json +67 -0
- checkpoint-11500/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-12000/optimizer.bin +3 -0
- checkpoint-12000/random_states_0.pkl +3 -0
- checkpoint-12000/scaler.pt +3 -0
- checkpoint-12000/scheduler.bin +3 -0
- checkpoint-12000/unet/config.json +60 -0
- checkpoint-12000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-12000/unet_ema/config.json +67 -0
- checkpoint-12000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-12500/optimizer.bin +3 -0
- checkpoint-12500/random_states_0.pkl +3 -0
- checkpoint-12500/scaler.pt +3 -0
- checkpoint-12500/scheduler.bin +3 -0
- checkpoint-12500/unet/config.json +60 -0
- checkpoint-12500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-12500/unet_ema/config.json +67 -0
- checkpoint-12500/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-13000/optimizer.bin +3 -0
- checkpoint-13000/random_states_0.pkl +3 -0
- checkpoint-13000/scaler.pt +3 -0
- checkpoint-13000/scheduler.bin +3 -0
- checkpoint-13000/unet/config.json +60 -0
- checkpoint-13000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-13000/unet_ema/config.json +67 -0
- checkpoint-13000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-13500/optimizer.bin +3 -0
- checkpoint-13500/random_states_0.pkl +3 -0
checkpoint-10500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d069752d553e844a0d9fd312651dde9d39701257def98551fb6e765b81b5183e
|
3 |
+
size 73251413
|
checkpoint-10500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c176434a90a69e6daa24223250f4dc3b4425ada8c2bd31dccf851497b8fc57a8
|
3 |
+
size 14663
|
checkpoint-10500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:930aa4121a2a38f44b8af20e66d414b77fba3198866a0d743e0016592e1c420e
|
3 |
+
size 557
|
checkpoint-10500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f880b6fdac81d333a28d35151b681f977b7d9683f1c80e80ed34339ca0814b6
|
3 |
+
size 563
|
checkpoint-10500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-10500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4833e2f77288142a970e10ca8e1fe8cce5318deb8dd44795ffe4777b09170f69
|
3 |
+
size 36621969
|
checkpoint-10500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 10500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-10500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:210322ed229f8c67e54c3e2eb1b9170b6c7a706fd5415b1af2c0ef78247939b8
|
3 |
+
size 36616081
|
checkpoint-11000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8edd4b512d28005e4bd4855a66b14c4f417c5998ac8294d2e9374cb405c624d2
|
3 |
+
size 73251413
|
checkpoint-11000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b74f4ceebdeb98333c28c6a41b66aa4bb14011702fc995cc1b5fa9106a2be483
|
3 |
+
size 14663
|
checkpoint-11000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8df4dd185a129710516223a132f1321dd530e937b37d9a1dca8d2915b9d5a04a
|
3 |
+
size 557
|
checkpoint-11000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:639cd51071e686afddf9c099ad4c78eed0fb800504d15c7cf337ce6a0d327ee2
|
3 |
+
size 563
|
checkpoint-11000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-11000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a041163ff52058de2cca2226122ee64b4b0dfc0a7b562454d74819a949c566f2
|
3 |
+
size 36621969
|
checkpoint-11000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 11000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-11000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5892a70cf5403921ea53d00744e98e9d739723b5def3298f35388f7c81788208
|
3 |
+
size 36616081
|
checkpoint-11500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08dc26f52e9b86fbd60c442a490513041876a6dab18082860b1fbfdc84d60e23
|
3 |
+
size 73251413
|
checkpoint-11500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d54e81c10e51975e4f7b1d33fe48a7337bf29a4811a72aa978bad1e5fcfe562
|
3 |
+
size 14663
|
checkpoint-11500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cab7988ce4c8b69e7970aada0017afc1c2120661c865bce9234915457ce96c2
|
3 |
+
size 557
|
checkpoint-11500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aadecd4a538b5d1dba9865109d974365b5fef3a16a8f15b84ad9bb69396810ab
|
3 |
+
size 563
|
checkpoint-11500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-11500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:585777626add9c1eb930daee056a68a0c65fe82f4ca61a152202fc7e13dc6ff9
|
3 |
+
size 36621969
|
checkpoint-11500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 11500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-11500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c900e3c277e02cd5dcfb1f83182fe3d6a1fedff838f1d8953b8d7250a60c3d2
|
3 |
+
size 36616081
|
checkpoint-12000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce749e708deb4834e510ee65f85ed9e541cd79227a3c9eaa2561080906f46db0
|
3 |
+
size 73251413
|
checkpoint-12000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e6be413308fdb0597b191695edf341acc944140c7f581268dae0d5cb5c64710
|
3 |
+
size 14663
|
checkpoint-12000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bce458d2f0e0937df767175ef2da719ebfea2dc13abb18accc5a26fd31d6b24c
|
3 |
+
size 557
|
checkpoint-12000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b0c5f7195a61f91e5bb9678cbb2c9866f6c8a95c81d28ec8cbff36e6b782060
|
3 |
+
size 563
|
checkpoint-12000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-12000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:281c9e178c6cb08790db694c96498cfc9d19f20fbe90591b0e3477c3ba13c3fb
|
3 |
+
size 36621969
|
checkpoint-12000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 12000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-12000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2d8f56d62d75b15dae5234e3d958eccc3079bf86199f8e423064c991a7bed48
|
3 |
+
size 36616081
|
checkpoint-12500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0ce0b1beca70fd5bd2240008fedeaa2102d9f4a4a24f777f966147644129e6d
|
3 |
+
size 73251413
|
checkpoint-12500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:632ade90bd4a222b5beffbf4ec1c47bbc20e3f8c313319748e513f13bbabd23f
|
3 |
+
size 14663
|
checkpoint-12500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:676c7ca172a8e0e2d2a49c50360fb5615bee6c75b2b21b58c40691d9ce37f540
|
3 |
+
size 557
|
checkpoint-12500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca652ab09470c7d8ef9b2b18cd87478bea008d2b73edad3cae70fb852092376a
|
3 |
+
size 563
|
checkpoint-12500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-12500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9ce1765878ae36cad5674beb9fe0767842b3c333d4195819e5e3f6df76bdfbc
|
3 |
+
size 36621969
|
checkpoint-12500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 12500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-12500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a400841cc3476abd9fece5d3e0bf34bd4abc08a4b8865daf3c8d4d88913840c9
|
3 |
+
size 36616081
|
checkpoint-13000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f6057e095320ebbfd1e7bfec9a15022e766c67fd01002ca99c86b14b9d31c13
|
3 |
+
size 73251413
|
checkpoint-13000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74b8086748391706549155a071ad9215fee237acc56ef94e1acbe9cf7183b187
|
3 |
+
size 14663
|
checkpoint-13000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3bd46694cab01abb585c817c8192debd3ba2bfb2caed79a96d5c18143c7bb9a
|
3 |
+
size 557
|
checkpoint-13000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30d3c01f1a05ef1ae8354a8a28a3b01698b6f62fc98b5d5285d87757eccf76a4
|
3 |
+
size 563
|
checkpoint-13000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-13000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd72031f2c1afdc33010eba7cfd0191a94cc8a09a784df5a685934c4ceedf328
|
3 |
+
size 36621969
|
checkpoint-13000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 13000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-13000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13fd9bc6975a8592e2b95a9c4ad317b4d2043daa4b771e2d1dc705e27cc036a7
|
3 |
+
size 36616081
|
checkpoint-13500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba170594436c302cd6e37c329786d79601a77c7d9f4a810194b9a356a5c81b35
|
3 |
+
size 73251413
|
checkpoint-13500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ce88771f3eb88369f5d3eb8100a6bdcd594ab8bcb9cd1720d146c43abe10a3
|
3 |
+
size 14663
|