Epoch 2
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint-10000/optimizer.bin +3 -0
- checkpoint-10000/random_states_0.pkl +3 -0
- checkpoint-10000/scaler.pt +3 -0
- checkpoint-10000/scheduler.bin +3 -0
- checkpoint-10000/unet/config.json +60 -0
- checkpoint-10000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-10000/unet_ema/config.json +67 -0
- checkpoint-10000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-7000/optimizer.bin +3 -0
- checkpoint-7000/random_states_0.pkl +3 -0
- checkpoint-7000/scaler.pt +3 -0
- checkpoint-7000/scheduler.bin +3 -0
- checkpoint-7000/unet/config.json +60 -0
- checkpoint-7000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-7000/unet_ema/config.json +67 -0
- checkpoint-7000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-7500/optimizer.bin +3 -0
- checkpoint-7500/random_states_0.pkl +3 -0
- checkpoint-7500/scaler.pt +3 -0
- checkpoint-7500/scheduler.bin +3 -0
- checkpoint-7500/unet/config.json +60 -0
- checkpoint-7500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-7500/unet_ema/config.json +67 -0
- checkpoint-7500/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-8000/optimizer.bin +3 -0
- checkpoint-8000/random_states_0.pkl +3 -0
- checkpoint-8000/scaler.pt +3 -0
- checkpoint-8000/scheduler.bin +3 -0
- checkpoint-8000/unet/config.json +60 -0
- checkpoint-8000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-8000/unet_ema/config.json +67 -0
- checkpoint-8000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-8500/optimizer.bin +3 -0
- checkpoint-8500/random_states_0.pkl +3 -0
- checkpoint-8500/scaler.pt +3 -0
- checkpoint-8500/scheduler.bin +3 -0
- checkpoint-8500/unet/config.json +60 -0
- checkpoint-8500/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-8500/unet_ema/config.json +67 -0
- checkpoint-8500/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-9000/optimizer.bin +3 -0
- checkpoint-9000/random_states_0.pkl +3 -0
- checkpoint-9000/scaler.pt +3 -0
- checkpoint-9000/scheduler.bin +3 -0
- checkpoint-9000/unet/config.json +60 -0
- checkpoint-9000/unet/diffusion_pytorch_model.bin +3 -0
- checkpoint-9000/unet_ema/config.json +67 -0
- checkpoint-9000/unet_ema/diffusion_pytorch_model.bin +3 -0
- checkpoint-9500/optimizer.bin +3 -0
- checkpoint-9500/random_states_0.pkl +3 -0
checkpoint-10000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3461f23d40cad5af783e587ff9f3f6260c623437cdd5b85b93162c05378951e8
|
3 |
+
size 73251413
|
checkpoint-10000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:852b8476e89ba9ca5d3b25b798857f40f02fdf04681cf82395053e27e3d3ae05
|
3 |
+
size 14663
|
checkpoint-10000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9be2ad76dcbc923b00e6a142f6db62aad4a46c47bb83864ccb68ddc899d0ce78
|
3 |
+
size 557
|
checkpoint-10000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f1bb79807602853a9b929a33930e620d3677c056b865ac90c06fdbcf9fe5a39
|
3 |
+
size 563
|
checkpoint-10000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-10000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd5dcebaea0b32d33b85641dd3cb1452713faa00880a7e40026487baf54cb489
|
3 |
+
size 36621969
|
checkpoint-10000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 10000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-10000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a7a58232fc4bca56bdccfc5651ede62692b6b9ef4c2e922b592b6e5afc488dc
|
3 |
+
size 36616081
|
checkpoint-7000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7f5d59b7e393078953eff769f6b788d77aa9efbff6af00e2e761479e22a74f3
|
3 |
+
size 73251413
|
checkpoint-7000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:591d6d4d059dc97c7659a135895e593d93af39b1c25c432bdfca1f644cc6e698
|
3 |
+
size 14663
|
checkpoint-7000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d22aed3a858ee389297b2101bb2ed7ee9e37744f1a1f75273dbdf045d65b041a
|
3 |
+
size 557
|
checkpoint-7000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5ffa669c96b14b85dd0b293ca82f551eb33c2fe4c81ccb71442e454826f0525
|
3 |
+
size 563
|
checkpoint-7000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-7000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62e4469e7d57c318031d778d85c27b45b281aa539fb0256099c302eda379dd56
|
3 |
+
size 36621969
|
checkpoint-7000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 7000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-7000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c8ceb1273db471f16e62f0087e4a3cd414c62c7a392e3877e8e82143651a321
|
3 |
+
size 36616081
|
checkpoint-7500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9485ad1321d89efa5b5c76eb67df347001c6a3864ed8a55ee5d7cd84656a88d
|
3 |
+
size 73251413
|
checkpoint-7500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b378e80df497993a2202f8309cf0d1ebaa089d805885b310d1187c43875462d1
|
3 |
+
size 14663
|
checkpoint-7500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fab868730e2cdc5d83f898b6c5399b352e14373e48bdbdfa9179803e96fd314f
|
3 |
+
size 557
|
checkpoint-7500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:facedcdc17eb26e1728619ebe64654dc4fd1908b60d23ecb9f21dc05c8bd1136
|
3 |
+
size 563
|
checkpoint-7500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-7500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f7dc2a519753a97c06a9b38d0fb1fe3eae7eb809059847ac3585c4f2c9f93b0
|
3 |
+
size 36621969
|
checkpoint-7500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 7500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-7500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4fc91cbb312284924ea0c1af0b1c076168ef0d2f5843c097962cecdb91d38d8
|
3 |
+
size 36616081
|
checkpoint-8000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28511e509205687dc07a5c92676cb95aedf6a72a2bec4f7f105449f00197a9ee
|
3 |
+
size 73251413
|
checkpoint-8000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:751afdbaf6c1bfba002501fa84058ab837f7e3fc7182aa1201a93617028de380
|
3 |
+
size 14663
|
checkpoint-8000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b278cd6e09360f31a3d837f80dee4c2ce4d9c9d186a939ecf157e1a0deb793f3
|
3 |
+
size 557
|
checkpoint-8000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d94c1d7c3e2abb40d6062281af4303f8cef91c9fa7a7d997f1cc9c88abcf650
|
3 |
+
size 563
|
checkpoint-8000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-8000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cd07fd95f5ac75626a08bd003ea15c7cacd630ecbadca9f7e979b92ce286d97
|
3 |
+
size 36621969
|
checkpoint-8000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 8000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-8000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c9c030559358248221cb1e409719df455ca3deb8d2835114b157fa3572db848
|
3 |
+
size 36616081
|
checkpoint-8500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f89ad1c2f73469bb21f1944a0b3370bfaf719ef99325248b8603b7ed275f921
|
3 |
+
size 73251413
|
checkpoint-8500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ef629902f50f8c547877a9c1b35eb6779d4489e90fef1853db3a8920168f1d9
|
3 |
+
size 14663
|
checkpoint-8500/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ed0eced7c80f9d236fedf48c2537ab9b4e6957d5129ef3aec426e866324bfd1
|
3 |
+
size 557
|
checkpoint-8500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8a36ce5f73caf5b02af6dfbe5f7940870d5612887621a11651ef28fa88084ef
|
3 |
+
size 563
|
checkpoint-8500/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-8500/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9be248b149100ef7209d0716a1b0f02aed97d503489f23e0afea999ffc4f3487
|
3 |
+
size 36621969
|
checkpoint-8500/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 8500,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-8500/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1feb02d8d019532605d12e559279c5fc97fdf1b3fe700a61732f68446d5dbf4b
|
3 |
+
size 36616081
|
checkpoint-9000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4e26421234c8e5db4534258d3b4d8d86c5cfce8fed7742b5e581d9021031af6
|
3 |
+
size 73251413
|
checkpoint-9000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac5be4875559e7991191515194cec5555fd9e7d029815ef533e84328e06e1d40
|
3 |
+
size 14663
|
checkpoint-9000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4be7a7b56cfc3e79d33648a4c49d4f11c6593d8d653b129207b2e38f2684a284
|
3 |
+
size 557
|
checkpoint-9000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bea4d834a8bceefe229ff7073ce740a413ead6db8f7c0c937e081bb6dee7f57c
|
3 |
+
size 563
|
checkpoint-9000/unet/config.json
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"down_block_types": [
|
22 |
+
"DownBlock2D",
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"CrossAttnDownBlock2D"
|
26 |
+
],
|
27 |
+
"downsample_padding": 1,
|
28 |
+
"dual_cross_attention": false,
|
29 |
+
"encoder_hid_dim": null,
|
30 |
+
"flip_sin_to_cos": true,
|
31 |
+
"freq_shift": 0,
|
32 |
+
"in_channels": 3,
|
33 |
+
"layers_per_block": 2,
|
34 |
+
"mid_block_only_cross_attention": null,
|
35 |
+
"mid_block_scale_factor": 1,
|
36 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
37 |
+
"norm_eps": 1e-05,
|
38 |
+
"norm_num_groups": 32,
|
39 |
+
"num_class_embeds": null,
|
40 |
+
"only_cross_attention": false,
|
41 |
+
"out_channels": 3,
|
42 |
+
"projection_class_embeddings_input_dim": null,
|
43 |
+
"resnet_out_scale_factor": 1.0,
|
44 |
+
"resnet_skip_time_act": false,
|
45 |
+
"resnet_time_scale_shift": "default",
|
46 |
+
"sample_size": 256,
|
47 |
+
"time_cond_proj_dim": null,
|
48 |
+
"time_embedding_act_fn": null,
|
49 |
+
"time_embedding_dim": null,
|
50 |
+
"time_embedding_type": "positional",
|
51 |
+
"timestep_post_act": null,
|
52 |
+
"up_block_types": [
|
53 |
+
"CrossAttnUpBlock2D",
|
54 |
+
"UpBlock2D",
|
55 |
+
"UpBlock2D",
|
56 |
+
"UpBlock2D"
|
57 |
+
],
|
58 |
+
"upcast_attention": false,
|
59 |
+
"use_linear_projection": false
|
60 |
+
}
|
checkpoint-9000/unet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4016a37dd139a39b303d25450933460fdad7267ef0d7578b3ca2abb3e877dbe4
|
3 |
+
size 36621969
|
checkpoint-9000/unet_ema/config.json
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "UNet2DConditionModel",
|
3 |
+
"_diffusers_version": "0.16.1",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": null,
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"attention_head_dim": 8,
|
8 |
+
"block_out_channels": [
|
9 |
+
64,
|
10 |
+
64,
|
11 |
+
128,
|
12 |
+
128
|
13 |
+
],
|
14 |
+
"center_input_sample": false,
|
15 |
+
"class_embed_type": null,
|
16 |
+
"class_embeddings_concat": false,
|
17 |
+
"conv_in_kernel": 3,
|
18 |
+
"conv_out_kernel": 3,
|
19 |
+
"cross_attention_dim": 256,
|
20 |
+
"cross_attention_norm": null,
|
21 |
+
"decay": 0.9999,
|
22 |
+
"down_block_types": [
|
23 |
+
"DownBlock2D",
|
24 |
+
"DownBlock2D",
|
25 |
+
"DownBlock2D",
|
26 |
+
"CrossAttnDownBlock2D"
|
27 |
+
],
|
28 |
+
"downsample_padding": 1,
|
29 |
+
"dual_cross_attention": false,
|
30 |
+
"encoder_hid_dim": null,
|
31 |
+
"flip_sin_to_cos": true,
|
32 |
+
"freq_shift": 0,
|
33 |
+
"in_channels": 3,
|
34 |
+
"inv_gamma": 1.0,
|
35 |
+
"layers_per_block": 2,
|
36 |
+
"mid_block_only_cross_attention": null,
|
37 |
+
"mid_block_scale_factor": 1,
|
38 |
+
"mid_block_type": "UNetMidBlock2DCrossAttn",
|
39 |
+
"min_decay": 0.0,
|
40 |
+
"norm_eps": 1e-05,
|
41 |
+
"norm_num_groups": 32,
|
42 |
+
"num_class_embeds": null,
|
43 |
+
"only_cross_attention": false,
|
44 |
+
"optimization_step": 9000,
|
45 |
+
"out_channels": 3,
|
46 |
+
"power": 0.75,
|
47 |
+
"projection_class_embeddings_input_dim": null,
|
48 |
+
"resnet_out_scale_factor": 1.0,
|
49 |
+
"resnet_skip_time_act": false,
|
50 |
+
"resnet_time_scale_shift": "default",
|
51 |
+
"sample_size": 256,
|
52 |
+
"time_cond_proj_dim": null,
|
53 |
+
"time_embedding_act_fn": null,
|
54 |
+
"time_embedding_dim": null,
|
55 |
+
"time_embedding_type": "positional",
|
56 |
+
"timestep_post_act": null,
|
57 |
+
"up_block_types": [
|
58 |
+
"CrossAttnUpBlock2D",
|
59 |
+
"UpBlock2D",
|
60 |
+
"UpBlock2D",
|
61 |
+
"UpBlock2D"
|
62 |
+
],
|
63 |
+
"upcast_attention": false,
|
64 |
+
"update_after_step": 0,
|
65 |
+
"use_ema_warmup": true,
|
66 |
+
"use_linear_projection": false
|
67 |
+
}
|
checkpoint-9000/unet_ema/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e53447dff3025dc5320871a1df84f9e4e7ce3831374133310101a7622356c31
|
3 |
+
size 36616081
|
checkpoint-9500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:866c325db787f5fac5c272c689eb6f29ff4ef59ee4bd68780d0daaa160186e21
|
3 |
+
size 73251413
|
checkpoint-9500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c8f57baeef99ba3d0630be969218cce5a7c7606412ed67f0af2c4a395e4565b
|
3 |
+
size 14663
|