Epoch 339

Browse files

Files changed (4) hide show

model_index.json +3 -3
scheduler/scheduler_config.json +1 -1
unet/config.json +48 -19
unet/diffusion_pytorch_model.safetensors +2 -2

model_index.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "_class_name": "DDPMPipeline",
-  "_diffusers_version": "0.29.0",
   "scheduler": [
     "diffusers",
     "DDIMScheduler"
   ],
   "unet": [
-    "diffusers",
-    "UNet2DModel"
   ]
 }

 {
   "_class_name": "DDPMPipeline",
+  "_diffusers_version": "0.29.2",
   "scheduler": [
     "diffusers",
     "DDIMScheduler"
   ],
   "unet": [
+    "audioldm2",
+    "AudioLDM2UNet2DConditionModel"
   ]
 }

scheduler/scheduler_config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "_class_name": "DDIMScheduler",
-  "_diffusers_version": "0.29.0",
   "beta_end": 0.0195,
   "beta_schedule": "scaled_linear",
   "beta_start": 0.0015,

 {
   "_class_name": "DDIMScheduler",
+  "_diffusers_version": "0.29.2",
   "beta_end": 0.0195,
   "beta_schedule": "scaled_linear",
   "beta_start": 0.0015,

unet/config.json CHANGED Viewed

@@ -1,46 +1,75 @@
 {
-  "_class_name": "UNet2DModel",
-  "_diffusers_version": "0.29.0",
-  "_name_or_path": "michaelpiro1/train_model",
   "act_fn": "silu",
-  "add_attention": true,
   "attention_head_dim": 8,
-  "attn_norm_num_groups": null,
   "block_out_channels": [
     128,
     256,
     384,
     640
   ],
-  "center_input_sample": false,
   "class_embed_type": null,
   "down_block_types": [
-    "AttnDownBlock2D",
-    "AttnDownBlock2D",
-    "AttnDownBlock2D",
-    "DownBlock2D"
   ],
   "downsample_padding": 1,
-  "downsample_type": "conv",
-  "dropout": 0.0,
   "flip_sin_to_cos": true,
   "freq_shift": 0,
   "in_channels": 16,
   "layers_per_block": 2,
   "mid_block_scale_factor": 1,
   "norm_eps": 1e-05,
   "norm_num_groups": 32,
   "num_class_embeds": null,
-  "num_train_timesteps": null,
   "out_channels": 8,
   "resnet_time_scale_shift": "default",
-  "sample_size": 512,
   "time_embedding_type": "positional",
   "up_block_types": [
-    "UpBlock2D",
-    "AttnUpBlock2D",
-    "AttnUpBlock2D",
-    "AttnUpBlock2D"
   ],
-  "upsample_type": "conv"
 }

 {
+  "_class_name": "AudioLDM2UNet2DConditionModel",
+  "_diffusers_version": "0.29.2",
+  "_name_or_path": "michaelpiro1/new_unet_fromLDM",
   "act_fn": "silu",
   "attention_head_dim": 8,
   "block_out_channels": [
     128,
     256,
     384,
     640
   ],
   "class_embed_type": null,
+  "class_embeddings_concat": false,
+  "conv_in_kernel": 3,
+  "conv_out_kernel": 3,
+  "cross_attention_dim": [
+    [
+      null,
+      768,
+      1024
+    ],
+    [
+      null,
+      768,
+      1024
+    ],
+    [
+      null,
+      768,
+      1024
+    ],
+    [
+      null,
+      768,
+      1024
+    ]
+  ],
   "down_block_types": [
+    "DownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D",
+    "CrossAttnDownBlock2D"
   ],
   "downsample_padding": 1,
   "flip_sin_to_cos": true,
   "freq_shift": 0,
   "in_channels": 16,
   "layers_per_block": 2,
   "mid_block_scale_factor": 1,
+  "mid_block_type": "UNetMidBlock2DCrossAttn",
   "norm_eps": 1e-05,
   "norm_num_groups": 32,
+  "num_attention_heads": null,
   "num_class_embeds": null,
+  "only_cross_attention": false,
   "out_channels": 8,
+  "projection_class_embeddings_input_dim": null,
   "resnet_time_scale_shift": "default",
+  "sample_size": 256,
+  "time_cond_proj_dim": null,
+  "time_embedding_act_fn": null,
+  "time_embedding_dim": null,
   "time_embedding_type": "positional",
+  "timestep_post_act": null,
+  "transformer_layers_per_block": 1,
   "up_block_types": [
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "CrossAttnUpBlock2D",
+    "UpBlock2D"
   ],
+  "upcast_attention": false,
+  "use_linear_projection": false
 }

unet/diffusion_pytorch_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a66bdec9ac60336ec587a112d0a8f393e3e03aedf031de9ad896506c988cac71
-size 436573952

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f41f2714c77930fc77408b3ee1ddad1edfd3574d33045b51f1574f697db4340
+size 1388001648