Spaces:

rahul7star
/

ai-toolkit

Running

App Files Files Community

rahul7star committed on Jun 3

Commit

cdc4fd7

verified ·

1 Parent(s): d446991

Update toolkit/models/diffusion_feature_extraction.py

Browse files

Files changed (1) hide show

toolkit/models/diffusion_feature_extraction.py +21 -21

toolkit/models/diffusion_feature_extraction.py CHANGED Viewed

@@ -255,30 +255,30 @@ class DiffusionFeatureExtractor3(nn.Module):
         dtype = torch.bfloat16
         device = self.vae.device
-        # first we step the scheduler from current timestep to the very end for a full denoise
-        # bs = noise_pred.shape[0]
-        # noise_pred_chunks = torch.chunk(noise_pred, bs)
-        # timestep_chunks = torch.chunk(timesteps, bs)
-        # noisy_latent_chunks = torch.chunk(noisy_latents, bs)
-        # stepped_chunks = []
-        # for idx in range(bs):
-        #     model_output = noise_pred_chunks[idx]
-        #     timestep = timestep_chunks[idx]
-        #     scheduler._step_index = None
-        #     scheduler._init_step_index(timestep)
-        #     sample = noisy_latent_chunks[idx].to(torch.float32)
-        #     sigma = scheduler.sigmas[scheduler.step_index]
-        #     sigma_next = scheduler.sigmas[-1] # use last sigma for final step
-        #     prev_sample = sample + (sigma_next - sigma) * model_output
-        #     stepped_chunks.append(prev_sample)
-        # stepped_latents = torch.cat(stepped_chunks, dim=0)
         if model is not None and hasattr(model, 'get_stepped_pred'):
             stepped_latents = model.get_stepped_pred(noise_pred, noise)
         else:
-            stepped_latents = noise - noise_pred
         latents = stepped_latents.to(self.vae.device, dtype=self.vae.dtype)
@@ -374,4 +374,4 @@ def load_dfe(model_path, vae=None) -> DiffusionFeatureExtractor:
     dfe.load_state_dict(state_dict)
     dfe.eval()
-    return dfe

         dtype = torch.bfloat16
         device = self.vae.device
         if model is not None and hasattr(model, 'get_stepped_pred'):
             stepped_latents = model.get_stepped_pred(noise_pred, noise)
         else:
+            # stepped_latents = noise - noise_pred
+            # first we step the scheduler from current timestep to the very end for a full denoise
+            bs = noise_pred.shape[0]
+            noise_pred_chunks = torch.chunk(noise_pred, bs)
+            timestep_chunks = torch.chunk(timesteps, bs)
+            noisy_latent_chunks = torch.chunk(noisy_latents, bs)
+            stepped_chunks = []
+            for idx in range(bs):
+                model_output = noise_pred_chunks[idx]
+                timestep = timestep_chunks[idx]
+                scheduler._step_index = None
+                scheduler._init_step_index(timestep)
+                sample = noisy_latent_chunks[idx].to(torch.float32)
+                sigma = scheduler.sigmas[scheduler.step_index]
+                sigma_next = scheduler.sigmas[-1] # use last sigma for final step
+                prev_sample = sample + (sigma_next - sigma) * model_output
+                stepped_chunks.append(prev_sample)
+            stepped_latents = torch.cat(stepped_chunks, dim=0)
         latents = stepped_latents.to(self.vae.device, dtype=self.vae.dtype)
     dfe.load_state_dict(state_dict)
     dfe.eval()
+    return dfe