smoothieAI
/

pipeline_animatediff_context_controlnet

Model card Files Files and versions Community

smoothieAI committed on Jan 28, 2024

Commit

f668249

verified ·

1 Parent(s): 1a81101

Update pipeline.py

Browse files

Files changed (1) hide show

pipeline.py +23 -10

pipeline.py CHANGED Viewed

@@ -1492,19 +1492,26 @@ class AnimateDiffPipeline(DiffusionPipeline, TextualInversionLoaderMixin, IPAdap
                             added_cond_kwargs=added_cond_kwargs,
                         ).sample
-                    # sum the noise predictions for the unconditional and text conditioned noise
-                    start_guidance_time = time.time()
                     if do_classifier_free_guidance:
-                        # Split tensor along its first dimension
                         torch.cuda.synchronize()  # Synchronize GPU before starting timing
-                        time_chunk = time.time()
                         noise_pred_uncond, noise_pred_text = torch.chunk(noise_pred, 2, dim=0)
-                        torch.cuda.synchronize()  # Synchronize GPU after operation
-                        print("chunk time", time.time() - time_chunk)
                         for i, context_index in enumerate(current_context_indexes):
                             # Perform batch addition
                             noise_pred_uncond_sum[..., context_index, :, :] += noise_pred_uncond[:, :, i, :, :]
@@ -1513,8 +1520,14 @@ class AnimateDiffPipeline(DiffusionPipeline, TextualInversionLoaderMixin, IPAdap
                             # Batch increment for latent_counter
                             latent_counter[context_index] += 1
-                    print("guidance time", time.time() - start_guidance_time)
                     # set the step index to the current batch
                     self.scheduler._step_index = i

                             added_cond_kwargs=added_cond_kwargs,
                         ).sample
                     if do_classifier_free_guidance:
+                        # Start timing for overall guidance process
                         torch.cuda.synchronize()  # Synchronize GPU before starting timing
+                        start_guidance_time = time.time()
+                        # Timing for chunk operation
+                        torch.cuda.synchronize()  # Synchronize GPU before chunking
+                        time_chunk_start = time.time()
                         noise_pred_uncond, noise_pred_text = torch.chunk(noise_pred, 2, dim=0)
+                        torch.cuda.synchronize()  # Synchronize GPU after chunking
+                        time_chunk_end = time.time()
+                        print("Chunk time: {:.6f} seconds".format(time_chunk_end - time_chunk_start))
+                        # Timing for batch addition and latent counter increment
+                        torch.cuda.synchronize()  # Synchronize GPU before batch addition
+                        time_batch_addition_start = time.time()
                         for i, context_index in enumerate(current_context_indexes):
                             # Perform batch addition
                             noise_pred_uncond_sum[..., context_index, :, :] += noise_pred_uncond[:, :, i, :, :]
                             # Batch increment for latent_counter
                             latent_counter[context_index] += 1
+                        torch.cuda.synchronize()  # Synchronize GPU after batch addition
+                        time_batch_addition_end = time.time()
+                        print("Batch addition and counter increment time: {:.6f} seconds".format(time_batch_addition_end - time_batch_addition_start))
+                        # End timing for overall guidance process
+                        torch.cuda.synchronize()  # Synchronize GPU after overall guidance process
+                        end_guidance_time = time.time()
+                        print("Total guidance time: {:.6f} seconds".format(end_guidance_time - start_guidance_time))
                     # set the step index to the current batch
                     self.scheduler._step_index = i