jokerbit
/

flux-qa-base

Model card · Files and versions · Community

jokerbit committed on Dec 21, 2024

Commit

1793600

·

verified ·

1 Parent(s): 560e4bf

quantize

Files changed (1) hide show

src/pipeline.py +1 -1

src/pipeline.py CHANGED Viewed

@@ -50,8 +50,8 @@ def load_pipeline() -> Pipeline:
     )
     pipeline.transformer.to(memory_format=torch.channels_last)
-    #    quantize_(pipeline.vae, int8_weight_only())
     pipeline.vae.to(memory_format=torch.channels_last)
     pipeline.vae = torch.compile(pipeline.vae, mode="max-autotune", fullgraph=True)
     pipeline.to("cuda")

     )
     pipeline.transformer.to(memory_format=torch.channels_last)
     pipeline.vae.to(memory_format=torch.channels_last)
+    quantize_(pipeline.vae, int8_weight_only())
     pipeline.vae = torch.compile(pipeline.vae, mode="max-autotune", fullgraph=True)
     pipeline.to("cuda")