Commit c7d725d
Parent(s): 8947670

speed up demo

Files changed:
- README.md: +1 -2
- app.py: +7 -3
- requirements.txt: +7 -4
README.md CHANGED
@@ -4,10 +4,9 @@ emoji: 👀
 colorFrom: pink
 colorTo: purple
 sdk: gradio
-sdk_version:
+sdk_version: 4.1.1
 app_file: app.py
 pinned: false
-license: agpl-3.0
 ---
 
 Inference Code: https://github.com/PixArt-alpha/PixArt-alpha
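Note: on Hugging Face Spaces, the `sdk_version` field in the README front matter selects the Gradio runtime for the Space, so pinning it to 4.1.1 keeps it in step with the `gradio==4.1.1` entry in requirements.txt below.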
app.py CHANGED
@@ -22,7 +22,7 @@ if not torch.cuda.is_available():
 MAX_SEED = np.iinfo(np.int32).max
 CACHE_EXAMPLES = torch.cuda.is_available() and os.getenv("CACHE_EXAMPLES", "1") == "1"
 MAX_IMAGE_SIZE = int(os.getenv("MAX_IMAGE_SIZE", "1024"))
-USE_TORCH_COMPILE = os.getenv("USE_TORCH_COMPILE", "
+USE_TORCH_COMPILE = os.getenv("USE_TORCH_COMPILE", "0") == "1"
 ENABLE_CPU_OFFLOAD = os.getenv("ENABLE_CPU_OFFLOAD", "0") == "1"
 
 device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
@@ -96,6 +96,7 @@ if torch.cuda.is_available():
     pipe = PixArtAlphaPipeline.from_pretrained(
         "PixArt-alpha/PixArt-XL-2-1024-MS",
         torch_dtype=torch.float16,
+        variant="fp16",
         use_safetensors=True,
     )
 
@@ -105,6 +106,9 @@ if torch.cuda.is_available():
     pipe.to(device)
     print("Loaded on Device!")
 
+    # speed-up T5
+    pipe.text_encoder.to_bettertransformer()
+
     if USE_TORCH_COMPILE:
         pipe.transformer = torch.compile(
             pipe.transformer, mode="reduce-overhead", fullgraph=True
@@ -254,7 +258,6 @@ with gr.Blocks(css="style.css") as demo:
         fn=lambda x: gr.update(visible=x),
         inputs=use_negative_prompt,
         outputs=negative_prompt,
-        queue=False,
         api_name=False,
     )
 
@@ -282,4 +285,5 @@ with gr.Blocks(css="style.css") as demo:
 )
 
 if __name__ == "__main__":
-    demo.queue(max_size=20).launch()
+    # demo.queue(max_size=20).launch()
+    demo.launch(share=True)
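Taken together, the app.py changes cut both download and inference time: the fp16 weight variant fetches only the half-precision checkpoint files, BetterTransformer accelerates the T5 text encoder, and torch.compile stays opt-in behind USE_TORCH_COMPILE. A minimal standalone sketch of the resulting load path, assuming a CUDA machine with the pinned dependencies installed; note that `to_bettertransformer()` additionally requires the `optimum` package, which this commit does not pin, and the prompt below is a hypothetical example:

```python
# Sketch of the sped-up load path from this commit (assumptions noted above).
import torch
from diffusers import PixArtAlphaPipeline

device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

pipe = PixArtAlphaPipeline.from_pretrained(
    "PixArt-alpha/PixArt-XL-2-1024-MS",
    torch_dtype=torch.float16,
    variant="fp16",          # download only the half-precision weight files
    use_safetensors=True,
)
pipe.to(device)

# speed-up T5: swap the text encoder's attention for BetterTransformer
# kernels (requires the optimum package to be installed)
pipe.text_encoder.to_bettertransformer()

# optional, gated behind USE_TORCH_COMPILE in the demo:
# pipe.transformer = torch.compile(
#     pipe.transformer, mode="reduce-overhead", fullgraph=True
# )

image = pipe("a red panda reading a book").images[0]  # hypothetical prompt
image.save("out.png")
```

The Gradio-side changes point the same way: dropping `queue=False` from the checkbox event and launching with `demo.launch(share=True)` instead of `demo.queue(max_size=20).launch()` removes queueing overhead, at the cost of the queue's concurrency limit.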
requirements.txt CHANGED
@@ -1,7 +1,10 @@
-
-
+--index-url https://download.pytorch.org/whl/cu118
+torch==2.0.1
+
+diffusers==0.22.1
+accelerate
+transformers
 gradio==4.1.1
 Pillow==10.1.0
-torch==2.0.1
-transformers==4.35.0
 sentencepiece==0.1.99
+
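The reworked requirements resolve torch 2.0.1 from the CUDA 11.8 wheel index (pip applies a `--index-url` line in a requirements file to the whole install) and add `diffusers==0.22.1`, which ships the `PixArtAlphaPipeline` that app.py imports. A quick smoke test to confirm the CUDA build was actually picked up after `pip install -r requirements.txt`, assuming the install succeeded on a machine with an NVIDIA GPU:

```python
# Verify that the CUDA 11.8 torch wheel resolved, not the CPU-only build.
import torch

print(torch.__version__)          # expected: 2.0.1+cu118
print(torch.version.cuda)         # expected: 11.8
print(torch.cuda.is_available())  # True on a machine with an NVIDIA GPU
```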