Spaces:

KoonJamesZ
/

ccib-qwen

Sleeping

KoonJamesZ committed on Dec 17, 2024

Commit

1df3240

verified ·

1 Parent(s): 3abaf20

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -14,27 +14,20 @@ import uuid
 import uuid
 from ultralytics import YOLO
 import gradio as gr
-import subprocess
-import sys
-try:
-    # Run the pip command
-    subprocess.check_call([sys.executable, "-m", "pip", "install", "flash-attn", "--no-build-isolation"])
-    print("flash-attn installed successfully.")
-except subprocess.CalledProcessError as e:
-    print(f"An error occurred while installing flash-attn: {e}")
-# # default: Load the model on the available device(s)
-# model = Qwen2VLForConditionalGeneration.from_pretrained(
-#     "Qwen/Qwen2-VL-7B-Instruct", torch_dtype="auto", device_map="auto"
-# )
-# We recommend enabling flash_attention_2 for better acceleration and memory saving, especially in multi-image and video scenarios.
 model = Qwen2VLForConditionalGeneration.from_pretrained(
-    "Qwen/Qwen2-VL-7B-Instruct",
-    torch_dtype=torch.bfloat16,
-    attn_implementation="flash_attention_2",
-    device_map="auto",
 )
 # default processer
 processor = AutoProcessor.from_pretrained("Qwen/Qwen2-VL-7B-Instruct")

 import uuid
 from ultralytics import YOLO
 import gradio as gr
+# # default: Load the model on the available device(s)
 model = Qwen2VLForConditionalGeneration.from_pretrained(
+    "Qwen/Qwen2-VL-7B-Instruct", torch_dtype="auto", device_map="auto"
 )
+# We recommend enabling flash_attention_2 for better acceleration and memory saving, especially in multi-image and video scenarios.
+# model = Qwen2VLForConditionalGeneration.from_pretrained(
+#     "Qwen/Qwen2-VL-7B-Instruct",
+#     torch_dtype=torch.bfloat16,
+#     attn_implementation="flash_attention_2",
+#     device_map="auto",
+# )
 # default processer
 processor = AutoProcessor.from_pretrained("Qwen/Qwen2-VL-7B-Instruct")