KoonJamesZ committed on
Commit
d96324e
·
verified ·
1 Parent(s): 28f7346

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -9
app.py CHANGED
@@ -16,18 +16,18 @@ from ultralytics import YOLO
16
  import gradio as gr
17
 
18
  # # default: Load the model on the available device(s)
19
- # model = Qwen2VLForConditionalGeneration.from_pretrained(
20
- # "Qwen/Qwen2-VL-7B-Instruct", torch_dtype="auto", device_map="auto"
21
- # )
22
-
23
- # We recommend enabling flash_attention_2 for better acceleration and memory saving, especially in multi-image and video scenarios.
24
  model = Qwen2VLForConditionalGeneration.from_pretrained(
25
- "Qwen/Qwen2-VL-7B-Instruct",
26
- torch_dtype=torch.bfloat16,
27
- attn_implementation="flash_attention_2",
28
- device_map="auto",
29
  )
30
 
 
 
 
 
 
 
 
 
31
  # default processer
32
  processor = AutoProcessor.from_pretrained("Qwen/Qwen2-VL-7B-Instruct")
33
 
 
16
  import gradio as gr
17
 
18
  # # default: Load the model on the available device(s)
 
 
 
 
 
19
  model = Qwen2VLForConditionalGeneration.from_pretrained(
20
+ "Qwen/Qwen2-VL-7B-Instruct", torch_dtype="auto", device_map="auto"
 
 
 
21
  )
22
 
23
+ # We recommend enabling flash_attention_2 for better acceleration and memory saving, especially in multi-image and video scenarios.
24
+ # model = Qwen2VLForConditionalGeneration.from_pretrained(
25
+ # "Qwen/Qwen2-VL-7B-Instruct",
26
+ # torch_dtype=torch.bfloat16,
27
+ # attn_implementation="flash_attention_2",
28
+ # device_map="auto",
29
+ # )
30
+
31
  # default processer
32
  processor = AutoProcessor.from_pretrained("Qwen/Qwen2-VL-7B-Instruct")
33