chenjoya committed on
Commit
eba7e84
·
verified ·
1 Parent(s): c1771c7

Update demo/infer.py

Browse files
Files changed (1) hide show
  1. demo/infer.py +1 -1
demo/infer.py CHANGED
@@ -36,7 +36,7 @@ class LiveCCDemoInfer:
36
  self.model = Qwen2VLForConditionalGeneration.from_pretrained(
37
  model_path, torch_dtype="auto",
38
  device_map=f'cuda:{device_id}',
39
- attn_implementation='flash_attention_2'
40
  )
41
  self.processor = AutoProcessor.from_pretrained(model_path, use_fast=False)
42
  self.streaming_eos_token_id = self.processor.tokenizer(' ...').input_ids[-1]
 
36
  self.model = Qwen2VLForConditionalGeneration.from_pretrained(
37
  model_path, torch_dtype="auto",
38
  device_map=f'cuda:{device_id}',
39
+ # attn_implementation='flash_attention_2'
40
  )
41
  self.processor = AutoProcessor.from_pretrained(model_path, use_fast=False)
42
  self.streaming_eos_token_id = self.processor.tokenizer(' ...').input_ids[-1]