chenjoya committed on
Commit
bac1c17
·
verified ·
1 Parent(s): 267e889

Update demo/infer.py

Browse files
Files changed (1) hide show
  1. demo/infer.py +1 -2
demo/infer.py CHANGED
@@ -36,9 +36,8 @@ class LiveCCDemoInfer:
36
  self.model = Qwen2VLForConditionalGeneration.from_pretrained(
37
  model_path, torch_dtype="auto",
38
  device_map=device,
39
- # attn_implementation='flash_attention_2'
40
  )
41
- self.model.to(device)
42
  self.processor = AutoProcessor.from_pretrained(model_path, use_fast=False)
43
  self.streaming_eos_token_id = self.processor.tokenizer(' ...').input_ids[-1]
44
  self.model.prepare_inputs_for_generation = functools.partial(prepare_multiturn_multimodal_inputs_for_generation, self.model)
 
36
  self.model = Qwen2VLForConditionalGeneration.from_pretrained(
37
  model_path, torch_dtype="auto",
38
  device_map=device,
39
+ attn_implementation='sdpa'
40
  )
 
41
  self.processor = AutoProcessor.from_pretrained(model_path, use_fast=False)
42
  self.streaming_eos_token_id = self.processor.tokenizer(' ...').input_ids[-1]
43
  self.model.prepare_inputs_for_generation = functools.partial(prepare_multiturn_multimodal_inputs_for_generation, self.model)