bobber committed on
Commit
32952ac
·
verified ·
1 Parent(s): 078e1ae

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -34,8 +34,8 @@ cache_dir = "/data"
34
  # )
35
  model = Llama4ForConditionalGeneration.from_pretrained(
36
  model_name,
37
- # flex_attention is only needed for image
38
- # attn_implementation="flex_attention",
39
  # gguf_file=filename,
40
  cache_dir = cache_dir,
41
  torch_dtype=torch_dtype,
 
34
  # )
35
  model = Llama4ForConditionalGeneration.from_pretrained(
36
  model_name,
37
+ # default is eager attention
38
+ attn_implementation="flex_attention",
39
  # gguf_file=filename,
40
  cache_dir = cache_dir,
41
  torch_dtype=torch_dtype,