Update app.py
Browse files
app.py
CHANGED
@@ -34,8 +34,8 @@ cache_dir = "/data"
|
|
34 |
# )
|
35 |
model = Llama4ForConditionalGeneration.from_pretrained(
|
36 |
model_name,
|
37 |
-
#
|
38 |
-
|
39 |
# gguf_file=filename,
|
40 |
cache_dir = cache_dir,
|
41 |
torch_dtype=torch_dtype,
|
|
|
34 |
# )
|
35 |
model = Llama4ForConditionalGeneration.from_pretrained(
|
36 |
model_name,
|
37 |
+
# default is eager attention
|
38 |
+
attn_implementation="flex_attention",
|
39 |
# gguf_file=filename,
|
40 |
cache_dir = cache_dir,
|
41 |
torch_dtype=torch_dtype,
|