Tijmen2 committed on
Commit
7cd7cba
·
verified ·
1 Parent(s): ced96a4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +0 -1
app.py CHANGED
@@ -14,7 +14,6 @@ llm = Llama(
14
  n_ctx=2048,
15
  chat_format="llama-3",
16
  n_gpu_layers=-1, # ensure all layers are on GPU
17
- flash_attn=True,
18
  )
19
 
20
  # Placeholder responses for when context is empty
 
14
  n_ctx=2048,
15
  chat_format="llama-3",
16
  n_gpu_layers=-1, # ensure all layers are on GPU
 
17
  )
18
 
19
  # Placeholder responses for when context is empty