ccm committed on
Commit
c759f50
·
verified ·
1 Parent(s): 2b9ca20

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -68,7 +68,7 @@ publication_vectorstore = langchain_community.vectorstores.FAISS.load_local(
68
 
69
  # Create the callable LLM
70
  llm = transformers.pipeline(
71
- task="text-generation", model="Qwen/Qwen2.5-7B-Instruct-GPTQ-Int4", device="cuda"
72
  )
73
 
74
 
 
68
 
69
  # Create the callable LLM
70
  llm = transformers.pipeline(
71
+ task="text-generation", model="Qwen/Qwen2.5-7B-Instruct-AWQ", device="cuda", attn_implementation="flash_attention_2"
72
  )
73
 
74