Hackoor committed on
Commit
98059c3
·
1 Parent(s): 0c9339e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -61,7 +61,7 @@ def create_conversational_chain(vector_store):
61
  load_dotenv()
62
  # Create llm
63
  llm = CTransformers(streaming=True,
64
- model = AutoModel.from_pretrained("NousResearch/Nous-Hermes-llama-2-7b"),
65
  callbacks=[StreamingStdOutCallbackHandler()],
66
  model_type="llama", config={'max_new_tokens': 500, 'temperature': 0.01})
67
  # llm = Replicate(
 
61
  load_dotenv()
62
  # Create llm
63
  llm = CTransformers(streaming=True,
64
+ model = AutoModelForCausalLM.from_pretrained("NousResearch/Nous-Hermes-llama-2-7b", device_map='auto',torch_dtype=torch.float16,load_in_4bit=True, token=True ),
65
  callbacks=[StreamingStdOutCallbackHandler()],
66
  model_type="llama", config={'max_new_tokens': 500, 'temperature': 0.01})
67
  # llm = Replicate(