Spaces: Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -61,7 +61,7 @@ def create_conversational_chain(vector_store):
|
|
61 |
load_dotenv()
|
62 |
# Create llm
|
63 |
llm = CTransformers(streaming=True,
|
64 |
-
model =
|
65 |
callbacks=[StreamingStdOutCallbackHandler()],
|
66 |
model_type="llama", config={'max_new_tokens': 500, 'temperature': 0.01})
|
67 |
# llm = Replicate(
|
|
|
61 |
load_dotenv()
|
62 |
# Create llm
|
63 |
llm = CTransformers(streaming=True,
|
64 |
+
model = AutoModelForCausalLM.from_pretrained("NousResearch/Nous-Hermes-llama-2-7b", device_map='auto',torch_dtype=torch.float16,load_in_4bit=True, token=True ),
|
65 |
callbacks=[StreamingStdOutCallbackHandler()],
|
66 |
model_type="llama", config={'max_new_tokens': 500, 'temperature': 0.01})
|
67 |
# llm = Replicate(
|