Update app.py
Browse files
app.py
CHANGED
@@ -39,10 +39,11 @@ retriever = vectordb.as_retriever()
|
|
39 |
#)
|
40 |
|
41 |
from transformers import pipeline
|
42 |
-
from transformers import AutoTokenizer, BitsAndBytesConfig
|
|
|
43 |
|
44 |
READER_MODEL = "HuggingFaceH4/zephyr-7b-beta"
|
45 |
-
bnb_config = BitsAndBytesConfig(load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=
|
46 |
model = AutoModelForCausalLM.from_pretrained(READER_MODEL, quantization_config=bnb_config)
|
47 |
tokenizer = AutoTokenizer.from_pretrained(READER_MODEL)
|
48 |
|
|
|
39 |
#)
|
40 |
|
41 |
from transformers import pipeline
|
42 |
+
from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
|
43 |
+
|
44 |
|
45 |
READER_MODEL = "HuggingFaceH4/zephyr-7b-beta"
|
46 |
+
bnb_config = BitsAndBytesConfig(load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=bfloat16)
|
47 |
model = AutoModelForCausalLM.from_pretrained(READER_MODEL, quantization_config=bnb_config)
|
48 |
tokenizer = AutoTokenizer.from_pretrained(READER_MODEL)
|
49 |
|