Namitg02 committed on
Commit
fae8f63
·
verified ·
1 Parent(s): f868774

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -43,8 +43,8 @@ from transformers import AutoTokenizer, AutoModelForCausalLM
43
 
44
 
45
  READER_MODEL = "HuggingFaceH4/zephyr-7b-beta"
46
- #bnb_config = BitsAndBytesConfig(load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4")
47
- model = AutoModelForCausalLM.from_pretrained(READER_MODEL)
48
  tokenizer = AutoTokenizer.from_pretrained(READER_MODEL)
49
 
50
  from langchain.llms import HuggingFacePipeline
 
43
 
44
 
45
  READER_MODEL = "HuggingFaceH4/zephyr-7b-beta"
46
+ #bnb_config = BitsAndBytesConfig(load_in_4bit=True, bnb_4bit_use_double_quant=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.float16)
47
+ model = AutoModelForCausalLM.from_pretrained(READER_MODEL,quantization_config=bnb_config)
48
  tokenizer = AutoTokenizer.from_pretrained(READER_MODEL)
49
 
50
  from langchain.llms import HuggingFacePipeline