peterpeter8585 committed on
Commit
85c868d
·
verified ·
1 Parent(s): 5b312c9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -1,7 +1,7 @@
1
  import os
2
  import torch
3
- from transformers import AutoModelForCausalLM as m, AutoTokenizer as t, GPTQConfig as quant
4
- qq=quant(bits=4, exllama_config={"version":2})
5
  mod=m.from_pretrained("peterpeter8585/sungyoonaimodel2", quantization_config=qq)
6
  tok=t.from_pretrained("peterpeter8585/sungyoonaimodel2", trust_remote_code=True)
7
  mod.eval()
 
1
  import os
2
  import torch
3
+ from transformers import AutoModelForCausalLM as m, AutoTokenizer as t, BitsAndBytesConfig as quant
4
+ qq=quant(load_in_8bit=True)
5
  mod=m.from_pretrained("peterpeter8585/sungyoonaimodel2", quantization_config=qq)
6
  tok=t.from_pretrained("peterpeter8585/sungyoonaimodel2", trust_remote_code=True)
7
  mod.eval()