peterpeter8585 committed on
Commit
2a75cf3
·
verified ·
1 Parent(s): fd73b3d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -1,8 +1,7 @@
1
  import os
2
  import torch
3
- from transformers import AutoModelForCausalLM as m, AutoTokenizer as t, BitsAndBytesConfig as quant
4
- qq=quant(load_in_4bit=True)
5
- mod=m.from_pretrained("peterpeter8585/sungyoonaimodel2", quantization_config=qq)
6
  tok=t.from_pretrained("peterpeter8585/sungyoonaimodel2", trust_remote_code=True)
7
  mod.eval()
8
  import requests
 
1
  import os
2
  import torch
3
+ from transformers import AutoModelForCausalLM as m, AutoTokenizer as t
4
+ mod=m.from_pretrained("peterpeter8585/sungyoonaimodel2", low_cpu_mem_usage=True)
 
5
  tok=t.from_pretrained("peterpeter8585/sungyoonaimodel2", trust_remote_code=True)
6
  mod.eval()
7
  import requests