Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1,7 +1,8 @@
|
|
1 |
import os
|
2 |
import torch
|
3 |
-
from transformers import AutoModelForCausalLM as m, AutoTokenizer as t
|
4 |
-
|
|
|
5 |
tok=t.from_pretrained("peterpeter8585/sungyoonaimodel2", trust_remote_code=True)
|
6 |
mod.eval()
|
7 |
import requests
|
|
|
1 |
import os
|
2 |
import torch
|
3 |
+
from transformers import AutoModelForCausalLM as m, AutoTokenizer as t, BitsAndBytesConfig as q
|
4 |
+
qq=q(load_in_4bit=True, bnb_4bit_quant_type="nf4", bnb_4bit_compute_dtype=torch.float16, bnb_4bit_use_double_quant=False)
|
5 |
+
mod=m.from_pretrained("peterpeter8585/sungyoonaimodel2", low_cpu_mem_usage=True, quantization_config=qq)
|
6 |
tok=t.from_pretrained("peterpeter8585/sungyoonaimodel2", trust_remote_code=True)
|
7 |
mod.eval()
|
8 |
import requests
|