Commit
·
23063a1
1
Parent(s):
a1fbbe4
Update app.py
Browse files
app.py
CHANGED
@@ -27,7 +27,7 @@ except:
|
|
27 |
if device == "cuda":
|
28 |
model = LlamaForCausalLM.from_pretrained(
|
29 |
BASE_MODEL,
|
30 |
-
load_in_8bit=
|
31 |
torch_dtype=torch.float16,
|
32 |
device_map="auto",
|
33 |
)
|
@@ -72,7 +72,8 @@ def generate_prompt(instruction, input=None):
|
|
72 |
### Response:"""
|
73 |
|
74 |
if device != "cpu":
|
75 |
-
|
|
|
76 |
model.eval()
|
77 |
if torch.__version__ >= "2":
|
78 |
model = torch.compile(model)
|
|
|
27 |
if device == "cuda":
|
28 |
model = LlamaForCausalLM.from_pretrained(
|
29 |
BASE_MODEL,
|
30 |
+
load_in_8bit=True,
|
31 |
torch_dtype=torch.float16,
|
32 |
device_map="auto",
|
33 |
)
|
|
|
72 |
### Response:"""
|
73 |
|
74 |
if device != "cpu":
|
75 |
+
pass
|
76 |
+
#model.half()
|
77 |
model.eval()
|
78 |
if torch.__version__ >= "2":
|
79 |
model = torch.compile(model)
|