Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -8,7 +8,7 @@ model, tokenizer = FastLanguageModel.from_pretrained(
|
|
8 |
max_seq_length = 2048,
|
9 |
dtype = torch.float16,
|
10 |
load_in_4bit = True,
|
11 |
-
)
|
12 |
FastLanguageModel.for_inference(model)
|
13 |
|
14 |
def predict(input_text):
|
@@ -20,7 +20,7 @@ def predict(input_text):
|
|
20 |
tokenize=True,
|
21 |
add_generation_prompt=True,
|
22 |
return_tensors="pt",
|
23 |
-
)
|
24 |
|
25 |
outputs = model.generate(
|
26 |
input_ids=inputs,
|
|
|
8 |
max_seq_length = 2048,
|
9 |
dtype = torch.float16,
|
10 |
load_in_4bit = True,
|
11 |
+
).to("cpu")
|
12 |
FastLanguageModel.for_inference(model)
|
13 |
|
14 |
def predict(input_text):
|
|
|
20 |
tokenize=True,
|
21 |
add_generation_prompt=True,
|
22 |
return_tensors="pt",
|
23 |
+
).to("cpu")
|
24 |
|
25 |
outputs = model.generate(
|
26 |
input_ids=inputs,
|