GIGAParviz committed on
Commit
d118a29
·
verified ·
1 Parent(s): 8b0d499

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -8,7 +8,7 @@ model, tokenizer = FastLanguageModel.from_pretrained(
8
  max_seq_length = 2048,
9
  dtype = torch.float16,
10
  load_in_4bit = True,
11
- )
12
  FastLanguageModel.for_inference(model)
13
 
14
  def predict(input_text):
@@ -20,7 +20,7 @@ def predict(input_text):
20
  tokenize=True,
21
  add_generation_prompt=True,
22
  return_tensors="pt",
23
- )
24
 
25
  outputs = model.generate(
26
  input_ids=inputs,
 
8
  max_seq_length = 2048,
9
  dtype = torch.float16,
10
  load_in_4bit = True,
11
+ ).to("cpu")
12
  FastLanguageModel.for_inference(model)
13
 
14
  def predict(input_text):
 
20
  tokenize=True,
21
  add_generation_prompt=True,
22
  return_tensors="pt",
23
+ ).to("cpu")
24
 
25
  outputs = model.generate(
26
  input_ids=inputs,