Spaces:

AbdulrhmanEldeeb
/

ft_metallurgy

Runtime error

AbdulrhmanEldeeb committed on Nov 29, 2024

Commit

c349adc

1 Parent(s): 2846ff5

changed to CPU 2

Files changed (2) hide show

app.py CHANGED Viewed

@@ -1,6 +1,9 @@
 from model import load_model, answer
 from components import create_app_layout
 import torch
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load the model and tokenizer

 from model import load_model, answer
 from components import create_app_layout
 import torch
+# Check if a GPU is available; otherwise, use the CPU
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load the model and tokenizer

model.py CHANGED Viewed

@@ -1,8 +1,8 @@
 from unsloth import FastLanguageModel
-import torch
 from prompts import metallurgy_prompt
-# Check if a GPU is available; otherwise, use the CPU
 def load_model():
     max_seq_length = 2048
@@ -22,7 +22,7 @@ def answer(model, tokenizer, query: str) -> str:
     inputs = tokenizer(
         [metallurgy_prompt.format(query, "", "")],
         return_tensors="pt"
-    ).to("cuda")
     outputs = model.generate(**inputs, use_cache=True)
     result = tokenizer.batch_decode(outputs)

 from unsloth import FastLanguageModel
 from prompts import metallurgy_prompt
+import torch
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 def load_model():
     max_seq_length = 2048
     inputs = tokenizer(
         [metallurgy_prompt.format(query, "", "")],
         return_tensors="pt"
+    ).to(device)
     outputs = model.generate(**inputs, use_cache=True)
     result = tokenizer.batch_decode(outputs)