Spaces:
Running
on
Zero
Running
on
Zero
Martín Santillán Cooper
committed on
Commit
•
a50a656
1
Parent(s):
fb6a6b8
fix: gpu is not a valid device
Browse files
model.py
CHANGED
@@ -21,7 +21,7 @@ inference_engine = os.getenv("INFERENCE_ENGINE", "VLLM")
|
|
21 |
logger.debug(f"Inference engine is: '{inference_engine}'")
|
22 |
|
23 |
if inference_engine == "VLLM":
|
24 |
-
device = torch.device("gpu")
|
25 |
|
26 |
model_path = os.getenv("MODEL_PATH", "ibm-granite/granite-guardian-3.0-8b")
|
27 |
logger.debug(f"model_path is {model_path}")
|
|
|
21 |
logger.debug(f"Inference engine is: '{inference_engine}'")
|
22 |
|
23 |
if inference_engine == "VLLM":
|
24 |
+
device = torch.device("cuda")
|
25 |
|
26 |
model_path = os.getenv("MODEL_PATH", "ibm-granite/granite-guardian-3.0-8b")
|
27 |
logger.debug(f"model_path is {model_path}")
|