Spaces:

fashn-ai
/

sapiens-body-part-segmentation

Running on Zero

Dan Bochman committed on Aug 26, 2024

Commit

a76f764

unverified ·

1 Parent(s): 6db27b1

cast to cuda outside of spaces.GPU scope

Files changed (1) hide show

app.py CHANGED Viewed

@@ -12,9 +12,6 @@ from torchvision import transforms
 # ----------------- ENV ----------------- #
-if torch.cuda.get_device_properties(0).major >= 8:
-    torch.backends.cuda.matmul.allow_tf32 = True
-    torch.backends.cudnn.allow_tf32 = True
 ASSETS_DIR = os.path.join(os.path.dirname(__file__), "assets")
@@ -107,13 +104,12 @@ if not os.path.exists(model_path):
 model = torch.jit.load(model_path)
 model.eval()
 @spaces.GPU
 @torch.inference_mode()
 def run_model(input_tensor, height, width):
-    model.to("cuda")  # set the device after acquiring it with ZERO
-    input_tensor = input_tensor.to("cuda")
     output = model(input_tensor)
     output = torch.nn.functional.interpolate(output, size=(height, width), mode="bilinear", align_corners=False)
     _, preds = torch.max(output, 1)
@@ -131,7 +127,7 @@ transform_fn = transforms.Compose(
 def segment(image: Image.Image) -> Image.Image:
-    input_tensor = transform_fn(image).unsqueeze(0)
     preds = run_model(input_tensor, height=image.height, width=image.width)
     mask = preds.squeeze(0).cpu().numpy()
     mask_image = Image.fromarray(mask.astype("uint8"))

 # ----------------- ENV ----------------- #
 ASSETS_DIR = os.path.join(os.path.dirname(__file__), "assets")
 model = torch.jit.load(model_path)
 model.eval()
+model.to("cuda")
 @spaces.GPU
 @torch.inference_mode()
 def run_model(input_tensor, height, width):
     output = model(input_tensor)
     output = torch.nn.functional.interpolate(output, size=(height, width), mode="bilinear", align_corners=False)
     _, preds = torch.max(output, 1)
 def segment(image: Image.Image) -> Image.Image:
+    input_tensor = transform_fn(image).unsqueeze(0).to("cuda")
     preds = run_model(input_tensor, height=image.height, width=image.width)
     mask = preds.squeeze(0).cpu().numpy()
     mask_image = Image.fromarray(mask.astype("uint8"))