henry000 committed on
Commit
15f0a98
·
1 Parent(s): 64acfd1

🔨 [Update] dataloader with reversible padding size

Browse files
yolo/tools/data_augmentation.py CHANGED
@@ -17,12 +17,12 @@ class AugmentationComposer:
17
  if hasattr(transform, "set_parent"):
18
  transform.set_parent(self)
19
 
20
- def __call__(self, image, boxes):
21
  for transform in self.transforms:
22
  image, boxes = transform(image, boxes)
23
- image, boxes = self.pad_resize(image, boxes)
24
  image = TF.to_tensor(image)
25
- return image, boxes
26
 
27
 
28
  # TODO: RandomCrop, Resize, ... etc.
@@ -36,7 +36,7 @@ class PadAndResize:
36
  def __call__(self, image, boxes):
37
  original_size = max(image.size)
38
  scale = self.image_size / original_size
39
- square_img = Image.new("RGB", (original_size, original_size), (255, 255, 255))
40
  left = (original_size - image.width) // 2
41
  top = (original_size - image.height) // 2
42
  square_img.paste(image, (left, top))
@@ -48,7 +48,8 @@ class PadAndResize:
48
  boxes[:, 3] = (boxes[:, 3] * image.width + left) / self.image_size * scale
49
  boxes[:, 4] = (boxes[:, 4] * image.height + top) / self.image_size * scale
50
 
51
- return resized_img, boxes
 
52
 
53
 
54
  class HorizontalFlip:
 
17
  if hasattr(transform, "set_parent"):
18
  transform.set_parent(self)
19
 
20
+ def __call__(self, image, boxes=torch.zeros(0, 5)):
21
  for transform in self.transforms:
22
  image, boxes = transform(image, boxes)
23
+ image, boxes, rev_tensor = self.pad_resize(image, boxes)
24
  image = TF.to_tensor(image)
25
+ return image, boxes, rev_tensor
26
 
27
 
28
  # TODO: RandomCrop, Resize, ... etc.
 
36
  def __call__(self, image, boxes):
37
  original_size = max(image.size)
38
  scale = self.image_size / original_size
39
+ square_img = Image.new("RGB", (original_size, original_size), (128, 128, 128))
40
  left = (original_size - image.width) // 2
41
  top = (original_size - image.height) // 2
42
  square_img.paste(image, (left, top))
 
48
  boxes[:, 3] = (boxes[:, 3] * image.width + left) / self.image_size * scale
49
  boxes[:, 4] = (boxes[:, 4] * image.height + top) / self.image_size * scale
50
 
51
+ rev_tensor = torch.tensor([scale, left, top, left, top])
52
+ return resized_img, boxes, rev_tensor
53
 
54
 
55
  class HorizontalFlip:
yolo/tools/data_loader.py CHANGED
@@ -149,7 +149,7 @@ class YoloDataset(Dataset):
149
 
150
  def __getitem__(self, idx) -> Union[Image.Image, torch.Tensor]:
151
  img, bboxes = self.get_data(idx)
152
- img, bboxes = self.transform(img, bboxes)
153
  return img, bboxes
154
 
155
  def __len__(self) -> int:
@@ -261,7 +261,7 @@ class StreamDataLoader:
261
  if isinstance(frame, np.ndarray):
262
  frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
263
  frame = Image.fromarray(frame)
264
- frame, _ = self.transform(frame, torch.zeros(0, 5))
265
  frame = frame[None]
266
  if not self.is_stream:
267
  self.queue.put(frame)
 
149
 
150
  def __getitem__(self, idx) -> Union[Image.Image, torch.Tensor]:
151
  img, bboxes = self.get_data(idx)
152
+ img, bboxes, _ = self.transform(img, bboxes)
153
  return img, bboxes
154
 
155
  def __len__(self) -> int:
 
261
  if isinstance(frame, np.ndarray):
262
  frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
263
  frame = Image.fromarray(frame)
264
+ frame, _, rev_tensor = self.transform(frame, torch.zeros(0, 5))
265
  frame = frame[None]
266
  if not self.is_stream:
267
  self.queue.put(frame)