Spaces:

henry000
/

YOLO

Running

App Files Files Community

henry000 committed on Jul 6, 2024

Commit

d5a73bd

1 Parent(s): d13852b

🔨 [Add] Anc2Box converter, for YOLOv7's output

Browse files

Files changed (5) hide show

yolo/__init__.py +2 -1
yolo/config/config.py +3 -1
yolo/model/yolo.py +0 -1
yolo/utils/bounding_box_utils.py +61 -6
yolo/utils/model_utils.py +6 -4

yolo/__init__.py CHANGED Viewed

@@ -3,7 +3,7 @@ from yolo.model.yolo import create_model
 from yolo.tools.data_loader import AugmentationComposer, create_dataloader
 from yolo.tools.drawer import draw_bboxes
 from yolo.tools.solver import ModelTester, ModelTrainer, ModelValidator
-from yolo.utils.bounding_box_utils import Vec2Box, bbox_nms
 from yolo.utils.deploy_utils import FastModelLoader
 from yolo.utils.logging_utils import custom_logger
 from yolo.utils.model_utils import PostProccess
@@ -16,6 +16,7 @@ all = [
     "validate_log_directory",
     "draw_bboxes",
     "Vec2Box",
     "bbox_nms",
     "AugmentationComposer",
     "create_dataloader",

 from yolo.tools.data_loader import AugmentationComposer, create_dataloader
 from yolo.tools.drawer import draw_bboxes
 from yolo.tools.solver import ModelTester, ModelTrainer, ModelValidator
+from yolo.utils.bounding_box_utils import Anc2Box, Vec2Box, bbox_nms
 from yolo.utils.deploy_utils import FastModelLoader
 from yolo.utils.logging_utils import custom_logger
 from yolo.utils.model_utils import PostProccess
     "validate_log_directory",
     "draw_bboxes",
     "Vec2Box",
+    "Anc2Box",
     "bbox_nms",
     "AugmentationComposer",
     "create_dataloader",

yolo/config/config.py CHANGED Viewed

@@ -6,8 +6,10 @@ from torch import nn
 @dataclass
 class AnchorConfig:
-    reg_max: int
     strides: List[int]
 @dataclass

 @dataclass
 class AnchorConfig:
+    # Anchor/stride settings read by the model and by the box converters.
+    # Iterated by Anc2Box to build one coordinate grid per entry (one stride per prediction head).
     strides: List[int]
+    # YOLO.__init__ reads this via getattr(..., "reg_max", 16).
+    # NOTE(review): presumably only meaningful for the anchor-free (Vec2Box) head - confirm.
+    reg_max: Optional[int]
+    # NOTE(review): not read by the code visible in this commit; Anc2Box derives the
+    # per-head anchor count from `anchor` instead - confirm whether this field is still needed.
+    anchor_num: Optional[int]
+    # One inner list per prediction head; Anc2Box reshapes each inner list into pairs
+    # and multiplies them into box components 2:4 (presumably width/height in pixels - confirm).
+    anchor: List[List[int]]
 @dataclass

yolo/model/yolo.py CHANGED Viewed

@@ -26,7 +26,6 @@ class YOLO(nn.Module):
         self.layer_map = get_layer_map()  # Get the map Dict[str: Module]
         self.model: List[YOLOLayer] = nn.ModuleList()
         self.reg_max = getattr(model_cfg.anchor, "reg_max", 16)
-        self.strides = getattr(model_cfg.anchor, "strides", None)
         self.build_model(model_cfg.model)
     def build_model(self, model_arch: Dict[str, List[Dict[str, Dict[str, Dict]]]]):

         self.layer_map = get_layer_map()  # Get the map Dict[str: Module]
         self.model: List[YOLOLayer] = nn.ModuleList()
         self.reg_max = getattr(model_cfg.anchor, "reg_max", 16)
         self.build_model(model_cfg.model)
     def build_model(self, model_arch: Dict[str, List[Dict[str, Dict[str, Dict]]]]):

yolo/utils/bounding_box_utils.py CHANGED Viewed

@@ -1,14 +1,14 @@
 import math
-from typing import Dict, List, Tuple
 import torch
 import torch.nn.functional as F
 from einops import rearrange
 from loguru import logger
-from torch import Tensor, arange
 from torchvision.ops import batched_nms
-from yolo.config.config import MatcherConfig, ModelConfig, NMSConfig
 from yolo.model.yolo import YOLO
@@ -308,9 +308,64 @@ class Vec2Box:
         return preds_cls, preds_anc, preds_box
-def bbox_nms(cls_dist: Tensor, bbox: Tensor, nms_cfg: NMSConfig):
-    # TODO change function to class or set 80 to class_num instead of a number
-    cls_dist = cls_dist.sigmoid()
     # filter class by confidence
     cls_val, cls_idx = cls_dist.max(dim=-1, keepdim=True)

 import math
+from typing import Dict, List, Optional, Tuple
 import torch
 import torch.nn.functional as F
 from einops import rearrange
 from loguru import logger
+from torch import Tensor, arange, tensor
 from torchvision.ops import batched_nms
+from yolo.config.config import AnchorConfig, MatcherConfig, ModelConfig, NMSConfig
 from yolo.model.yolo import YOLO
         return preds_cls, preds_anc, preds_box
+class Anc2Box:
+    def __init__(self, model: YOLO, anchor_cfg: AnchorConfig, image_size, device):
+        self.device = device
+        if hasattr(anchor_cfg, "strides"):
+            logger.info(f"🈶 Found stride of model {anchor_cfg.strides}")
+            self.strides = anchor_cfg.strides
+        else:
+            logger.info("🧸 Found no stride of model, performed a dummy test for auto-anchor size")
+            self.strides = self.create_auto_anchor(model, image_size)
+        self.generate_anchors(image_size)
+        self.anchor_grid = [anchor_grid.to(device) for anchor_grid in self.anchor_grid]
+        self.head_num = len(anchor_cfg.anchor)
+        self.anchor_scale = tensor(anchor_cfg.anchor, device=device).view(self.head_num, 1, -1, 1, 1, 2)
+        self.anchor_num = self.anchor_scale.size(2)
+        self.class_num = model.num_classes
+    def create_auto_anchor(self, model: YOLO, image_size):
+        dummy_input = torch.zeros(1, 3, *image_size).to(self.device)
+        dummy_output = model(dummy_input)
+        strides = []
+        for predict_head in dummy_output:
+            _, _, *anchor_num = predict_head.shape
+            strides.append(image_size[1] // anchor_num[1])
+        return strides
+    def generate_anchors(self, image_size: List[int]):
+        self.anchor_grid = []
+        for stride in self.strides:
+            W, H = image_size[0] // stride, image_size[1] // stride
+            anchor_h, anchor_w = torch.meshgrid([torch.arange(H), torch.arange(W)], indexing="ij")
+            self.anchor_grid.append(torch.stack((anchor_w, anchor_h), 2).view((1, 1, H, W, 2)).float())
+    def __call__(self, predicts: List[Tensor]):
+        preds_box, preds_cls, preds_cnf = [], [], []
+        for layer_idx, predict in enumerate(predicts):
+            predict = rearrange(predict, "B (L C) h w -> B L h w C", L=self.anchor_num)
+            pred_box, pred_cnf, pred_cls = predict.split((4, 1, self.class_num), dim=-1)
+            pred_box = pred_box.sigmoid()
+            pred_box[..., 0:2] = (pred_box[..., 0:2] * 2.0 - 0.5 + self.anchor_grid[layer_idx]) * self.strides[
+                layer_idx
+            ]
+            pred_box[..., 2:4] = (pred_box[..., 2:4] * 2) ** 2 * self.anchor_scale[layer_idx]
+            preds_box.append(rearrange(pred_box, "B L h w A -> B (L h w) A"))
+            preds_cls.append(rearrange(pred_cls, "B L h w C -> B (L h w) C"))
+            preds_cnf.append(rearrange(pred_cnf, "B L h w C -> B (L h w) C"))
+        preds_box = torch.concat(preds_box, dim=1)
+        preds_cls = torch.concat(preds_cls, dim=1)
+        preds_cnf = torch.concat(preds_cnf, dim=1)
+        preds_box = transform_bbox(preds_box, "xycwh -> xyxy")
+        return preds_cls, None, preds_box, preds_cnf.sigmoid()
+def bbox_nms(cls_dist: Tensor, bbox: Tensor, nms_cfg: NMSConfig, confidence: Optional[Tensor]):
+    cls_dist = cls_dist.sigmoid() * (1 if confidence is None else confidence)
     # filter class by confidence
     cls_val, cls_idx = cls_dist.max(dim=-1, keepdim=True)

yolo/utils/model_utils.py CHANGED Viewed

@@ -103,15 +103,17 @@ class PostProccess:
     scale back the prediction and do nms for pred_bbox
     """
-    def __init__(self, vec2box, nms_cfg: NMSConfig) -> None:
-        self.vec2box = vec2box
         self.nms = nms_cfg
     def __call__(self, predict, rev_tensor: Optional[Tensor] = None):
-        pred_class, _, pred_bbox = self.vec2box(predict["Main"])
         if rev_tensor is not None:
             pred_bbox = (pred_bbox - rev_tensor[:, None, 1:]) / rev_tensor[:, 0:1, None]
-        pred_bbox = bbox_nms(pred_class, pred_bbox, self.nms)
         return pred_bbox

     scale back the prediction and do nms for pred_bbox
     """
+    def __init__(self, converter, nms_cfg: NMSConfig) -> None:
+        self.converter = converter
         self.nms = nms_cfg
     def __call__(self, predict, rev_tensor: Optional[Tensor] = None):
+        prediction = self.converter(predict["Main"])
+        pred_class, _, pred_bbox = prediction[:3]
+        pred_conf = prediction[3] if len(prediction) == 4 else None
         if rev_tensor is not None:
             pred_bbox = (pred_bbox - rev_tensor[:, None, 1:]) / rev_tensor[:, 0:1, None]
+        pred_bbox = bbox_nms(pred_class, pred_bbox, self.nms, pred_conf)
         return pred_bbox