import torch import torch.nn as nn import torch.nn.functional as F from .gem import GeM def adaptive_avgmax_pool3d(x, output_size=1): x_avg = F.adaptive_avg_pool3d(x, output_size) x_max = F.adaptive_max_pool3d(x, output_size) return 0.5 * (x_avg + x_max) def adaptive_catavgmax_pool3d(x, output_size=1): x_avg = F.adaptive_avg_pool3d(x, output_size) x_max = F.adaptive_max_pool3d(x, output_size) return torch.cat((x_avg, x_max), 1) def select_adaptive_pool3d(x, pool_type='avg', output_size=1): """Selectable global pooling function with dynamic input kernel size """ if pool_type == 'avg': x = F.adaptive_avg_pool3d(x, output_size) elif pool_type == 'avgmax': x = adaptive_avgmax_pool3d(x, output_size) elif pool_type == 'catavgmax': x = adaptive_catavgmax_pool3d(x, output_size) elif pool_type == 'max': x = F.adaptive_max_pool3d(x, output_size) else: assert False, 'Invalid pool type: %s' % pool_type return x class FastAdaptiveAvgPool3d(nn.Module): def __init__(self, flatten=False): super(FastAdaptiveAvgPool3d, self).__init__() self.flatten = flatten def forward(self, x): return x.mean((2,3,4), keepdim=not self.flatten) class AdaptiveAvgMaxPool3d(nn.Module): def __init__(self, output_size=1): super(AdaptiveAvgMaxPool3d, self).__init__() self.output_size = output_size def forward(self, x): return adaptive_avgmax_pool3d(x, self.output_size) class AdaptiveCatAvgMaxPool3d(nn.Module): def __init__(self, output_size=1): super(AdaptiveCatAvgMaxPool3d, self).__init__() self.output_size = output_size def forward(self, x): return adaptive_catavgmax_pool3d(x, self.output_size) class SelectAdaptivePool3d(nn.Module): """Selectable global pooling layer with dynamic input kernel size """ def __init__(self, output_size=1, pool_type='fast', flatten=False): super(SelectAdaptivePool3d, self).__init__() self.pool_type = pool_type or '' # convert other falsy values to empty string for consistent TS typing self.flatten = nn.Flatten(1) if flatten else nn.Identity() if pool_type == '': self.pool = nn.Identity() # pass through elif pool_type == 'fast': assert output_size == 1 self.pool = FastAdaptiveAvgPool3d(flatten) self.flatten = nn.Identity() elif pool_type == 'avg': self.pool = nn.AdaptiveAvgPool3d(output_size) elif pool_type == 'avgmax': self.pool = AdaptiveAvgMaxPool3d(output_size) elif pool_type == 'catavgmax': self.pool = AdaptiveCatAvgMaxPool3d(output_size) elif pool_type == 'max': self.pool = nn.AdaptiveMaxPool3d(output_size) else: assert False, 'Invalid pool type: %s' % pool_type def is_identity(self): return not self.pool_type def forward(self, x): x = self.pool(x) x = self.flatten(x) return x def __repr__(self): return self.__class__.__name__ + ' (' \ + 'pool_type=' + self.pool_type \ + ', flatten=' + str(self.flatten) + ')' def create_pool3d_layer(name, **kwargs): assert name in ["avg", "max", "fast", "avgmax", "catavgmax", "gem"] if name != "gem": pool1d_layer = SelectAdaptivePool3d(pool_type=name, flatten=True) elif name == "gem": pool1d_layer = GeM(dim=3, **kwargs) return pool1d_layer