Source code for megengine.module.pooling

# -*- coding: utf-8 -*-
from abc import abstractmethod
from typing import Tuple, Union

from ..functional import avg_pool2d, max_pool2d
from .module import Module


class _PoolNd(Module):
    def __init__(
        self,
        kernel_size: Union[int, Tuple[int, int]],
        stride: Union[int, Tuple[int, int]] = None,
        padding: Union[int, Tuple[int, int]] = 0,
        **kwargs
    ):
        super(_PoolNd, self).__init__(**kwargs)
        self.kernel_size = kernel_size
        self.stride = stride or kernel_size
        self.padding = padding

    @abstractmethod
    def forward(self, inp):
        pass

    def _module_info_string(self) -> str:
        return "kernel_size={kernel_size}, stride={stride}, padding={padding}".format(
            **self.__dict__
        )


[docs]class MaxPool2d(_PoolNd): r"""Applies a 2D max pooling over an input. For instance, given an input of the size :`(N, C, H_{\text{in}}, W_{\text{in}})` and :attr:`kernel_size` :math:`(kH, kW)`, this layer generates the output of the size :math:`(N, C, H_{\text{out}}, W_{\text{out}})` through a process described as: .. math:: \begin{aligned} out(N_i, C_j, h, w) ={} & \max_{m=0, \ldots, kH-1} \max_{n=0, \ldots, kW-1} \text{input}(N_i, C_j, \text{stride[0]} \times h + m, \text{stride[1]} \times w + n) \end{aligned} If :attr:`padding` is non-zero, then the input is implicitly zero-padded on both sides for :attr:`padding` number of points. Args: kernel_size(Union[int, Tuple[int, int]]): the size of the window. stride(Union[int, Tuple[int, int]]): the stride of the window. Default value is ``kernel_size``. padding(Union[int, Tuple[int, int]]): implicit zero padding to be added on both sides.Default: 0. Shape: - Input: :math:`(N, C, H_{in}, W_{in})` or :math:`(C, H_{in}, W_{in})` - Output: :math:`(N, C, H_{out}, W_{out})` or :math:`(C, H_{out}, W_{out})`, where .. math:: H_{out} = \left\lfloor\frac{H_{in} + 2 * \text{padding[0]} - \text{dilation[0]} \times (\text{kernel\_size[0]} - 1) - 1}{\text{stride[0]}} + 1\right\rfloor .. math:: W_{out} = \left\lfloor\frac{W_{in} + 2 * \text{padding[1]} - \text{dilation[1]} \times (\text{kernel\_size[1]} - 1) - 1}{\text{stride[1]}} + 1\right\rfloor Returns: Return type: module. The instance of the ``MaxPool2d`` module. Examples: >>> import numpy as np >>> m = M.MaxPool2d(kernel_size=3, stride=1, padding=0) >>> inp = mge.tensor(np.arange(0, 16).astype("float32").reshape(1, 1, 4, 4)) >>> oup = m(inp) >>> oup.numpy() array([[[[10., 11.], [14., 15.]]]], dtype=float32) """ def forward(self, inp): return max_pool2d(inp, self.kernel_size, self.stride, self.padding)
[docs]class AvgPool2d(_PoolNd): r"""Applies a 2D average pooling over an input. For instance, given an input of the size :math:`(N, C, H_{\text{in}}, W_{\text{in}})` and :attr:`kernel_size` :math:`(kH, kW)`, this layer generates the output of the size :math:`(N, C, H_{\text{out}}, W_{\text{out}})` through a process described as: .. math:: out(N_i, C_j, h, w) = \frac{1}{kH * kW} \sum_{m=0}^{kH-1} \sum_{n=0}^{kW-1} input(N_i, C_j, stride[0] \times h + m, stride[1] \times w + n) If :attr:`padding` is non-zero, then the input is implicitly zero-padded on both sides for :attr:`padding` number of points. Args: kernel_size(Union[int, Tuple[int, int]]): the size of the window. stride(Union[int, Tuple[int, int]]): the stride of the window. Default value is ``kernel_size``. padding(Union[int, Tuple[int, int]]): implicit zero padding to be added on both sides.Default: 0. mode(str): whether to include the padding values while calculating the average, set to "average" will do counting. Default: "average_count_exclude_padding" Shape: - Input: :math:`(N, C, H_{in}, W_{in})` or :math:`(C, H_{in}, W_{in})`. - Output: :math:`(N, C, H_{out}, W_{out})` or :math:`(C, H_{out}, W_{out})`, where .. math:: H_{out} = \left\lfloor\frac{H_{in} + 2 \times \text{padding}[0] - \text{kernel\_size}[0]}{\text{stride}[0]} + 1\right\rfloor .. math:: W_{out} = \left\lfloor\frac{W_{in} + 2 \times \text{padding}[1] - \text{kernel\_size}[1]}{\text{stride}[1]} + 1\right\rfloor Returns: Return type: module. The instance of the ``AvgPool2d`` module. Examples: >>> import numpy as np >>> m = M.AvgPool2d(kernel_size=2, stride=2, padding=[1,0], mode="average") >>> inp = mge.tensor(np.arange(1 * 1 * 3 * 4).astype(np.float32).reshape(1, 1, 3, 4)) >>> output = m(inp) >>> output Tensor([[[[0.25 1.25] [6.5 8.5 ]]]], device=xpux:0) """ def __init__( self, kernel_size: Union[int, Tuple[int, int]], stride: Union[int, Tuple[int, int]] = None, padding: Union[int, Tuple[int, int]] = 0, mode: str = "average_count_exclude_padding", **kwargs ): super(AvgPool2d, self).__init__(kernel_size, stride, padding, **kwargs) self.mode = mode def forward(self, inp): return avg_pool2d(inp, self.kernel_size, self.stride, self.padding, self.mode) def _module_info_string(self) -> str: return "kernel_size={kernel_size}, stride={stride}, padding={padding}, mode={mode}".format( **self.__dict__ )