Source code for coremltools.converters.mil.mil.ops.defs.iOS15.pool

#  Copyright (c) 2020, Apple Inc. All rights reserved.
#
#  Use of this source code is governed by a BSD-3-clause license that can be
#  found in the LICENSE.txt file or at https://opensource.org/licenses/BSD-3-Clause

from coremltools.converters.mil.mil import Operation, types
from coremltools.converters.mil.mil.block import curr_opset_version
from coremltools.converters.mil.mil.input_type import (DefaultInputs,
                                                       InputSpec,
                                                       TensorInputType)
from coremltools.converters.mil.mil.ops.defs._op_reqs import register_op
from coremltools.converters.mil.mil.ops.defs._utils import \
    spatial_dimensions_out_shape
from coremltools.converters.mil.mil.ops.defs.iOS15 import _IOS15_TARGET


class Pooling(Operation):
    """
    Pooling Op Superclass
    """
    input_spec = InputSpec(
        x=TensorInputType(type_domain="T"),
        kernel_sizes=TensorInputType(const=True, type_domain=types.int32),
        strides=TensorInputType(const=True, optional=True, type_domain=types.int32),
        pad_type=TensorInputType(const=True, type_domain=types.str),
        pad=TensorInputType(const=True, optional=True, type_domain=types.int32),
        ceil_mode=TensorInputType(const=True, optional=True, type_domain=types.bool),
    )

    type_domains = {
        "T": (types.fp16, types.fp32),
    }

    def default_inputs(self):
        num_spatial_dims = self.x.rank - 2
        return DefaultInputs(
            strides=[1] * num_spatial_dims,
            pad=[0] * 2 * num_spatial_dims,
            ceil_mode=False,
        )

    def type_inference(self):
        ksize = self.kernel_sizes.val
        x_shape = self.x.shape
        D_in_rank = len(x_shape) - 2

        strides = [1] * D_in_rank if self.strides is None else self.strides.val
        pad_type = "valid" if self.pad_type is None else self.pad_type.val.lower()
        if pad_type not in ["valid", "same", "custom", "same_lower"]:
            raise ValueError("Unrecognized value of pad_type : {}".format(pad_type))
        pad = None if self.pad is None else self.pad.val
        D_in = x_shape[2:]  # spatial dimensions

        if self.ceil_mode.val:
            if D_in_rank > 2:
                raise ValueError("pool: ceil_mode only supported for 1D or 2D pool")
            if pad_type == "same":
                raise ValueError("ceil_mode must be False when pad_type==same")
            if pad is not None:
                for i in range(D_in_rank):
                    if pad[2 * i] != pad[2 * i + 1]:
                        raise ValueError("Padding must be symmetric if ceil_mode is True")

        # The same_lower padding is not supported in iOS15
        if curr_opset_version() == _IOS15_TARGET and pad_type == "same_lower":
            msg = "The iOS15 version of pooling ops does not support pad_type = `same_lower`"
            raise ValueError(msg)

        D_out_shape = spatial_dimensions_out_shape(
            pad_type=pad_type,
            input_shape=D_in,
            kernel_shape=ksize,
            strides=strides,
            custom_pad=pad,
            ceil_mode=self.ceil_mode.val,
        )
        ret_shape = list(x_shape[:2]) + D_out_shape
        return types.tensor(self.x.dtype, tuple(ret_shape))
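

# Illustrative sketch (not part of the op definitions in this module): the
# output-shape arithmetic that type_inference delegates to
# spatial_dimensions_out_shape, written out for the floor/ceil formulas
# documented on avg_pool below. The helper name `_example_pool_out_dim` is
# hypothetical and only used for illustration here.
def _example_pool_out_dim(d_in, kernel, stride, pad_before=0, pad_after=0, ceil_mode=False):
    import math

    padded = d_in + pad_before + pad_after
    if ceil_mode:
        d_out = int(math.ceil((padded - kernel) / stride)) + 1
        # Drop the last window if it would start entirely inside the padding,
        # matching the correction described in the avg_pool docstring.
        if (d_out - 1) * stride >= d_in + pad_before and (pad_before + pad_after) > 0:
            d_out -= 1
        return d_out
    return int(math.floor((padded - kernel) / stride)) + 1

# For example, a 16-wide spatial dim, 3-wide kernel, stride 2, no padding:
# _example_pool_out_dim(16, 3, 2) == floor((16 - 3) / 2) + 1 == 7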


@register_op
class avg_pool(Pooling):
    """
    Perform average pooling. Supports 1-D, 2-D, and 3-D pooling (1, 2, or 3
    spatial dimensions).

    Parameters
    ----------
    x: tensor<[n,C_in,\*D_in], T> (Required)
        * ``3 <= rank <= 5``.
        * ``D_in`` are spatial dimensions, ``1 <= len(D_in) <= 3``.
        * ``C_in`` is the number of input channels or depth dimensions.
        * ``n`` is the batch dimension.

    kernel_sizes: const tensor<[K], T> (Required)
        * The size of the window for each spatial dimension ``D_in`` of the
          input tensor.
        * ``K == len(D_in)``.

    strides: const tensor<[S], i32> (Optional, default to all 1s)
        * Stride along each of the spatial dimensions.
        * ``S == len(D_in)``.

    pad_type: const str (Required)
        Must be one of ``valid``, ``same``, ``custom``, or ``same_lower``.

        * ``valid``: No padding. This is equivalent to custom padding with
          ``pad[i] = 0, for all i``.
        * ``same``: This is equivalent to custom padding with
          ``pad[2*i] + pad[2*i+1] = kernel_sizes[i]``.
        * ``custom``: Specify custom padding in the parameter ``pad``.
        * ``same_lower``: Similar to ``same``, but the padding places extra
          rows/cols on the top/left if the padding amount is odd.

    pad: const<[P], i32> (Optional, default to all 0s)
        * ``pad`` represents the number of elements to pad before and after
          each dimension: ``pad[2*i], pad[2*i+1]`` are the pad sizes before
          and after spatial dimension ``i``.
        * ``P = 2 * len(D_in)``.
        * ``pad`` should be specified if and only if ``pad_type == custom``.

    exclude_padding_from_average: const tensor<[], bool> (Optional, default to False)
        * If ``True``, padded values (0s) are excluded from the denominator
          count when computing the average over the kernel window.

    ceil_mode: const<bool> (Optional, default to False)
        * Same as PyTorch's ``ceil`` mode.
        * ``ceil`` is used instead of ``floor`` in calculating the output size.
        * Only applicable when ``pad_type`` is ``valid`` or ``custom``.
        * When ``ceil_mode`` is ``True``, padding must be symmetric; that is,
          if specified, ``pad[2*i] == pad[2*i+1]`` must hold.

    Returns
    -------
    tensor<[n, C_out,\*D_out], T>
        * Same rank as ``x``.
        * ``C_out`` is the number of output channels or depth dimensions.
        * When ``ceil_mode = False``:
            * ``D_out[i] = floor[(D_in[i] + pad[2*i] + pad[2*i+1] - kernel_sizes[i]) / strides[i]] + 1, for i = 0, ..., len(D_in) - 1``,
              which is mathematically the same as (when all parameters involved are integers):
            * ``D_out[i] = ceil[(D_in[i] + pad[2*i] + pad[2*i+1] - kernel_sizes[i] - 1) / strides[i]], for i = 0, ..., len(D_in) - 1``.
            * ``*D_out`` is all ones if ``global_pooling`` is ``true``.
        * When ``ceil_mode = True``:
            * ``D_out[i] = ceil[(D_in[i] + pad[2*i] + pad[2*i+1] - kernel_sizes[i]) / strides[i]] + 1, for i = 0, ..., len(D_in) - 1``.
            * If ``(D_out[i] - 1) * strides[i] >= D_in[i] + pad[2*i]`` and ``(pad[2*i] + pad[2*i+1] > 0)``,
              then ``D_out[i] = D_out[i] - 1``.
            * The first equation is the same as:
              ``D_out[i] = floor[(D_in[i] + pad[2*i] + pad[2*i+1] - kernel_sizes[i] + strides[i] - 1) / strides[i]] + 1, for i = 0, ..., len(D_in) - 1``.

    Attributes
    ----------
    T: fp16, fp32

    See Also
    --------
    l2_pool, max_pool
    """

    input_spec = (
        InputSpec(
            exclude_padding_from_average=TensorInputType(
                const=True, optional=True, type_domain=types.bool
            )
        )
        + Pooling.input_spec
    )

    def default_inputs(self):
        return super().default_inputs() + DefaultInputs(
            exclude_padding_from_average=False,
        )
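

# A minimal usage sketch, not part of this module: how avg_pool is typically
# invoked when building a MIL program, assuming the public Builder API
# (coremltools.converters.mil.Builder) exposes this op as `mb.avg_pool`. The
# helper name `_example_build_avg_pool` is hypothetical.
def _example_build_avg_pool():
    from coremltools.converters.mil import Builder as mb

    @mb.program(input_specs=[mb.TensorSpec(shape=(1, 3, 16, 16))])
    def prog(x):
        # 2x2 window, stride 2, valid padding -> 8x8 spatial output
        return mb.avg_pool(x=x, kernel_sizes=[2, 2], strides=[2, 2], pad_type="valid")

    # `prog` is the traced MIL program containing the avg_pool op.
    return prog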


@register_op
class l2_pool(Pooling):
    """
    Perform L2 pooling. Supports 1-D and 2-D pooling.

    Parameters
    ----------
    x: tensor<[n,C_in,*D_in], T> (Required)
        * Only supports 1-D and 2-D pooling.
        * See :py:class:`avg_pool`.

    kernel_sizes: const tensor<[K], T> (Required)
        * See :py:class:`avg_pool`.

    strides: const tensor<[S], i32> (Optional, default to all 1s)
        * See :py:class:`avg_pool`.

    pad_type: const str (Required)
        * See :py:class:`avg_pool`.

    pad: const<[P], i32> (Optional, default to all 0s)
        * See :py:class:`avg_pool`.

    Returns
    -------
    tensor<[n, C_out,*D_out], T>
        * See :py:class:`avg_pool`.

    Attributes
    ----------
    T: fp16, fp32

    See Also
    --------
    avg_pool, max_pool
    """

    def type_inference(self):
        if self.x.rank - 2 > 2:
            msg = "l2_pool only supports 1-D or 2-D pooling. Got {} spatial dimensions".format(
                self.x.rank - 2
            )
            raise ValueError(msg)
        return super().type_inference()


@register_op
class max_pool(Pooling):
    """
    Perform max pooling. Supports 1-D, 2-D, and 3-D pooling.

    Parameters
    ----------
    x: tensor<[n,C_in,*D_in], T> (Required)
        * See :py:class:`avg_pool`.

    kernel_sizes: const tensor<[K], T> (Required)
        * See :py:class:`avg_pool`.

    strides: const tensor<[S], i32> (Optional, default to all 1s)
        * See :py:class:`avg_pool`.

    pad_type: const str (Required)
        * See :py:class:`avg_pool`.

    pad: const<[P], i32> (Optional, default to all 0s)
        * See :py:class:`avg_pool`.

    ceil_mode: const<bool> (Optional, default to False)
        * See :py:class:`avg_pool`.

    Returns
    -------
    tensor<[n, C_out,*D_out], T>
        * See :py:class:`avg_pool`.

    Attributes
    ----------
    T: fp16, fp32

    See Also
    --------
    avg_pool, l2_pool
    """

    pass
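

# Illustrative sketch, not part of this module: max_pool with custom symmetric
# padding and ceil_mode=True (the symmetry requirement enforced by
# Pooling.type_inference above). Assumes the public Builder API exposes this op
# as `mb.max_pool`; the helper name `_example_build_max_pool_ceil_mode` is
# hypothetical.
def _example_build_max_pool_ceil_mode():
    from coremltools.converters.mil import Builder as mb

    @mb.program(input_specs=[mb.TensorSpec(shape=(1, 3, 15, 15))])
    def prog(x):
        # pad is (before, after) per spatial dim; pad[2*i] == pad[2*i+1]
        # keeps ceil_mode valid. Output dims: ceil((15 + 2 - 3) / 2) + 1 = 8.
        return mb.max_pool(
            x=x,
            kernel_sizes=[3, 3],
            strides=[2, 2],
            pad_type="custom",
            pad=[1, 1, 1, 1],
            ceil_mode=True,
        )

    return prog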