Huawei_Technology
/
MindSpore-AKG

 
			
							# Copyright 2019 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import numpy as np
import itertools
from akg.utils import kernel_exec as utils
from akg.ops.nn import maxpool_grad
from akg.utils.dsl_create import cal_pad_shapes_by_strategy
from tests.common.tensorio import compare_tensor
from tests.common.base import get_rtol_atol
from tests.common.gen_random import random_gaussian


def maxpool_benchmark(input, kernel, stride, pad):
    sh, sw = stride
    [ph_h, ph_t, pw_h, pw_t], [out_size_h, out_size_w] = \
        cal_pad_shapes_by_strategy(input.shape, kernel, stride, pad)
    N, C1, H, W, C0 = input.shape
    KH, KW = kernel

    out_shape = (N, C1, out_size_h, out_size_w, C0)

    out = np.zeros(out_shape)

    inputpad = np.full((N, C1, H + ph_h + ph_t, W + pw_h + pw_t, C0),
                       np.finfo(input.dtype).min, dtype=input.dtype)
    inputpad[:, :, ph_h: ph_h + H, pw_h: pw_h + W, :] = input

    for i in range(out_size_h):
        for j in range(out_size_w):
            out[:, :, i, j, :] = np.max(inputpad[:, :,
                                                 i * sh:i * sh + KH, j * sw:j * sw + KW, :], axis=(2, 3))
    return out


# behaviour
#   - 0: return dy only for the first maximum within one kernel
#   - 1: return dy for all maximums within one kernel
def benchmark(x, y, dy, kernel, stride, pad, behaviour=0):

    kernel_h, kernel_w = kernel
    stride_h, stride_w = stride
    [pad_h_head, pad_h_tail, pad_w_head, pad_w_tail], _ = cal_pad_shapes_by_strategy(x.shape, kernel, stride, pad)
    N, C1, H, W, C0 = x.shape
    pad_shape = (N, C1, H + pad_h_tail + pad_h_head, W + pad_w_tail + pad_w_head, C0)

    padx = np.full(pad_shape, 0, dtype=x.dtype)
    padx[:, :, pad_h_head:(pad_h_head + H), pad_w_head:(pad_w_head + W), :] = x

    dx = np.zeros(padx.shape, dtype=x.dtype)
    _, _, yH, yW, _ = y.shape

    if behaviour == 0:
        for n in range(N):
            for c1 in range(C1):
                for yh in range(yH):
                    for yw in range(yW):
                        for c0 in range(C0):
                            out_maxpool1 = y[n, c1, yh, yw, c0]
                            head_maxpool1 = dy[n, c1, yh, yw, c0]
                            for kh,kw in itertools.product(range(kernel_h), range(kernel_w)):
                                    if padx[n, c1, yh*stride_h + kh, yw*stride_w + kw, c0] == out_maxpool1:
                                        dx[n, c1, yh*stride_h + kh, yw*stride_w + kw, c0] += head_maxpool1
                                        break
    elif behaviour == 1:
        for n in range(N):
            for c1 in range(C1):
                for yh in range(yH):
                    for yw in range(yW):
                        for c0 in range(C0):
                            out_maxpool1 = y[n, c1, yh, yw, c0]
                            head_maxpool1 = dy[n, c1, yh, yw, c0]
                            for kh in range(kernel_h):
                                for kw in range(kernel_w):
                                    if padx[n, c1, yh*stride_h + kh, yw*stride_w + kw, c0] == out_maxpool1:
                                        dx[n, c1, yh*stride_h + kh, yw*stride_w + kw, c0] += head_maxpool1

    return dx[:, :, pad_h_head:(pad_h_head + H), pad_w_head:(pad_w_head + W), :]


def maxpool_grad_run(shape, kernel, stride, pad, dtype, attrs):
    # Create op
    _, [yh, yw] = cal_pad_shapes_by_strategy(shape, kernel, stride, pad)
    y_shape = (shape[0], shape[1], yh, yw, shape[4])

    if 'tuning' in attrs.keys():
        t = attrs.get("tuning", False)
        kernel_name = attrs.get("kernel_name", False)
        mod = utils.op_build_test(maxpool_grad.maxpool_grad,
                                  [shape, y_shape, y_shape], [dtype, dtype, dtype],
                                  op_attrs=[kernel, stride, pad],
                                  kernel_name=kernel_name, attrs=attrs, dump_code=True, tuning=t)
        if t:
            dy, expect, output, x, y = \
                gen_data(dtype, kernel, pad, shape, stride, y_shape)
            return mod, expect, (x, y, dy, output)
        else:
            return mod
    else:
        mod = utils.op_build_test(maxpool_grad.maxpool_grad,
                                  [shape, y_shape, y_shape], [dtype, dtype, dtype],
                                  op_attrs=[kernel, stride, pad],
                                  kernel_name='maxpool_grad', attrs=attrs, dump_code=True)
        dy, expect, output, x, y = \
            gen_data(dtype, kernel, pad, shape, stride, y_shape)
        output = utils.mod_launch(mod, (x, y, dy, output), expect=expect)
        rtol, atol = get_rtol_atol("maxpool_grad", dtype)
        return (x, y, dy), output, expect, \
            compare_tensor(output, expect, rtol=rtol, atol=atol, equal_nan=True)


def gen_data(dtype, kernel, pad, shape, stride, y_shape):
    # Generate data for testing the op
    x = random_gaussian(shape, miu=1, sigma=0.1).astype(dtype)
    y = maxpool_benchmark(x, kernel, stride, pad)
    y = y.astype(dtype)
    assert y.shape == y_shape, "y shape wrong"
    dy = random_gaussian(y_shape, miu=1, sigma=0.1).astype(dtype)
    expect = benchmark(x, y, dy, kernel, stride, pad)
    output_shape = shape
    # output tensor must be initialized to zero
    output = np.full(output_shape, 0, dtype)
    return dy, expect, output, x, y