Huawei_Technology
/
MindSpore-AKG

 
			
							# Copyright 2020-2021 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License 
import numpy as np
from tests.common.gen_random import random_gaussian
from akg.utils import kernel_exec as utils
from akg.utils.result_analysis import gpu_profiling
from akg.utils.format_transform import to_tvm_nd_array
from akg.ops.math_gpu.equal import equal

def gen_data(shapes, dtype):
    support_list = {"float16": np.float16, "float32": np.float32}
    inputs = []
    for i in range(len(shapes)):
        shape = shapes[i]
        one_input = random_gaussian(shape, miu=1, sigma=0.1).astype(support_list[dtype])
        inputs.append(one_input)

    if len(inputs) != 2:
        raise RuntimeError("inputs num should be 2")
    expect = np.equal(inputs[0], inputs[1])
    output = np.full(expect.shape, 0, bool)
    return inputs, output, expect


def test_ms_equal(shapes, dtype, poly_sch=False):
    if poly_sch:
        mod = utils.op_build_test(equal, shapes, [dtype, dtype], kernel_name="equal", attrs={"target": "cuda"})
        
    inputs1, output1, expect1 = gen_data(shapes, dtype)
    output1 = utils.mod_launch(mod, (*inputs1, output1), expect=expect1)

    if shapes[0] == shapes[1]:
        inputs2 = []
        inputs2.append(inputs1[0])
        inputs2.append(inputs1[0])
        expect2 = np.equal(inputs2[0], inputs2[1])
        output2 = np.full(expect2.shape, 0, bool)
        output2 = utils.mod_launch(mod, (*inputs2, output2), expect=expect1)

        res = np.allclose(output1, expect1, rtol=5e-03, atol=1.e-8) and np.allclose(output2, expect2, rtol=5e-03, atol=1.e-8)
        print("Test {}".format("Pass" if res else "Fail"))
        if not res:
            print("Error cuda:========================")
            print(mod.imported_modules[0].get_source())
            raise AssertionError("Test fail")

        inputs1 = to_tvm_nd_array(inputs1)
        inputs2 = to_tvm_nd_array(inputs2)
        expect1 = to_tvm_nd_array(expect1)
        expect2 = to_tvm_nd_array(expect2)
        gpu_profiling(mod, *inputs1, expect1, *inputs2, expect2, 400)
    else:
        res = np.allclose(output1, expect1, rtol=5e-03, atol=1.e-8)
        print("Test {}".format("Pass" if res else "Fail"))
        if not res:
            print("Error cuda:========================")
            print(mod.imported_modules[0].get_source())
            raise AssertionError("Test fail")
        
        inputs1 = to_tvm_nd_array(inputs1)
        expect1 = to_tvm_nd_array(expect1)
        gpu_profiling(mod, *inputs1, expect1, 400)