#!/usr/bin/env python3
# coding: utf-8
# Copyright 2019 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""operator dsl function: sum"""

import akg.topi
import akg.tvm
from akg.utils import format_transform as ft_util
from akg.utils import validation_check as vc_util
from akg.utils.format_transform import get_shape
from akg.ops.math.cast import cast


def get_attrs():
    """get attrs."""
    attr_map = {"enable_bisect_optimize": True}
    return attr_map


@vc_util.check_input_type(akg.tvm.tensor.Tensor, (list, tuple, int, type(None)), (bool, type(None)))
def sum_value(inputs, axis=None, keepdims=False):
    """
    Computes the sum value of a tensor along the given axes.

    Args:
        inputs (tvm.tensor.Tensor): Tensor of type float16, float32.
        axis (Union[list, tuple, int, None]): Specifies which axis or axes to reduce.
        keepdims (bool): If true, the dimension specified by axis will be one.

    Returns:
        tvm.tensor.Tensor with same type as input tensor.
    """

    # Check types
    dtype = inputs.dtype
    vc_util.ops_dtype_check(dtype, vc_util.DtypeForDavinci.ALL_FLOAT)
    axis = ft_util.refine_reduce_axis(inputs, axis)
    vc_util.check_shape(inputs.shape)

    if not axis:
        output = akg.topi.identity(inputs)
    else:
        output = akg.topi.sum(inputs, axis=axis, keepdims=keepdims)
    attr_map = get_attrs()
    return output, attr_map


@vc_util.check_input_type(akg.tvm.tensor.Tensor, (list, tuple, int, type(None)), (bool, type(None)))
def sum_v2(inputs, axis=None, keepdims=True):
    """another implementation of sum with topi api."""
    dtype = inputs.dtype
    vc_util.ops_dtype_check(dtype, vc_util.DtypeForDavinci.ALL_FLOAT)
    axis = ft_util.refine_reduce_axis(inputs, axis)
    vc_util.check_shape(inputs.shape)
    if not axis:
        output = akg.topi.identity(inputs)
    else:
        if dtype == "float16":
            step_sum = cast(inputs, "float32")
        else:
            step_sum = inputs

        step_sum = akg.topi.sum(step_sum, axis=axis, keepdims=keepdims)

        if dtype == "float16":
            output = cast(step_sum, "float16")
        else:
            output = step_sum
    attr_map = get_attrs()
    return output, attr_map


def sum_by_shape(broadcast_data, original_shape):
    """sum the broadcast_data by original shape; gradient for Broadcast."""
    broadcast_shape = get_shape(broadcast_data)
    original_shape = get_shape(original_shape)
    if broadcast_shape == original_shape:
        return broadcast_data
    if original_shape == [1]:
        data, _ = sum_value(broadcast_data)
        return data

    vc_util.broadcast_check(original_shape, broadcast_shape)
    axis_len = len(broadcast_shape) - len(original_shape)
    if axis_len > 0:
        axis = list(range(axis_len))
        broadcast_data, _ = sum_value(broadcast_data, axis, False)
        broadcast_shape = get_shape(broadcast_data)

    axis = []
    for i, _ in enumerate(original_shape):
        if original_shape[i] != broadcast_shape[i]:
            axis.append(i)
    res = sum_value(broadcast_data, axis, True)[0] if axis else broadcast_data
    return res