|
- # Copyright 2021 Huawei Technologies Co., Ltd
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- # ============================================================================
-
- import numpy as np
- import pytest
-
- import mindspore.context as context
- import mindspore.nn as nn
- from mindspore import Tensor
- from mindspore.ops.operations import _grad_ops as G
- from mindspore.ops import operations as P
-
-
- class Net(nn.Cell):
- def __init__(self, reduction):
- super(Net, self).__init__()
- self.loss = P.NLLLoss(reduction=reduction)
-
- def construct(self, predict, target, weight):
- return self.loss(predict, target, weight)
-
-
- class NLLLossGradNet(nn.Cell):
- def __init__(self, reduction):
- super(NLLLossGradNet, self).__init__()
- self.grad = G.NLLLossGrad(reduction=reduction)
-
- def construct(self, x, dout_x, target, weight, total_weight):
- gout = self.grad(x, dout_x, target, weight, total_weight)
- return gout
-
-
- def nll_loss_template(nptype_input, nptype_weight, reduction):
- context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
-
- nll_loss_net = Net(reduction)
-
- predict = Tensor(
- np.array([[0.53, 0.74, -2.12], [1.29, -0.34, -1.13]]).astype(nptype_input))
-
- target = Tensor(np.array([0, 1]).astype(np.int32))
-
- weight = Tensor(np.array([0.45, -0.32, 1.21]).astype(nptype_weight))
-
- loss, total_weight = nll_loss_net(predict, target, weight)
-
- loss_np = loss.asnumpy()
- total_weight_np = total_weight.asnumpy()
-
- expected_tot_weight = np.array(0.129999995)
-
- if reduction == 'none':
- expected_loss = np.array([-0.238499984, -0.108800001])
- elif reduction == 'mean':
- expected_loss = np.array(-2.67153859)
- elif reduction == 'sum':
- expected_loss = np.array(-0.347299993)
-
- if nptype_input == np.float32 and nptype_weight == np.float32:
- ertol_loss = 1e-06
- elif nptype_input == np.float16 or nptype_weight == np.float16:
- ertol_loss = 1e-03
-
- if nptype_weight == np.float32:
- ertol_weight = 1e-06
- elif nptype_weight == np.float16:
- ertol_weight = 1e-03
-
- np.testing.assert_allclose(loss_np, expected_loss, ertol_loss)
- np.testing.assert_allclose(
- total_weight_np, expected_tot_weight, ertol_weight)
-
-
- def nll_loss_grad_template(nptype_input, nptype_weight, reduction):
- context.set_context(mode=context.GRAPH_MODE, device_target="GPU")
-
- nll_loss_grad_net = NLLLossGradNet(reduction)
-
- x = Tensor(
- np.array([[0.53, 0.74, -2.12], [1.29, -0.34, -1.13]]).astype(nptype_input))
-
- if reduction == "none":
- dloss = Tensor(
- np.array([3.24, -2.13]).astype(nptype_input))
- else:
- dloss = Tensor(np.array(1.23).astype(nptype_input))
-
- target = Tensor(np.array([0, 1]).astype(np.int32))
- weight = Tensor(np.array([0.45, -0.32, 1.21]).astype(nptype_weight))
-
- total_weight = Tensor(np.array(0.13).astype(nptype_weight))
-
- dx = nll_loss_grad_net(x, dloss, target, weight, total_weight)
-
- dx_np = dx.asnumpy()
-
- print(dx)
-
- if reduction == "none":
- dx_expected = np.array([[-1.45799994, 0, 0], [0, -0.681600034, 0]])
- elif reduction == "mean":
- dx_expected = np.array([[-4.25769234, 0, 0], [0, 3.02769232, 0]])
- else:
- dx_expected = np.array([[-0.553499997, 0, 0], [0, 0.393599987, 0]])
-
- if nptype_input == np.float32 and nptype_weight == np.float32:
- ertol_loss = 1e-06
- else:
- ertol_loss = 1e-02
-
- np.testing.assert_allclose(dx_np, dx_expected, ertol_loss)
-
-
- @pytest.mark.level0
- @pytest.mark.platform_x86_gpu_training
- @pytest.mark.env_onecard
- def test_nll_loss_no_reduction():
- # Four combinations of fp32 and fp16 inputs and weights
- nll_loss_template(np.float32, np.float32, "none")
- nll_loss_template(np.float32, np.float16, "none")
- nll_loss_template(np.float16, np.float32, "none")
- nll_loss_template(np.float16, np.float16, "none")
-
-
- @pytest.mark.level0
- @pytest.mark.platform_x86_gpu_training
- @pytest.mark.env_onecard
- def test_nll_loss_mean_reduction():
- # Four combinations of fp32 and fp16 inputs and weights
- nll_loss_template(np.float32, np.float32, "mean")
- nll_loss_template(np.float32, np.float16, "mean")
- nll_loss_template(np.float16, np.float32, "mean")
- nll_loss_template(np.float16, np.float16, "mean")
-
-
- @pytest.mark.level0
- @pytest.mark.platform_x86_gpu_training
- @pytest.mark.env_onecard
- def test_nll_loss_sum_reduction():
- # Four combinations of fp32 and fp16 inputs and weights
- nll_loss_template(np.float32, np.float32, "sum")
- nll_loss_template(np.float32, np.float16, "sum")
- nll_loss_template(np.float16, np.float32, "sum")
- nll_loss_template(np.float16, np.float16, "sum")
-
-
- @pytest.mark.level0
- @pytest.mark.platform_x86_gpu_training
- @pytest.mark.env_onecard
- def test_nll_loss_grad_mean_reduction():
- # Four combinations of fp32 and fp16 inputs and weights
- nll_loss_grad_template(np.float32, np.float32, "mean")
- nll_loss_grad_template(np.float32, np.float16, "mean")
- nll_loss_grad_template(np.float16, np.float32, "mean")
- nll_loss_grad_template(np.float16, np.float16, "mean")
-
-
- @pytest.mark.level0
- @pytest.mark.platform_x86_gpu_training
- @pytest.mark.env_onecard
- def test_nll_loss_grad_sum_reduction():
- # Four combinations of fp32 and fp16 inputs and weights
- nll_loss_grad_template(np.float32, np.float32, "sum")
- nll_loss_grad_template(np.float32, np.float16, "sum")
- nll_loss_grad_template(np.float16, np.float32, "sum")
- nll_loss_grad_template(np.float16, np.float16, "sum")
-
-
- @pytest.mark.level0
- @pytest.mark.platform_x86_gpu_training
- @pytest.mark.env_onecard
- def test_nll_loss_grad_no_reduction():
- # Four combinations of fp32 and fp16 inputs and weights
- nll_loss_grad_template(np.float32, np.float32, "none")
- nll_loss_grad_template(np.float32, np.float16, "none")
- nll_loss_grad_template(np.float16, np.float32, "none")
- nll_loss_grad_template(np.float16, np.float16, "none")
|