|
- # Copyright 2020 Huawei Technologies Co., Ltd
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- # ===========================================================================
- """generate json desc for gelu"""
- from mindspore._extends.graph_kernel.model import model_builder as builder
-
- CSVALUE = 0.044715
- CSVALUE_SQRT_TWO_DIV_PI = 0.7978845608028564 # np.sqrt(2/np.pi)
- ONE = 1.0
- HALF = 0.5
-
-
- def expand_gelu(expand_info):
- """Gelu expander"""
- # cal formula are:
- # gelu(x) = 0.5 * x * (1.0 + tanh(y))
- # y = sqrt(2.0 / pi) * (x + 0.044715 * x * x * x)
-
- # get op info.
- input_desc = expand_info['input_desc'][0]
- graph_builder = builder.GraphBuilder()
-
- # generate a graph.
- with graph_builder.graph_scope('main') as graph_scope:
- # create tensor input.
- input_x = graph_builder.tensor(input_desc['shape'], input_desc['data_type'], input_desc['format'])
- graph_scope.set_input(input_x)
-
- # cal y
- mul_0 = graph_builder.emit('Mul', [input_x, input_x])
- pow_0 = graph_builder.emit('Mul', [mul_0, input_x])
- const_csvalue = graph_builder.value(pow_0.dtype, CSVALUE, input_desc['format'])
- mul_1 = graph_builder.emit('Mul', [pow_0, const_csvalue])
- tanh_res = graph_builder.emit('TensorAdd', [input_x, mul_1])
- const_csvalue_sqrt_two_div_pi = graph_builder.value(
- tanh_res.dtype, CSVALUE_SQRT_TWO_DIV_PI, input_desc['format'])
- y = graph_builder.emit('Mul', [tanh_res, const_csvalue_sqrt_two_div_pi])
-
- # cal gelu(x)
- tanh_y = graph_builder.emit('Tanh', [y])
- const_one = graph_builder.value(tanh_y.dtype, ONE, input_desc['format'])
- const_half = graph_builder.value(tanh_y.dtype, HALF, input_desc['format'])
- tanh_y_add_one = graph_builder.emit('TensorAdd', [tanh_y, const_one])
- mul_x = graph_builder.emit('Mul', [input_x, tanh_y_add_one])
- result = graph_builder.emit('Mul', [const_half, mul_x])
-
- # set graph output.
- graph_scope.set_output(result)
-
- graph = graph_builder.get()[0]
- return graph
|