# Copyright 2020-2021 Huawei Technologies Co., Ltd # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. # =========================================================================== """generate json desc for gelu""" from ._utils import Expander class GeLU(Expander): """GeLU expander""" CSVALUE = 0.044715 CSVALUE_SQRT_TWO_DIV_PI = 0.7978845608028564 # np.sqrt(2/np.pi) def _expand(self, graph_builder): # cal formula are: # gelu of x is 0.5 * x * (1.0 + tanh(y)) # y is sqrt(2.0 / pi) * (x + 0.044715 * x * x * x) input_x = self.inputs[0] # cal y mul_0 = graph_builder.emit('Mul', [input_x, input_x]) pow_0 = graph_builder.emit('Mul', [mul_0, input_x]) const_csvalue = graph_builder.value(pow_0.dtype, self.CSVALUE) mul_1 = graph_builder.emit('Mul', [pow_0, const_csvalue]) tanh_res = graph_builder.emit('Add', [input_x, mul_1]) const_csvalue_sqrt_two_div_pi = graph_builder.value(tanh_res.dtype, self.CSVALUE_SQRT_TWO_DIV_PI) y = graph_builder.emit('Mul', [tanh_res, const_csvalue_sqrt_two_div_pi]) # cal gelu(x) tanh_y = graph_builder.emit('Tanh', [y]) const_one = graph_builder.value(tanh_y.dtype, 1) const_half = graph_builder.value(tanh_y.dtype, 0.5) tanh_y_add_one = graph_builder.emit('Add', [tanh_y, const_one]) mul_x = graph_builder.emit('Mul', [input_x, tanh_y_add_one]) result = graph_builder.emit('Mul', [const_half, mul_x]) return result