Merge pull request !750 from liubuyu/mastertags/v0.3.0-alpha
| @@ -38,6 +38,7 @@ | |||||
| #include "pre_activate/ascend/ir_fusion/adam_apply_one_fusion.h" | #include "pre_activate/ascend/ir_fusion/adam_apply_one_fusion.h" | ||||
| #include "pre_activate/ascend/ir_fusion/adam_apply_one_with_decay_rule.h" | #include "pre_activate/ascend/ir_fusion/adam_apply_one_with_decay_rule.h" | ||||
| #include "pre_activate/ascend/ir_fusion/parameter_and_transop_fusion.h" | #include "pre_activate/ascend/ir_fusion/parameter_and_transop_fusion.h" | ||||
| #include "pre_activate/ascend/ir_fusion/refresh_parameter_format.h" | |||||
| #include "pre_activate/ascend/ir_fusion/transpose_transdata_fusion.h" | #include "pre_activate/ascend/ir_fusion/transpose_transdata_fusion.h" | ||||
| #include "pre_activate/ascend/ir_fission/transdata_split.h" | #include "pre_activate/ascend/ir_fission/transdata_split.h" | ||||
| #include "pre_activate/ascend/ir_fission/topk_split.h" | #include "pre_activate/ascend/ir_fission/topk_split.h" | ||||
| @@ -265,6 +266,7 @@ void AscendBackendOptimization(const std::shared_ptr<session::KernelGraph> &kern | |||||
| other_pm->AddPass(std::make_shared<AllReduceFusion>()); | other_pm->AddPass(std::make_shared<AllReduceFusion>()); | ||||
| other_pm->AddPass(std::make_shared<AllGatherFusion>()); | other_pm->AddPass(std::make_shared<AllGatherFusion>()); | ||||
| other_pm->AddPass(std::make_shared<ParameterTransOpFusion>()); | other_pm->AddPass(std::make_shared<ParameterTransOpFusion>()); | ||||
| other_pm->AddPass(std::make_shared<RefreshParameterFormat>()); | |||||
| other_pm->AddPass(std::make_shared<BufferFusion>()); | other_pm->AddPass(std::make_shared<BufferFusion>()); | ||||
| other_pm->AddPass(std::make_shared<GetitemTuple>()); | other_pm->AddPass(std::make_shared<GetitemTuple>()); | ||||
| other_pm->AddPass(std::make_shared<CommonSubexpressionElimination>()); | other_pm->AddPass(std::make_shared<CommonSubexpressionElimination>()); | ||||
| @@ -0,0 +1,71 @@ | |||||
| /** | |||||
| * Copyright 2020 Huawei Technologies Co., Ltd | |||||
| * | |||||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||||
| * you may not use this file except in compliance with the License. | |||||
| * You may obtain a copy of the License at | |||||
| * | |||||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||||
| * | |||||
| * Unless required by applicable law or agreed to in writing, software | |||||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||||
| * See the License for the specific language governing permissions and | |||||
| * limitations under the License. | |||||
| */ | |||||
| #include "pre_activate/ascend/ir_fusion/refresh_parameter_format.h" | |||||
| #include "session/anf_runtime_algorithm.h" | |||||
| #include "utils/utils.h" | |||||
| #include "operator/ops.h" | |||||
| #include "device/kernel_info.h" | |||||
| #include "pre_activate/common/helper.h" | |||||
| #include "pre_activate/common/optimizer.h" | |||||
| #include "pre_activate/ascend/ascend_helper.h" | |||||
| namespace mindspore { | |||||
| namespace opt { | |||||
| void DoRefresh(const CNodePtr &cnode) { | |||||
| if (cnode == nullptr) { | |||||
| MS_LOG(EXCEPTION) << "node is nullptr"; | |||||
| } | |||||
| for (size_t input_index = 0; input_index < AnfAlgo::GetInputTensorNum(cnode); input_index++) { | |||||
| auto input_kernel_node = AnfAlgo::GetInputNode(cnode, input_index); | |||||
| if (input_kernel_node->isa<Parameter>()) { | |||||
| std::shared_ptr<kernel::KernelBuildInfo::KernelBuildInfoBuilder> builder = | |||||
| std::make_shared<kernel::KernelBuildInfo::KernelBuildInfoBuilder>(); | |||||
| auto cnode_input_format = AnfAlgo::GetInputFormat(cnode, input_index); | |||||
| auto kernel_node_format = AnfAlgo::GetOutputFormat(input_kernel_node, 0); | |||||
| auto dtype = AnfAlgo::GetOutputDeviceDataType(input_kernel_node, 0); | |||||
| if (kernel_node_format != cnode_input_format) { | |||||
| builder->SetOutputsFormat({cnode_input_format}); | |||||
| builder->SetOutputsDeviceType({dtype}); | |||||
| AnfAlgo::SetSelectKernelBuildInfo(builder->Build(), input_kernel_node.get()); | |||||
| } | |||||
| } | |||||
| } | |||||
| } | |||||
| bool RefreshParameterFormat::Run(const FuncGraphPtr &func_graph) { | |||||
| if (func_graph == nullptr) { | |||||
| MS_LOG(ERROR) << "func_graph is nullptr."; | |||||
| return false; | |||||
| } | |||||
| std::vector<AnfNodePtr> node_list = TopoSort(func_graph->get_return()); | |||||
| for (auto node : node_list) { | |||||
| if (node == nullptr || !node->isa<CNode>()) { | |||||
| continue; | |||||
| } | |||||
| auto cnode = node->cast<CNodePtr>(); | |||||
| if (cnode == nullptr) { | |||||
| continue; | |||||
| } | |||||
| auto node_name = AnfAlgo::GetCNodeName(cnode); | |||||
| if (node_name == kBNTrainingUpdateOpName) { | |||||
| DoRefresh(cnode); | |||||
| } | |||||
| } | |||||
| return true; | |||||
| } | |||||
| } // namespace opt | |||||
| } // namespace mindspore | |||||
| @@ -0,0 +1,40 @@ | |||||
| /** | |||||
| * Copyright 2020 Huawei Technologies Co., Ltd | |||||
| * | |||||
| * Licensed under the Apache License, Version 2.0 (the "License"); | |||||
| * you may not use this file except in compliance with the License. | |||||
| * You may obtain a copy of the License at | |||||
| * | |||||
| * http://www.apache.org/licenses/LICENSE-2.0 | |||||
| * | |||||
| * Unless required by applicable law or agreed to in writing, software | |||||
| * distributed under the License is distributed on an "AS IS" BASIS, | |||||
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |||||
| * See the License for the specific language governing permissions and | |||||
| * limitations under the License. | |||||
| */ | |||||
| #ifndef MINDSPORE_CCSRC_PRE_ACTIVATE_ASCEND_IR_FUSION_REFRESH_PARAMETER_FORMAT_H_ | |||||
| #define MINDSPORE_CCSRC_PRE_ACTIVATE_ASCEND_IR_FUSION_REFRESH_PARAMETER_FORMAT_H_ | |||||
| #include <vector> | |||||
| #include <memory> | |||||
| #include <utility> | |||||
| #include "ir/anf.h" | |||||
| #include "pre_activate/common/pass.h" | |||||
| namespace mindspore { | |||||
| namespace opt { | |||||
| class RefreshParameterFormat : public Pass { | |||||
| public: | |||||
| explicit RefreshParameterFormat(size_t groups = 1) : Pass("refresh_parameter_format"), groups_(groups) {} | |||||
| ~RefreshParameterFormat() override = default; | |||||
| bool Run(const FuncGraphPtr &graph) override; | |||||
| private: | |||||
| size_t groups_ = 1; | |||||
| }; | |||||
| } // namespace opt | |||||
| } // namespace mindspore | |||||
| #endif // MINDSPORE_CCSRC_PRE_ACTIVATE_ASCEND_IR_FUSION_REFRESH_PARAMETER_FORMAT_H_ | |||||