/** * Copyright 2019-2020 Huawei Technologies Co., Ltd * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "backend/session/cpu_session.h" #include #include #include "ir/tensor.h" #include "ir/anf.h" #include "backend/kernel_compiler/kernel.h" #include "common/utils.h" #include "backend/session/anf_runtime_algorithm.h" #include "runtime/device/kernel_runtime.h" #include "backend/kernel_compiler/cpu/cpu_kernel_factory.h" #include "runtime/device/cpu/kernel_select_cpu.h" #include "backend/optimizer/common/optimizer.h" #include "backend/optimizer/common/pass_manager.h" #include "backend/optimizer/pass/replace_node_by_proxy.h" #ifdef ENABLE_DEBUGGER #include "debug/debugger/debugger.h" #endif #if (ENABLE_CPU && (ENABLE_D || ENABLE_GPU)) #include "frontend/parallel/ps/util.h" #endif namespace mindspore { namespace session { ParameterPtr CPUSession::CreateNewParameterFromParameter(const AnfNodePtr &anf, bool valid_input, KernelGraph *graph) { MS_EXCEPTION_IF_NULL(anf); MS_EXCEPTION_IF_NULL(graph); if (!anf->isa()) { MS_LOG(EXCEPTION) << "anf[" << anf->DebugString() << "] is not a parameter"; } auto valid_inputs = graph->MutableValidInputs(); MS_EXCEPTION_IF_NULL(valid_inputs); auto graph_inputs = graph->MutableInputs(); MS_EXCEPTION_IF_NULL(graph_inputs); TraceManager::DebugTrace(std::make_shared(anf->debug_info())); ParameterPtr new_parameter = graph->NewParameter(anf->cast()); TraceManager::EndTrace(); graph_inputs->push_back(new_parameter); valid_inputs->push_back(valid_input); return new_parameter; } void CPUSession::Optimize(const std::shared_ptr &kernel_graph) { auto optimizer = std::make_shared(); auto pm = std::make_shared(); std::string pass_name = "replace_node_by_proxy"; pass_name.append(std::to_string(graph_sum_)); pm->AddPass(std::make_shared(pass_name)); optimizer->AddPassManager(pm); (void)optimizer->Optimize(kernel_graph); kernel_graph->SetExecOrderByDefault(); } GraphId CPUSession::CompileGraph(const AnfNodePtrList &lst, const AnfNodePtrList &outputs) { auto graph_id = graph_sum_; auto graph = ConstructKernelGraph(lst, outputs); MS_EXCEPTION_IF_NULL(graph); MS_LOG(INFO) << "Set kernel info"; SetKernelInfo(graph.get()); #if (ENABLE_CPU && (ENABLE_D || ENABLE_GPU)) AssignParamKey(graph); if (parallel::ps::Util::IsRoleOfWorker()) { Optimize(graph); } #endif MS_LOG(INFO) << "Build kernel"; BuildKernel(graph.get()); MS_LOG(INFO) << "Assign kernel address"; runtime_.AssignKernelAddress(graph.get()); return graph_id; } void CPUSession::RunGraph(const GraphId &graph_id, const std::vector &inputs, VectorRef *outputs) { auto &kernel_graph = graphs_[graph_id]; MS_EXCEPTION_IF_NULL(kernel_graph); #if (ENABLE_CPU && (ENABLE_D || ENABLE_GPU)) // Initialize parameter server if (!ps_init_) { InitPSParamAndOptim(kernel_graph, inputs); } #endif MS_LOG(INFO) << "Bind input output address"; std::vector need_sync_outputs; runtime_.BindInputOutput(kernel_graph.get(), inputs, outputs, &need_sync_outputs); MS_LOG(INFO) << "Run graph start"; auto execution_order = kernel_graph->execution_order(); Reorder(&execution_order); bool enable_summary = summary_callback_ != nullptr; kernel_graph->set_execution_order(execution_order); NamedSummaryOutputs summary_outputs; if (enable_summary) { SetSummaryNodes(kernel_graph.get()); summary_outputs = kernel_graph->summary_nodes(); runtime_.IncreaseSummaryRefCount(summary_outputs); } #ifdef ENABLE_DEBUGGER // debugger pre-execution processing if (debugger_) { debugger_->PreExecute(kernel_graph); } #endif bool ret = runtime_.Run(kernel_graph.get()); if (!ret) { MS_LOG(EXCEPTION) << "Run graph failed"; } for (auto output : need_sync_outputs) { (void)output->data_sync(); } if (enable_summary) { Summary(kernel_graph.get()); runtime_.DecreaseSummaryRefCount(summary_outputs); } #ifdef ENABLE_DEBUGGER // debugger post-execution processing if (debugger_) { debugger_->PostExecute(); } #endif MS_LOG(INFO) << "Run graph end"; } void CPUSession::SetKernelInfo(const KernelGraph *kernel_graph) { MS_EXCEPTION_IF_NULL(kernel_graph); auto &kernel_nodes = kernel_graph->execution_order(); for (const auto &kernel_node : kernel_nodes) { MS_EXCEPTION_IF_NULL(kernel_node); device::cpu::SetKernelInfo(kernel_node); } } namespace { void KernelNotSupportException(const AnfNodePtr &kernel_node) { std::string kernel_name = AnfAlgo::GetCNodeName(kernel_node); std::stringstream operator_info; operator_info << "Operator[" << kernel_name << "] "; auto kernel_info = dynamic_cast(kernel_node->kernel_info()); if (kernel_info == nullptr) { operator_info << "is not support."; MS_LOG(EXCEPTION) << operator_info.str(); } auto kernel_build_Info = kernel_info->select_kernel_build_info(); if (kernel_build_Info == nullptr) { operator_info << "is not support."; MS_LOG(EXCEPTION) << operator_info.str(); } size_t input_num = kernel_build_Info->GetInputNum(); if (input_num > 0) { operator_info << " input("; for (size_t i = 0; i < input_num; ++i) { operator_info << TypeIdLabel(kernel_build_Info->GetInputDeviceType(i)); if (i != input_num - 1) { operator_info << ","; } } operator_info << ") "; } size_t output_num = kernel_build_Info->GetOutputNum(); if (output_num > 0) { operator_info << "output("; for (size_t i = 0; i < output_num; ++i) { operator_info << TypeIdLabel(kernel_build_Info->GetOutputDeviceType(i)); if (i != kernel_build_Info->GetOutputNum() - 1) { operator_info << ","; } } operator_info << ") "; } operator_info << "is not support."; MS_LOG(EXCEPTION) << operator_info.str(); } } // namespace void CPUSession::BuildKernel(const KernelGraph *kernel_graph) { MS_EXCEPTION_IF_NULL(kernel_graph); auto &kernel_nodes = kernel_graph->execution_order(); for (const auto &kernel_node : kernel_nodes) { MS_EXCEPTION_IF_NULL(kernel_node); std::string kernel_name = AnfAlgo::GetCNodeName(kernel_node); MS_LOG(INFO) << "Cpu building operator[" << kernel_name << "]."; std::shared_ptr cpu_kernel = kernel::CPUKernelFactory::GetInstance().Create(kernel_name, kernel_node); if (cpu_kernel == nullptr) { KernelNotSupportException(kernel_node); } cpu_kernel->Init(kernel_node); AnfAlgo::SetKernelMod(cpu_kernel, kernel_node.get()); MS_LOG(INFO) << "Cpu build success operator[" << kernel_name << "]."; } } } // namespace session } // namespace mindspore