|
- /**
- * Copyright 2019 Huawei Technologies Co., Ltd
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
- #include <map>
- #include "device/ascend/profiling/profiling_utils.h"
- #include "kernel/kernel.h"
- #include "device/ascend/profiling/profiling_manager.h"
- #include "session/anf_runtime_algorithm.h"
- #include "common/utils.h"
- #include "utils/utils.h"
-
- namespace mindspore {
- namespace device {
- namespace ascend {
- constexpr uint32_t kMaxProfilingNodeNum = 100;
- constexpr char kCustomNode[] = "PROFILING_CUSTOM_";
- constexpr char kFpStartNode[] = "PROFILING_FP_START";
- constexpr char kBpEndNode[] = "PROFILING_BP_END";
- constexpr char kIterEndNode[] = "PROFILING_ITER_END";
- std::unordered_map<uint32_t, std::vector<std::string>> ProfilingUtils::graph_kernel_name_;
- uint32_t ProfilingUtils::custom_node_index_ = 1;
-
- ProfilingTraceInfo ProfilingUtils::GetProfilingTraceFromEnv(NotNull<session::KernelGraph *> graph_ptr) {
- MS_LOG(INFO) << "get env start";
- custom_node_index_ = 1;
- auto &cnode_exec_order = graph_ptr->execution_order();
- ProfilingTraceInfo profiling_trace;
- profiling_trace.trace_begin = GetTraceBegin(cnode_exec_order);
- profiling_trace.trace_bp_end = GetTraceBpEnd();
- profiling_trace.trace_netoutput = GetTraceNetoutput(cnode_exec_order);
-
- MS_LOG(INFO) << "[profiling] trace_begin:" << profiling_trace.trace_begin
- << " trace_bp_end:" << profiling_trace.trace_bp_end
- << " trace_netoutput:" << profiling_trace.trace_netoutput;
-
- for (uint32_t i = 1; i <= kMaxProfilingNodeNum; ++i) {
- std::string env_str = std::string(kCustomNode) + std::to_string(i);
- const char *node_full_name = std::getenv(env_str.c_str());
- if (node_full_name == nullptr) {
- break;
- }
- MS_LOG(INFO) << "Get profiling node:" << node_full_name;
- profiling_trace.trace_custom_node.insert(node_full_name);
- }
- MS_LOG(INFO) << "get env end";
- return profiling_trace;
- }
-
- std::string ProfilingUtils::GetTraceBegin(const std::vector<CNodePtr> &cnode_exec_order) {
- const char *trace_begin = std::getenv(kFpStartNode);
- auto &first_cnode = cnode_exec_order.front();
- MS_EXCEPTION_IF_NULL(first_cnode);
- return trace_begin == nullptr ? first_cnode->fullname_with_scope() : std::string(trace_begin);
- }
-
- std::string ProfilingUtils::GetTraceBpEnd() {
- const char *trace_bp_end = std::getenv(kBpEndNode);
- return trace_bp_end == nullptr ? "" : std::string(trace_bp_end);
- }
-
- std::string ProfilingUtils::GetTraceNetoutput(const std::vector<CNodePtr> &cnode_exec_order) {
- const char *trace_netoutput = std::getenv(kIterEndNode);
- auto &last_cnode = cnode_exec_order.back();
- MS_EXCEPTION_IF_NULL(last_cnode);
- return trace_netoutput == nullptr ? last_cnode->fullname_with_scope() : std::string(trace_netoutput);
- }
-
- NotNull<CNodePtr> ProfilingUtils::CreateProfilingCNode(const ProfilingContent &profiling_content,
- NotNull<session::KernelGraph *> graph_ptr) {
- kernel::KernelBuildInfo::KernelBuildInfoBuilder selected_kernel_builder;
- selected_kernel_builder.SetInputsFormat({kOpFormat_DEFAULT, kOpFormat_DEFAULT});
- selected_kernel_builder.SetInputsDeviceType({TypeId::kNumberTypeInt32, TypeId::kNumberTypeInt32});
- selected_kernel_builder.SetFusionType(kernel::FusionType::OPAQUE);
- selected_kernel_builder.SetProcessor(kernel::Processor::AICORE);
- selected_kernel_builder.SetKernelType(KernelType::RT_KERNEL);
- abstract::AbstractBasePtr type_none_abstract = std::make_shared<abstract::AbstractNone>();
- auto primitive = std::make_shared<Primitive>(ProfilingUtils::kProfiling);
- std::vector<AnfNodePtr> inputs;
- inputs.emplace_back(NewValueNode(primitive));
- CNodePtr cnode_ptr = graph_ptr->NewCNode(inputs);
- MS_EXCEPTION_IF_NULL(cnode_ptr);
- AnfAlgo::SetSelectKernelBuildInfo(selected_kernel_builder.Build(), cnode_ptr.get());
- cnode_ptr->set_abstract(type_none_abstract);
- // set attr
- ValuePtr notify_value = MakeValue(profiling_content.notify);
- ValuePtr trace_id_value = MakeValue(profiling_content.profiler_trace_id);
- ValuePtr flags_value = MakeValue(profiling_content.flags);
- AnfAlgo::SetNodeAttr(ProfilingUtils::kNotify, notify_value, cnode_ptr);
- AnfAlgo::SetNodeAttr(ProfilingUtils::kProfilerTraceId, trace_id_value, cnode_ptr);
- AnfAlgo::SetNodeAttr(ProfilingUtils::kFlags, flags_value, cnode_ptr);
- return NOT_NULL(cnode_ptr);
- }
-
- void ProfilingUtils::ProfilingTraceFpStart(const mindspore::AnfNodePtr &anf_node,
- const ProfilingTraceInfo &profiling_trace_info,
- NotNull<session::KernelGraph *> graph_ptr,
- NotNull<std::vector<mindspore::CNodePtr> *> kernel_list) {
- if (profiling_trace_info.trace_begin == anf_node->fullname_with_scope()) {
- auto job_id = ProfilingManager::GetInstance().GetJobId();
- ProfilingContent job_profiling_context = {false, job_id, 0};
- auto job_profiling_node = CreateProfilingCNodeWithStream(anf_node, job_profiling_context, graph_ptr);
- kernel_list->emplace_back(job_profiling_node);
-
- ProfilingContent fp_profiling_content = {false, kProfilingFpStartLogId, 0};
- auto fp_profiling_node = CreateProfilingCNodeWithStream(anf_node, fp_profiling_content, graph_ptr);
- kernel_list->emplace_back(fp_profiling_node);
- }
- }
-
- CNodePtr ProfilingUtils::CreateProfilingCNodeWithStream(const mindspore::AnfNodePtr &anf_node,
- const ProfilingContent &profiling_content,
- NotNull<session::KernelGraph *> graph_ptr) {
- CNodePtr profiling_node = CreateProfilingCNode(profiling_content, graph_ptr);
- AnfAlgo::SetStreamDistinctionLabel(AnfAlgo::GetStreamDistinctionLabel(anf_node.get()), profiling_node.get());
- AnfAlgo::SetStreamId(AnfAlgo::GetStreamId(anf_node), profiling_node.get());
- return profiling_node;
- }
-
- void ProfilingUtils::ProfilingCustomOp(const AnfNodePtr &anf_node, const ProfilingTraceInfo &profiling_trace_info,
- NotNull<session::KernelGraph *> graph_ptr,
- NotNull<std::vector<CNodePtr> *> kernel_list) {
- MS_EXCEPTION_IF_NULL(anf_node);
- auto iter = profiling_trace_info.trace_custom_node.find(anf_node->fullname_with_scope());
- if (iter == profiling_trace_info.trace_custom_node.end()) {
- return;
- }
- // custom op profiling job start from 3.
- ProfilingContent front_profiling_content = {false, 2 * custom_node_index_ + 1, 0};
- CNodePtr front_node = CreateProfilingCNodeWithStream(anf_node, front_profiling_content, graph_ptr);
- kernel_list->insert(kernel_list->end() - 1, front_node);
-
- ProfilingContent back_profiling_content = {false, 2 * custom_node_index_ + 2, 0};
- CNodePtr back_node = CreateProfilingCNodeWithStream(anf_node, back_profiling_content, graph_ptr);
- kernel_list->insert(kernel_list->end(), back_node);
- ++custom_node_index_;
- }
-
- void ProfilingUtils::ProfilingTraceBpEnd(const AnfNodePtr &anf_node, const ProfilingTraceInfo &profiling_trace_info,
- NotNull<session::KernelGraph *> graph_ptr,
- NotNull<std::vector<CNodePtr> *> kernel_list) {
- MS_EXCEPTION_IF_NULL(anf_node);
- if (profiling_trace_info.trace_bp_end == anf_node->fullname_with_scope()) {
- ProfilingContent bp_end_profiling_content = {false, kProfilingBpEndLogId, 0};
- CNodePtr bp_end_node = CreateProfilingCNodeWithStream(anf_node, bp_end_profiling_content, graph_ptr);
- kernel_list->emplace_back(bp_end_node);
- }
- }
-
- void ProfilingUtils::ProfilingTraceEnd(const AnfNodePtr &anf_node, const ProfilingTraceInfo &profiling_trace_info,
- NotNull<session::KernelGraph *> graph_ptr,
- NotNull<std::vector<mindspore::CNodePtr> *> kernel_list) {
- MS_EXCEPTION_IF_NULL(anf_node);
- auto full_scope_name = anf_node->fullname_with_scope();
- if (profiling_trace_info.trace_netoutput == full_scope_name) {
- ProfilingContent bp_end_profiling_content = {true, kProfilingIterEndLogId, 0};
- CNodePtr bp_kernel_ptr = CreateProfilingCNodeWithStream(anf_node, bp_end_profiling_content, graph_ptr);
- kernel_list->emplace_back(bp_kernel_ptr);
- }
- }
-
- void ProfilingUtils::SetGraphKernelName(uint32_t graph_id, const std::vector<std::string> &kernel_names) {
- auto iter = graph_kernel_name_.find(graph_id);
- if (iter == graph_kernel_name_.end()) {
- graph_kernel_name_[graph_id] = kernel_names;
- } else {
- MS_LOG(ERROR) << "[profiling]graph kernel names already exist";
- }
- }
-
- void ProfilingUtils::ReportProfilingData(uint32_t graph_id, const std::vector<uint32_t> &task_ids) {
- auto iter = graph_kernel_name_.find(graph_id);
- if (iter == graph_kernel_name_.end()) {
- MS_LOG(ERROR) << "[profiling]graph id " << graph_id << " not in graph_kernel_name_";
- return;
- }
- auto &kernel_names = iter->second;
-
- MS_LOG(INFO) << "kernel_names size:" << kernel_names.size() << ", task_ids size:" << task_ids.size();
- if (kernel_names.size() != task_ids.size()) {
- MS_LOG(ERROR) << "[profiling]kernel name and task id not match";
- return;
- }
- std::map<uint32_t, std::string> op_task_id_map;
- size_t size = kernel_names.size();
- for (size_t i = 0; i < size; ++i) {
- auto it = op_task_id_map.find(task_ids[i]);
- if (it != op_task_id_map.end()) {
- MS_LOG(WARNING) << "task_id " << task_ids[i] << " exist, " << kernel_names[i];
- continue;
- }
- op_task_id_map[task_ids[i]] = kernel_names[i];
- }
- if (!ProfilingManager::GetInstance().ReportProfilingData(op_task_id_map)) {
- MS_LOG(ERROR) << "ReportProfilingData failed";
- }
- }
- } // namespace ascend
- } // namespace device
- } // namespace mindspore
|