You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

kernel_query.cc 6.9 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157
  1. /**
  2. * Copyright 2019 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "kernel/kernel_query.h"
  17. #include <memory>
  18. #include <algorithm>
  19. #include "kernel/aicpu/aicpu_kernel_metadata.h"
  20. #include "kernel/rts/rt_kernel_info.h"
  21. #include "kernel/hccl/hccl_kernel_metadata.h"
  22. #include "kernel/tbe/tbe_kernel_select/tbe_kernel_select.h"
  23. #include "kernel/akg/akg_kernel_metadata.h"
  24. #include "session/anf_runtime_algorithm.h"
  25. #include "utils/context/ms_context.h"
  26. namespace mindspore {
  27. namespace kernel {
  28. namespace {
  29. void FilterInvalidKernelInfo(const CNodePtr &kernel_node,
  30. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  31. MS_EXCEPTION_IF_NULL(kernel_info_list);
  32. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> filtered_list;
  33. (void)std::copy_if(kernel_info_list->begin(), kernel_info_list->end(), std::back_inserter(filtered_list),
  34. [&](const std::shared_ptr<kernel::KernelBuildInfo> &kernel_build_info) {
  35. return AnfAlgo::GetOutputTensorNum(kernel_node) == kernel_build_info->GetOutputNum() &&
  36. AnfAlgo::GetInputTensorNum(kernel_node) == kernel_build_info->GetInputNum();
  37. });
  38. if (!filtered_list.empty()) {
  39. kernel_info_list->clear();
  40. (void)std::copy(filtered_list.begin(), filtered_list.end(), std::back_inserter(*kernel_info_list));
  41. } else {
  42. MS_LOG(INFO) << "All kernel Info list does not match any kernel info ";
  43. for (size_t index = 0; index < kernel_info_list->size(); ++index) {
  44. std::ostringstream buffer;
  45. MS_EXCEPTION_IF_NULL(kernel_info_list->at(index));
  46. if (AnfAlgo::GetOutputTensorNum(kernel_node) != kernel_info_list->at(index)->GetOutputNum()) {
  47. buffer << "Kernel node's output size [" << AnfAlgo::GetOutputTensorNum(kernel_node) << "]"
  48. << " cannot match the kernel's output size [" << kernel_info_list->at(index)->GetOutputNum() << "]";
  49. } else {
  50. buffer << "Kernel node's output size [" << AnfAlgo::GetInputTensorNum(kernel_node) << "]"
  51. << " cannot match the kernel's output size [" << kernel_info_list->at(index)->GetInputNum() << "]";
  52. }
  53. MS_LOG(INFO) << "kernel [ " << index << " ] :" << kernel_info_list->at(index)->ToString() << buffer.str();
  54. }
  55. kernel_info_list->clear();
  56. MS_LOG(INFO) << "node" << kernel_node->DebugString() << "'s output size : ["
  57. << AnfAlgo::GetOutputTensorNum(kernel_node) << "]"
  58. << "input size : [" << AnfAlgo::GetInputTensorNum(kernel_node) << "] cannot match any kernelInfo !";
  59. }
  60. }
  61. } // namespace
  62. void KernelQueryAll(const CNodePtr &kernel_node,
  63. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  64. MS_EXCEPTION_IF_NULL(kernel_node);
  65. MS_EXCEPTION_IF_NULL(kernel_info_list);
  66. TbeMetadataInfo(kernel_node, kernel_info_list);
  67. if (kernel_info_list->empty()) {
  68. AicpuMetadataInfo(kernel_node, kernel_info_list);
  69. if (!kernel_info_list->empty()) {
  70. MS_LOG(INFO) << "The node [" << kernel_node->DebugString()
  71. << "] cannot find valid TBE kernel info, try to get aicpu kernel info";
  72. AnfAlgo::SetNodeAttr(kAttrIsAICPUKernel, MakeValue(true), kernel_node);
  73. }
  74. }
  75. if (kernel_info_list->empty()) {
  76. GetRtKelInfo(kernel_node, kernel_info_list);
  77. }
  78. if (kernel_info_list->empty()) {
  79. HcclMetadataInfo(kernel_node, kernel_info_list);
  80. }
  81. if (kernel_info_list->empty()) {
  82. MS_LOG(EXCEPTION) << "Op " << kernel_node->DebugString() << "kernel query fail!";
  83. }
  84. }
  85. void KernelQuery(const CNodePtr &kernel_node, std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list,
  86. KernelType kernel_type) {
  87. MS_EXCEPTION_IF_NULL(kernel_node);
  88. MS_EXCEPTION_IF_NULL(kernel_info_list);
  89. std::string op_name = AnfAlgo::GetCNodeName(kernel_node);
  90. auto context_ptr = MsContext::GetInstance();
  91. MS_EXCEPTION_IF_NULL(context_ptr);
  92. if (context_ptr->enable_graph_kernel() && IsPrimitiveCNode(kernel_node, prim::kPrimBatchMatMul)) {
  93. kernel_type = KernelType::AKG_KERNEL;
  94. }
  95. switch (kernel_type) {
  96. case KernelType::AKG_KERNEL:
  97. AkgMetadataInfo(kernel_node, kernel_info_list);
  98. break;
  99. default:
  100. KernelQueryAll(kernel_node, kernel_info_list);
  101. break;
  102. }
  103. if (kernel_info_list->empty()) {
  104. MS_EXCEPTION(NotExistsError) << "Op[" << kernel_node->DebugString() << "] kernel query fail!";
  105. }
  106. // check output
  107. FilterInvalidKernelInfo(kernel_node, kernel_info_list);
  108. }
  109. void AICPUQuery(const CNodePtr &kernel_node, std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  110. MS_EXCEPTION_IF_NULL(kernel_node);
  111. MS_EXCEPTION_IF_NULL(kernel_info_list);
  112. kernel_info_list->clear();
  113. AicpuMetadataInfo(kernel_node, kernel_info_list);
  114. FilterInvalidKernelInfo(kernel_node, kernel_info_list);
  115. }
  116. bool IsSupportedByAICPU(const AnfNodePtr &kernel_node, const KernelBuildInfoPtr &select_kernel_build_info) {
  117. MS_EXCEPTION_IF_NULL(kernel_node);
  118. MS_EXCEPTION_IF_NULL(select_kernel_build_info);
  119. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> kernel_info_list;
  120. auto cnode = kernel_node->cast<CNodePtr>();
  121. MS_EXCEPTION_IF_NULL(cnode);
  122. AICPUQuery(cnode, &kernel_info_list);
  123. return std::any_of(kernel_info_list.begin(), kernel_info_list.end(),
  124. [&select_kernel_build_info](const kernel::KernelBuildInfoPtr item) {
  125. MS_EXCEPTION_IF_NULL(item);
  126. return *item == *select_kernel_build_info;
  127. });
  128. }
  129. bool IsSupportedByAICore(const AnfNodePtr &kernel_node, const KernelBuildInfoPtr &select_kernel_build_info) {
  130. MS_EXCEPTION_IF_NULL(kernel_node);
  131. MS_EXCEPTION_IF_NULL(select_kernel_build_info);
  132. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> kernel_info_list;
  133. auto cnode = kernel_node->cast<CNodePtr>();
  134. MS_EXCEPTION_IF_NULL(cnode);
  135. TbeMetadataInfo(cnode, &kernel_info_list);
  136. return std::any_of(kernel_info_list.begin(), kernel_info_list.end(),
  137. [&select_kernel_build_info](const kernel::KernelBuildInfoPtr item) {
  138. MS_EXCEPTION_IF_NULL(item);
  139. return *item == *select_kernel_build_info;
  140. });
  141. }
  142. } // namespace kernel
  143. } // namespace mindspore