You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

kernel_query.cc 6.9 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158
  1. /**
  2. * Copyright 2019 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "kernel/kernel_query.h"
  17. #include <memory>
  18. #include <algorithm>
  19. #include "kernel/aicpu/aicpu_kernel_metadata.h"
  20. #include "kernel/rts/rt_kernel_info.h"
  21. #include "kernel/hccl/hccl_kernel_metadata.h"
  22. #include "kernel/tbe/tbe_kernel_select/tbe_kernel_select.h"
  23. #include "kernel/akg/akg_kernel_metadata.h"
  24. #include "session/anf_runtime_algorithm.h"
  25. #include "utils/context/ms_context.h"
  26. namespace mindspore {
  27. namespace kernel {
  28. namespace {
  29. void FilterInvalidKernelInfo(const CNodePtr &kernel_node,
  30. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  31. MS_EXCEPTION_IF_NULL(kernel_info_list);
  32. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> filtered_list;
  33. (void)std::copy_if(kernel_info_list->begin(), kernel_info_list->end(), std::back_inserter(filtered_list),
  34. [&kernel_node](const std::shared_ptr<kernel::KernelBuildInfo> &kernel_build_info) {
  35. return AnfAlgo::GetOutputTensorNum(kernel_node) == kernel_build_info->GetOutputNum() &&
  36. AnfAlgo::GetInputTensorNum(kernel_node) == kernel_build_info->GetInputNum();
  37. });
  38. if (!filtered_list.empty()) {
  39. kernel_info_list->clear();
  40. (void)std::copy(filtered_list.begin(), filtered_list.end(), std::back_inserter(*kernel_info_list));
  41. } else {
  42. MS_LOG(INFO) << "All kernel Info list does not match any kernel info ";
  43. for (size_t index = 0; index < kernel_info_list->size(); ++index) {
  44. std::ostringstream buffer;
  45. auto kernel_info = kernel_info_list->at(index);
  46. MS_EXCEPTION_IF_NULL(kernel_info);
  47. if (AnfAlgo::GetOutputTensorNum(kernel_node) != kernel_info->GetOutputNum()) {
  48. buffer << "Kernel node's output size [" << AnfAlgo::GetOutputTensorNum(kernel_node) << "]"
  49. << " cannot match the kernel's output size [" << kernel_info->GetOutputNum() << "]";
  50. } else {
  51. buffer << "Kernel node's output size [" << AnfAlgo::GetInputTensorNum(kernel_node) << "]"
  52. << " cannot match the kernel's output size [" << kernel_info->GetInputNum() << "]";
  53. }
  54. MS_LOG(INFO) << "kernel [ " << index << " ] :" << kernel_info->ToString() << buffer.str();
  55. }
  56. kernel_info_list->clear();
  57. MS_LOG(INFO) << "node" << kernel_node->DebugString() << "'s output size : ["
  58. << AnfAlgo::GetOutputTensorNum(kernel_node) << "]"
  59. << "input size : [" << AnfAlgo::GetInputTensorNum(kernel_node) << "] cannot match any kernelInfo !";
  60. }
  61. }
  62. } // namespace
  63. void KernelQueryAll(const CNodePtr &kernel_node,
  64. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  65. MS_EXCEPTION_IF_NULL(kernel_node);
  66. MS_EXCEPTION_IF_NULL(kernel_info_list);
  67. TbeMetadataInfo(kernel_node, kernel_info_list);
  68. if (kernel_info_list->empty()) {
  69. AicpuMetadataInfo(kernel_node, kernel_info_list);
  70. if (!kernel_info_list->empty()) {
  71. MS_LOG(INFO) << "The node [" << kernel_node->DebugString()
  72. << "] cannot find valid TBE kernel info, try to get aicpu kernel info";
  73. AnfAlgo::SetNodeAttr(kAttrIsAICPUKernel, MakeValue(true), kernel_node);
  74. }
  75. }
  76. if (kernel_info_list->empty()) {
  77. GetRtKelInfo(kernel_node, kernel_info_list);
  78. }
  79. if (kernel_info_list->empty()) {
  80. HcclMetadataInfo(kernel_node, kernel_info_list);
  81. }
  82. if (kernel_info_list->empty()) {
  83. MS_LOG(EXCEPTION) << "Op " << kernel_node->DebugString() << "kernel query fail!";
  84. }
  85. }
  86. void KernelQuery(const CNodePtr &kernel_node, std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list,
  87. KernelType kernel_type) {
  88. MS_EXCEPTION_IF_NULL(kernel_node);
  89. MS_EXCEPTION_IF_NULL(kernel_info_list);
  90. std::string op_name = AnfAlgo::GetCNodeName(kernel_node);
  91. auto context_ptr = MsContext::GetInstance();
  92. MS_EXCEPTION_IF_NULL(context_ptr);
  93. if (context_ptr->enable_graph_kernel() && IsPrimitiveCNode(kernel_node, prim::kPrimBatchMatMul)) {
  94. kernel_type = KernelType::AKG_KERNEL;
  95. }
  96. switch (kernel_type) {
  97. case KernelType::AKG_KERNEL:
  98. AkgMetadataInfo(kernel_node, kernel_info_list);
  99. break;
  100. default:
  101. KernelQueryAll(kernel_node, kernel_info_list);
  102. break;
  103. }
  104. if (kernel_info_list->empty()) {
  105. MS_EXCEPTION(NotExistsError) << "Op[" << kernel_node->DebugString() << "] kernel query fail!";
  106. }
  107. // check output
  108. FilterInvalidKernelInfo(kernel_node, kernel_info_list);
  109. }
  110. void AICPUQuery(const CNodePtr &kernel_node, std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  111. MS_EXCEPTION_IF_NULL(kernel_node);
  112. MS_EXCEPTION_IF_NULL(kernel_info_list);
  113. kernel_info_list->clear();
  114. AicpuMetadataInfo(kernel_node, kernel_info_list);
  115. FilterInvalidKernelInfo(kernel_node, kernel_info_list);
  116. }
  117. bool IsSupportedByAICPU(const AnfNodePtr &kernel_node, const KernelBuildInfoPtr &select_kernel_build_info) {
  118. MS_EXCEPTION_IF_NULL(kernel_node);
  119. MS_EXCEPTION_IF_NULL(select_kernel_build_info);
  120. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> kernel_info_list;
  121. auto cnode = kernel_node->cast<CNodePtr>();
  122. MS_EXCEPTION_IF_NULL(cnode);
  123. AICPUQuery(cnode, &kernel_info_list);
  124. return std::any_of(kernel_info_list.begin(), kernel_info_list.end(),
  125. [&select_kernel_build_info](const kernel::KernelBuildInfoPtr item) {
  126. MS_EXCEPTION_IF_NULL(item);
  127. return *item == *select_kernel_build_info;
  128. });
  129. }
  130. bool IsSupportedByAICore(const AnfNodePtr &kernel_node, const KernelBuildInfoPtr &select_kernel_build_info) {
  131. MS_EXCEPTION_IF_NULL(kernel_node);
  132. MS_EXCEPTION_IF_NULL(select_kernel_build_info);
  133. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> kernel_info_list;
  134. auto cnode = kernel_node->cast<CNodePtr>();
  135. MS_EXCEPTION_IF_NULL(cnode);
  136. TbeMetadataInfo(cnode, &kernel_info_list);
  137. return std::any_of(kernel_info_list.begin(), kernel_info_list.end(),
  138. [&select_kernel_build_info](const kernel::KernelBuildInfoPtr item) {
  139. MS_EXCEPTION_IF_NULL(item);
  140. return *item == *select_kernel_build_info;
  141. });
  142. }
  143. } // namespace kernel
  144. } // namespace mindspore