You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

kernel_query.cc 7.7 kB

4 years ago
5 years ago
5 years ago
4 years ago
4 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183
  1. /**
  2. * Copyright 2019 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "kernel/kernel_query.h"
  17. #include <algorithm>
  18. #include "plugin/device/ascend/kernel/aicpu/aicpu_kernel_metadata.h"
  19. #include "plugin/device/ascend/kernel/host/host_kernel_metadata.h"
  20. #include "plugin/device/ascend/kernel/rts/rt_kernel_info.h"
  21. #include "plugin/device/ascend/kernel/hccl/hccl_kernel_metadata.h"
  22. #include "plugin/device/ascend/kernel/tbe/tbe_kernel_select/tbe_kernel_select.h"
  23. #include "kernel/akg/akg_kernel_metadata.h"
  24. #include "backend/common/session/anf_runtime_algorithm.h"
  25. #include "utils/ms_context.h"
  26. #include "utils/trace_base.h"
  27. namespace mindspore {
  28. namespace kernel {
  29. namespace {
  30. void FilterInvalidKernelInfo(const CNodePtr &kernel_node,
  31. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  32. MS_EXCEPTION_IF_NULL(kernel_info_list);
  33. if (kernel_info_list->empty()) {
  34. return;
  35. }
  36. MS_EXCEPTION_IF_NULL(kernel_node);
  37. size_t output_tensor_num = AnfAlgo::GetOutputTensorNum(kernel_node);
  38. size_t input_tensor_num = AnfAlgo::GetInputTensorNum(kernel_node);
  39. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> filtered_list;
  40. (void)std::copy_if(
  41. kernel_info_list->begin(), kernel_info_list->end(), std::back_inserter(filtered_list),
  42. [output_tensor_num, input_tensor_num](const std::shared_ptr<kernel::KernelBuildInfo> &kernel_build_info) {
  43. return kernel_build_info->GetOutputNum() == output_tensor_num &&
  44. kernel_build_info->GetInputNum() == input_tensor_num;
  45. });
  46. if (!filtered_list.empty()) {
  47. kernel_info_list->clear();
  48. (void)std::copy(filtered_list.begin(), filtered_list.end(), std::back_inserter(*kernel_info_list));
  49. } else {
  50. for (size_t index = 0; index < kernel_info_list->size(); ++index) {
  51. std::ostringstream buffer;
  52. auto &kernel_info = kernel_info_list->at(index);
  53. MS_EXCEPTION_IF_NULL(kernel_info);
  54. if (kernel_info->GetOutputNum() != output_tensor_num) {
  55. buffer << "Kernel node's output size [" << output_tensor_num << "]"
  56. << " cannot match the kernel's output size [" << kernel_info->GetOutputNum() << "]";
  57. } else {
  58. buffer << "Kernel node's input size [" << input_tensor_num << "]"
  59. << " cannot match the kernel's input size [" << kernel_info->GetInputNum() << "]";
  60. }
  61. MS_LOG(INFO) << "Kernel [ " << index << " ] :" << kernel_info->ToString() << buffer.str();
  62. }
  63. kernel_info_list->clear();
  64. MS_LOG(INFO) << "Node: " << kernel_node->DebugString() << "'s output size : [" << output_tensor_num << "]"
  65. << "input size : [" << input_tensor_num << "] can not match any kernelInfo !";
  66. }
  67. }
  68. bool SelectAicpuReshapeInTaskSink(const CNodePtr &kernel_node) {
  69. MS_EXCEPTION_IF_NULL(kernel_node);
  70. if (AnfAlgo::GetCNodeName(kernel_node) != "Reshape") {
  71. return false;
  72. }
  73. const size_t AicpuReshapeSize = 2;
  74. if (kernel_node->size() != AicpuReshapeSize) {
  75. return false;
  76. }
  77. auto context_ptr = MsContext::GetInstance();
  78. MS_EXCEPTION_IF_NULL(context_ptr);
  79. auto is_task_sink = context_ptr->get_param<bool>(MS_CTX_ENABLE_TASK_SINK);
  80. return is_task_sink;
  81. }
  82. } // namespace
  83. void CheckKernelInfoListEmpty(const std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list,
  84. const std::string &type) {
  85. MS_EXCEPTION_IF_NULL(kernel_info_list);
  86. if (kernel_info_list->empty()) {
  87. MS_LOG(INFO) << "Warning: kernel info list is empty, kernel type: " << type;
  88. }
  89. }
  90. void KernelQueryAll(const CNodePtr &kernel_node,
  91. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  92. MS_EXCEPTION_IF_NULL(kernel_node);
  93. MS_EXCEPTION_IF_NULL(kernel_info_list);
  94. TbeMetadataInfo(kernel_node, kernel_info_list);
  95. if (kernel_info_list->empty()) {
  96. GetRtKelInfo(kernel_node, kernel_info_list);
  97. CheckKernelInfoListEmpty(kernel_info_list, "RT_Kernel");
  98. }
  99. if (kernel_info_list->empty()) {
  100. HcclMetadataInfo(kernel_node, kernel_info_list);
  101. CheckKernelInfoListEmpty(kernel_info_list, "HCCL_Kernel");
  102. }
  103. if (SelectAicpuReshapeInTaskSink(kernel_node)) {
  104. return;
  105. }
  106. if (kernel_info_list->empty()) {
  107. HostMetadataInfo(kernel_node, kernel_info_list);
  108. CheckKernelInfoListEmpty(kernel_info_list, "HOST_Kernel");
  109. }
  110. }
  111. void KernelQuery(const CNodePtr &kernel_node, std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list,
  112. KernelType kernel_type) {
  113. MS_EXCEPTION_IF_NULL(kernel_node);
  114. MS_EXCEPTION_IF_NULL(kernel_info_list);
  115. auto context_ptr = MsContext::GetInstance();
  116. MS_EXCEPTION_IF_NULL(context_ptr);
  117. const PrimitivePtr kPrimProdForceSeA = std::make_shared<Primitive>("ProdForceSeA");
  118. if (IsPrimitiveCNode(kernel_node, kPrimProdForceSeA)) {
  119. kernel_type = KernelType::AKG_KERNEL;
  120. }
  121. const PrimitivePtr kPrimLoadIm2Col = std::make_shared<Primitive>("LoadIm2Col");
  122. if (IsPrimitiveCNode(kernel_node, kPrimLoadIm2Col)) {
  123. kernel_type = KernelType::AKG_KERNEL;
  124. } // use LoadIm2Col only for THOR optimizer
  125. switch (kernel_type) {
  126. case KernelType::AKG_KERNEL:
  127. AkgMetadataInfo(kernel_node, kernel_info_list);
  128. break;
  129. default:
  130. KernelQueryAll(kernel_node, kernel_info_list);
  131. break;
  132. }
  133. // check output
  134. FilterInvalidKernelInfo(kernel_node, kernel_info_list);
  135. }
  136. void AICPUQuery(const CNodePtr &kernel_node, std::vector<std::shared_ptr<kernel::KernelBuildInfo>> *kernel_info_list) {
  137. MS_EXCEPTION_IF_NULL(kernel_node);
  138. MS_EXCEPTION_IF_NULL(kernel_info_list);
  139. kernel_info_list->clear();
  140. AicpuMetadataInfo(kernel_node, kernel_info_list);
  141. FilterInvalidKernelInfo(kernel_node, kernel_info_list);
  142. }
  143. bool IsSupportedByAICPU(const AnfNodePtr &kernel_node, const KernelBuildInfoPtr &select_kernel_build_info) {
  144. MS_EXCEPTION_IF_NULL(kernel_node);
  145. MS_EXCEPTION_IF_NULL(select_kernel_build_info);
  146. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> kernel_info_list;
  147. auto cnode = kernel_node->cast<CNodePtr>();
  148. MS_EXCEPTION_IF_NULL(cnode);
  149. AICPUQuery(cnode, &kernel_info_list);
  150. return std::any_of(kernel_info_list.begin(), kernel_info_list.end(),
  151. [&select_kernel_build_info](const kernel::KernelBuildInfoPtr item) {
  152. MS_EXCEPTION_IF_NULL(item);
  153. return item->IsSimilarityKernelBuildInfo(*select_kernel_build_info);
  154. });
  155. }
  156. bool IsSupportedByAICore(const AnfNodePtr &kernel_node, const KernelBuildInfoPtr &select_kernel_build_info) {
  157. MS_EXCEPTION_IF_NULL(kernel_node);
  158. MS_EXCEPTION_IF_NULL(select_kernel_build_info);
  159. std::vector<std::shared_ptr<kernel::KernelBuildInfo>> kernel_info_list;
  160. auto cnode = kernel_node->cast<CNodePtr>();
  161. MS_EXCEPTION_IF_NULL(cnode);
  162. TbeMetadataInfo(cnode, &kernel_info_list);
  163. return std::any_of(kernel_info_list.begin(), kernel_info_list.end(),
  164. [&select_kernel_build_info](const kernel::KernelBuildInfoPtr item) {
  165. MS_EXCEPTION_IF_NULL(item);
  166. return *item == *select_kernel_build_info;
  167. });
  168. }
  169. } // namespace kernel
  170. } // namespace mindspore