You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

context.cc 11 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "include/api/context.h"
  17. #include <any>
  18. #include <map>
  19. #include <type_traits>
  20. #include "cxx_api/factory.h"
  21. #include "utils/log_adapter.h"
  // String keys under which device options are stored in DeviceInfoContext::Data::params.

  // Device-id key shared by every backend-specific alias below.
  constexpr const char *kModelOptionDeviceID = "mindspore.option.device_id";

  // CPU options.
  constexpr const char *kModelOptionCpuEnableFP16 = "mindspore.option.cpu.enable_fp16";
  constexpr const char *kModelOptionCpuThreadAffinity = "mindspore.option.cpu.thread_affinity";

  // Mali GPU options.
  constexpr const char *kModelOptionMaliGpuEnableFP16 = "mindspore.option.mali_gpu.enable_fp16";

  // Kirin NPU options.
  constexpr const char *kModelOptionKirinNpuFrequency = "mindspore.option.kirin_npu.frequency";

  // Nvidia GPU options.
  constexpr const char *kModelOptionNvidiaGpuDeviceID = kModelOptionDeviceID;
  // "False": Inference with native backend, "True": Inference with Tensor-RT engine, default as "False"
  // NOTE(review): presumably this is the flag the Tensor-RT description applies to - confirm.
  constexpr const char *kModelOptionNvidiaGpuTrtInferMode = "mindspore.option.nvidia_gpu.trt_infer_mode";

  // Ascend910 options.
  constexpr const char *kModelOptionAscend910DeviceID = kModelOptionDeviceID;

  // Ascend310 options.
  constexpr const char *kModelOptionAscend310DeviceID = kModelOptionDeviceID;
  constexpr const char *kModelOptionAscend310DumpCfgPath = "mindspore.option.ascend310.dump_config_file_path";
  // aipp config file
  constexpr const char *kModelOptionAscend310InsertOpCfgPath = "mindspore.option.ascend310.insert_op_config_file_path";
  // nchw or nhwc
  constexpr const char *kModelOptionAscend310InputFormat = "mindspore.option.ascend310.input_format";
  constexpr const char *kModelOptionAscend310InputShapeMap = "mindspore.option.ascend310.input_shape_map";
  // Mandatory while dynamic batch: e.g. "input_op_name1: n1,c2,h3,w4;input_op_name2: n4,c3,h2,w1"
  constexpr const char *kModelOptionAscend310InputShape = "mindspore.option.ascend310.input_shape";
  // "FP32", "UINT8" or "FP16", default as "FP32"
  constexpr const char *kModelOptionAscend310OutputType = "mindspore.option.ascend310.output_type";
  // "force_fp16", "allow_fp32_to_fp16", "must_keep_origin_dtype" or "allow_mix_precision", default as "force_fp16"
  constexpr const char *kModelOptionAscend310PrecisionMode = "mindspore.option.ascend310.precision_mode";
  constexpr const char *kModelOptionAscend310OpSelectImplMode = "mindspore.option.ascend310.op_select_impl_mode";
  // The leading capital 'K' differs from the other keys; the spelling is kept because code in this file uses it.
  constexpr const char *KModelOptionAscend310FusionSwitchCfgPath =
    "mindspore.option.ascend310.fusion_switch_config_file_path";
  constexpr const char *kModelOptionAscend310DynamicBatchSize = "mindspore.option.ascend310.dynamic_batch_size";
  46. namespace mindspore {
  47. class Allocator {};
  48. struct Context::Data {
  49. std::vector<std::shared_ptr<DeviceInfoContext>> device_info_list;
  50. int32_t thread_num;
  51. std::shared_ptr<Allocator> allocator;
  52. };
  53. struct DeviceInfoContext::Data {
  54. std::map<std::string, std::any> params;
  55. };
  56. Context::Context() : data_(std::make_shared<Data>()) {}
  57. template <class T, typename U = std::remove_cv_t<std::remove_reference_t<T>>>
  58. static const U &GetValue(const std::shared_ptr<DeviceInfoContext::Data> &data, const std::string &key) {
  59. static U empty_result;
  60. if (data == nullptr) {
  61. return empty_result;
  62. }
  63. auto iter = data->params.find(key);
  64. if (iter == data->params.end()) {
  65. return empty_result;
  66. }
  67. const std::any &value = iter->second;
  68. if (value.type() != typeid(U)) {
  69. return empty_result;
  70. }
  71. return std::any_cast<const U &>(value);
  72. }
  73. void Context::SetThreadNum(int32_t thread_num) {
  74. MS_EXCEPTION_IF_NULL(data_);
  75. data_->thread_num = thread_num;
  76. }
  77. int32_t Context::GetThreadNum() const {
  78. MS_EXCEPTION_IF_NULL(data_);
  79. return data_->thread_num;
  80. }
  81. void Context::SetAllocator(const std::shared_ptr<Allocator> &allocator) {
  82. MS_EXCEPTION_IF_NULL(data_);
  83. data_->allocator = allocator;
  84. }
  85. std::shared_ptr<Allocator> Context::GetAllocator() const {
  86. MS_EXCEPTION_IF_NULL(data_);
  87. return data_->allocator;
  88. }
  89. std::vector<std::shared_ptr<DeviceInfoContext>> &Context::MutableDeviceInfo() {
  90. MS_EXCEPTION_IF_NULL(data_);
  91. return data_->device_info_list;
  92. }
  93. DeviceInfoContext::DeviceInfoContext() : data_(std::make_shared<Data>()) {}
  94. void CPUDeviceInfo::SetEnableFP16(bool is_fp16) {
  95. MS_EXCEPTION_IF_NULL(data_);
  96. data_->params[kModelOptionCpuEnableFP16] = is_fp16;
  97. }
  98. bool CPUDeviceInfo::GetEnableFP16() const {
  99. MS_EXCEPTION_IF_NULL(data_);
  100. return GetValue<bool>(data_, kModelOptionCpuEnableFP16);
  101. }
  102. void CPUDeviceInfo::SetThreadAffinity(int affinity) {
  103. MS_EXCEPTION_IF_NULL(data_);
  104. data_->params[kModelOptionCpuThreadAffinity] = affinity;
  105. }
  106. int CPUDeviceInfo::GetThreadAffinity() const {
  107. MS_EXCEPTION_IF_NULL(data_);
  108. return GetValue<bool>(data_, kModelOptionCpuThreadAffinity);
  109. }
  110. void MaliGPUDeviceInfo::SetEnableFP16(bool is_fp16) {
  111. MS_EXCEPTION_IF_NULL(data_);
  112. data_->params[kModelOptionMaliGpuEnableFP16] = is_fp16;
  113. }
  114. bool MaliGPUDeviceInfo::GetEnableFP16() const {
  115. MS_EXCEPTION_IF_NULL(data_);
  116. return GetValue<bool>(data_, kModelOptionMaliGpuEnableFP16);
  117. }
  118. void KirinNPUDeviceInfo::SetFrequency(int frequency) {
  119. MS_EXCEPTION_IF_NULL(data_);
  120. data_->params[kModelOptionKirinNpuFrequency] = frequency;
  121. }
  122. int KirinNPUDeviceInfo::GetFrequency() const {
  123. MS_EXCEPTION_IF_NULL(data_);
  124. return GetValue<int>(data_, kModelOptionKirinNpuFrequency);
  125. }
  126. void NvidiaGPUDeviceInfo::SetDeviceID(uint32_t device_id) {
  127. MS_EXCEPTION_IF_NULL(data_);
  128. data_->params[kModelOptionNvidiaGpuDeviceID] = device_id;
  129. }
  130. uint32_t NvidiaGPUDeviceInfo::GetDeviceID() const {
  131. MS_EXCEPTION_IF_NULL(data_);
  132. return GetValue<uint32_t>(data_, kModelOptionNvidiaGpuDeviceID);
  133. }
  134. void NvidiaGPUDeviceInfo::SetGpuTrtInferMode(bool gpu_trt_infer_mode) {
  135. MS_EXCEPTION_IF_NULL(data_);
  136. data_->params[kModelOptionNvidiaGpuTrtInferMode] = gpu_trt_infer_mode;
  137. }
  138. bool NvidiaGPUDeviceInfo::GetGpuTrtInferMode() const {
  139. MS_EXCEPTION_IF_NULL(data_);
  140. return GetValue<bool>(data_, kModelOptionNvidiaGpuTrtInferMode);
  141. }
  142. void Ascend910DeviceInfo::SetDeviceID(uint32_t device_id) {
  143. MS_EXCEPTION_IF_NULL(data_);
  144. data_->params[kModelOptionAscend910DeviceID] = device_id;
  145. }
  146. uint32_t Ascend910DeviceInfo::GetDeviceID() const {
  147. MS_EXCEPTION_IF_NULL(data_);
  148. return GetValue<uint32_t>(data_, kModelOptionAscend910DeviceID);
  149. }
  150. void Ascend310DeviceInfo::SetDeviceID(uint32_t device_id) {
  151. MS_EXCEPTION_IF_NULL(data_);
  152. data_->params[kModelOptionAscend310DeviceID] = device_id;
  153. }
  154. uint32_t Ascend310DeviceInfo::GetDeviceID() const {
  155. MS_EXCEPTION_IF_NULL(data_);
  156. return GetValue<uint32_t>(data_, kModelOptionAscend310DeviceID);
  157. }
  158. void Ascend310DeviceInfo::SetDumpConfigPath(const std::vector<char> &cfg_path) {
  159. MS_EXCEPTION_IF_NULL(data_);
  160. data_->params[kModelOptionAscend310DumpCfgPath] = CharToString(cfg_path);
  161. }
  162. std::vector<char> Ascend310DeviceInfo::GetDumpConfigPathChar() const {
  163. MS_EXCEPTION_IF_NULL(data_);
  164. const std::string &ref = GetValue<std::string>(data_, kModelOptionAscend310DeviceID);
  165. return StringToChar(ref);
  166. }
  167. void Ascend310DeviceInfo::SetInsertOpConfigPath(const std::vector<char> &cfg_path) {
  168. MS_EXCEPTION_IF_NULL(data_);
  169. data_->params[kModelOptionAscend310InsertOpCfgPath] = CharToString(cfg_path);
  170. }
  171. std::vector<char> Ascend310DeviceInfo::GetInsertOpConfigPathChar() const {
  172. MS_EXCEPTION_IF_NULL(data_);
  173. const std::string &ref = GetValue<std::string>(data_, kModelOptionAscend310InsertOpCfgPath);
  174. return StringToChar(ref);
  175. }
  176. void Ascend310DeviceInfo::SetInputFormat(const std::vector<char> &format) {
  177. MS_EXCEPTION_IF_NULL(data_);
  178. data_->params[kModelOptionAscend310InputFormat] = CharToString(format);
  179. }
  180. std::vector<char> Ascend310DeviceInfo::GetInputFormatChar() const {
  181. MS_EXCEPTION_IF_NULL(data_);
  182. const std::string &ref = GetValue<std::string>(data_, kModelOptionAscend310InputFormat);
  183. return StringToChar(ref);
  184. }
  185. void Ascend310DeviceInfo::SetInputShape(const std::vector<char> &shape) {
  186. MS_EXCEPTION_IF_NULL(data_);
  187. data_->params[kModelOptionAscend310InputShape] = CharToString(shape);
  188. }
  189. std::vector<char> Ascend310DeviceInfo::GetInputShapeChar() const {
  190. MS_EXCEPTION_IF_NULL(data_);
  191. const std::string &ref = GetValue<std::string>(data_, kModelOptionAscend310InputShape);
  192. return StringToChar(ref);
  193. }
  194. void Ascend310DeviceInfo::SetDynamicBatchSize(const std::vector<size_t> &dynamic_batch_size) {
  195. MS_EXCEPTION_IF_NULL(data_);
  196. std::string batchs = "";
  197. for (size_t i = 0; i < dynamic_batch_size.size(); ++i) {
  198. if (i != 0) {
  199. batchs.push_back(',');
  200. }
  201. batchs += std::to_string(dynamic_batch_size[i]);
  202. }
  203. data_->params[kModelOptionAscend310DynamicBatchSize] = batchs;
  204. }
  205. std::vector<char> Ascend310DeviceInfo::GetDynamicBatchSizeChar() const {
  206. MS_EXCEPTION_IF_NULL(data_);
  207. const std::string &ref = GetValue<std::string>(data_, kModelOptionAscend310DynamicBatchSize);
  208. return StringToChar(ref);
  209. }
  210. void Ascend310DeviceInfo::SetPrecisionMode(const std::vector<char> &precision_mode) {
  211. MS_EXCEPTION_IF_NULL(data_);
  212. data_->params[kModelOptionAscend310PrecisionMode] = CharToString(precision_mode);
  213. }
  214. std::vector<char> Ascend310DeviceInfo::GetPrecisionModeChar() const {
  215. MS_EXCEPTION_IF_NULL(data_);
  216. const std::string &ref = GetValue<std::string>(data_, kModelOptionAscend310PrecisionMode);
  217. return StringToChar(ref);
  218. }
  219. void Ascend310DeviceInfo::SetOpSelectImplMode(const std::vector<char> &op_select_impl_mode) {
  220. MS_EXCEPTION_IF_NULL(data_);
  221. data_->params[kModelOptionAscend310OpSelectImplMode] = CharToString(op_select_impl_mode);
  222. }
  223. std::vector<char> Ascend310DeviceInfo::GetOpSelectImplModeChar() const {
  224. MS_EXCEPTION_IF_NULL(data_);
  225. const std::string &ref = GetValue<std::string>(data_, kModelOptionAscend310OpSelectImplMode);
  226. return StringToChar(ref);
  227. }
  228. void Ascend310DeviceInfo::SetFusionSwitchConfigPath(const std::vector<char> &cfg_path) {
  229. MS_EXCEPTION_IF_NULL(data_);
  230. data_->params[KModelOptionAscend310FusionSwitchCfgPath] = CharToString(cfg_path);
  231. }
  232. std::vector<char> Ascend310DeviceInfo::GetFusionSwitchConfigPathChar() const {
  233. MS_EXCEPTION_IF_NULL(data_);
  234. const std::string &ref = GetValue<std::string>(data_, KModelOptionAscend310FusionSwitchCfgPath);
  235. return StringToChar(ref);
  236. }
  237. void Ascend310DeviceInfo::SetInputShapeMap(const std::map<int, std::vector<int>> &shape) {
  238. MS_EXCEPTION_IF_NULL(data_);
  239. data_->params[kModelOptionAscend310InputShapeMap] = shape;
  240. }
  241. std::map<int, std::vector<int>> Ascend310DeviceInfo::GetInputShapeMap() const {
  242. MS_EXCEPTION_IF_NULL(data_);
  243. return GetValue<std::map<int, std::vector<int>>>(data_, kModelOptionAscend310InputShapeMap);
  244. }
  245. void Ascend310DeviceInfo::SetOutputType(enum DataType output_type) {
  246. MS_EXCEPTION_IF_NULL(data_);
  247. data_->params[kModelOptionAscend310OutputType] = output_type;
  248. }
  249. enum DataType Ascend310DeviceInfo::GetOutputType() const {
  250. MS_EXCEPTION_IF_NULL(data_);
  251. return GetValue<enum DataType>(data_, kModelOptionAscend310OutputType);
  252. }
  253. } // namespace mindspore