You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

helper.cpp 26 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714
  1. /**
  2. * \file imperative/python/src/helper.cpp
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2020 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. */
  11. #include "./helper.h"
  12. #include <pybind11/eval.h>
  13. #include "megbrain/graph/exc_extra_info.h"
  14. #include "megbrain/graph/event.h"
  15. #include "megbrain/graph/cg.h"
  16. #include "megbrain/tensor.h"
  17. #include "megbrain/utils/mempool.h"
  18. #include "./numpy_dtypes.h"
  19. namespace py = pybind11;
  20. PyTaskDipatcher py_task_q = {};
  21. py::module submodule(py::module parent, const char* name, const char* doc) {
  22. auto m = parent.def_submodule(name, doc);
  23. m.attr("__package__") = parent.attr("__name__");
  24. m.attr("__builtins__") = py::module::import("builtins");
  25. return m;
  26. }
  27. py::module rel_import(py::str name, py::module m, int level) {
  28. py::object import = py::module::import("builtins").attr("__import__");
  29. return import(name, m.attr("__dict__"), py::arg("level")=level);
  30. }
  31. /*
  32. * demangle typeid, see
  33. * http://stackoverflow.com/questions/281818/unmangling-the-result-of-stdtype-infoname
  34. */
  35. #ifdef __GNUG__
  36. #include <cxxabi.h>
  37. #include <cstdlib>
  38. #include <memory>
  39. namespace {
  40. std::string demangle_typeid(const char* name) {
  41. int status = -4; // some arbitrary value to eliminate the compiler warning
  42. // enable c++11 by passing the flag -std=c++11 to g++
  43. std::unique_ptr<char, void(*)(void*)> res {
  44. abi::__cxa_demangle(name, nullptr, nullptr, &status),
  45. std::free
  46. };
  47. return (status==0) ? res.get() : name ;
  48. }
  49. } // namespace
  50. #else
  51. namespace {
  52. // does nothing if not g++
  53. std::string demangle_typeid(const char* name) {
  54. return name;
  55. }
  56. }
  57. #endif
  58. using namespace mgb;
  59. using namespace cg;
  60. namespace {
  61. std::string repr_pyobj(PyObject *obj) {
  62. if (!obj)
  63. return "<null PyObject>";
  64. PYTHON_GIL;
  65. auto str = PyObject_Repr(obj);
  66. if (!str)
  67. return ssprintf("<PyObject at %p (repr failed)>", obj);
  68. std::string ret{PyUnicode_AsUTF8(str)};
  69. Py_DECREF(str);
  70. return ret;
  71. }
  72. template<typename T>
  73. std::string typeid_name(const T &t) {
  74. return demangle_typeid(typeid(t).name());
  75. }
  76. } // anonymous namespace
  77. /* ============== PyExceptionForward ============== */
  78. PyExceptionForward::~PyExceptionForward() {
  79. PYTHON_GIL;
  80. PyObjRefKeeper::deleter(m_type);
  81. PyObjRefKeeper::deleter(m_value);
  82. PyObjRefKeeper::deleter(m_traceback);
  83. }
  84. void PyExceptionForward::restore() {
  85. PyErr_Restore(m_type, m_value, m_traceback);
  86. m_type = m_value = m_traceback = nullptr;
  87. }
  88. void PyExceptionForward::throw_() {
  89. PyObject *etype, *obj, *trace;
  90. PyErr_Fetch(&etype, &obj, &trace);
  91. PyErr_NormalizeException(&etype, &obj, &trace);
  92. std::string msg{"python exception"};
  93. bool succ = false;
  94. if (etype && obj && trace) {
  95. auto run = [&]() {
  96. #define DEF(name, expr) \
  97. PyObjRefKeeper name{expr}; \
  98. if (!name.get()) \
  99. return
  100. DEF(mod, PyImport_ImportModule("traceback"));
  101. DEF(result, PyObject_CallMethod(mod.get(), "format_exception",
  102. "(OOO)", etype, obj, trace));
  103. if (!PyList_Check(result.get()))
  104. return;
  105. auto size = PyList_Size(result.get());
  106. msg.append(":\n");
  107. for (Py_ssize_t i = 0; i < size; ++i) {
  108. msg.append(" ");
  109. msg.append(PyUnicode_AsUTF8(PyList_GetItem(result.get(), i)));
  110. }
  111. msg.pop_back(); // remove last \n
  112. succ = true;
  113. #undef DEF
  114. };
  115. run();
  116. }
  117. if (!succ) {
  118. PyObject* obj_str_py;
  119. if (obj && (obj_str_py = PyObject_Repr(obj))) {
  120. msg.append(" with message ");
  121. msg.append(PyUnicode_AsUTF8(obj_str_py));
  122. Py_DECREF(obj_str_py);
  123. } else {
  124. msg.append(" with unknown message");
  125. }
  126. }
  127. // throwing exception may cause abort due to unknown reasons; so we first
  128. // log the message
  129. mgb_log_error("caught exception from python callback: %s", msg.c_str());
  130. fflush(stdout);
  131. fflush(stderr);
  132. throw PyExceptionForward{etype, obj, trace, msg};
  133. }
  134. /* ============== namespace npy ============== */
  135. namespace npy {
  136. int to_mgb_supported_dtype_raw(int dtype) {
  137. if (dtype == NPY_INT64)
  138. return NPY_INT32;
  139. if (dtype == NPY_FLOAT64)
  140. return NPY_FLOAT32;
  141. return dtype;
  142. }
  143. #define FOREACH_NPY_DTYPE_PAIR(cb) \
  144. cb(Uint8, NPY_UINT8) \
  145. cb(Int8, NPY_INT8) \
  146. cb(Int16, NPY_INT16) \
  147. cb(Int32, NPY_INT32) \
  148. cb(Float16, NPY_FLOAT16) \
  149. cb(Float32, NPY_FLOAT32) \
  150. cb(Bool, NPY_BOOL)
  151. #define FOREACH_NPY_MGB_DTYPE_PAIR(cb) \
  152. FOREACH_NPY_DTYPE_PAIR(cb) \
  153. FOREACH_MGB_DTYPE_PAIR(cb)
  154. //! convert megbrain dtype to numpy dtype
  155. int dtype_mgb2np_raw(DType dtype) {
  156. mgb_assert(dtype.valid(), "attempt to convert from invalid dtype");
  157. switch (dtype.enumv()) {
  158. #define cb(_m, _n) \
  159. case DTypeEnum::_m: \
  160. return _n;
  161. FOREACH_NPY_MGB_DTYPE_PAIR(cb)
  162. #undef cb
  163. default:
  164. break;
  165. }
  166. throw ConversionError(ssprintf(
  167. "can not convert dtype %s to numpy dtype", dtype.name()));
  168. }
  169. //! Convert MegBrain DType to NumPy DType descriptor, the caller receives a new
  170. //! reference to the descriptor.
  171. std::unique_ptr<PyArray_Descr, PyArrayDescrDeleter> dtype_mgb2np_descr(
  172. DType dtype) {
  173. PYTHON_GIL;
  174. mgb_assert(dtype.valid(), "attempt to convert from invalid dtype");
  175. auto build_mgb_dtype_dict =
  176. [](const char* name,
  177. const std::vector<std::pair<const char*, PyObject*>>& data) {
  178. PyObject* metadata = PyDict_New();
  179. PyObject* mgb_dtype_metadata = PyDict_New();
  180. PyDict_SetItemString(mgb_dtype_metadata, "name",
  181. PyUnicode_FromString(name));
  182. for (const auto& d : data) {
  183. PyDict_SetItemString(mgb_dtype_metadata, d.first, d.second);
  184. }
  185. PyDict_SetItemString(metadata, "mgb_dtype", mgb_dtype_metadata);
  186. return metadata;
  187. };
  188. if (dtype.has_param()) {
  189. PyArray_Descr* type_descr;
  190. switch (dtype.enumv()) {
  191. case DTypeEnum::Quantized4Asymm: {
  192. auto& param = dtype.param<dtype::Quantized4Asymm>();
  193. type_descr = PyArray_DescrNewFromType(NPY_UINT8);
  194. type_descr->metadata = build_mgb_dtype_dict(
  195. DTypeTrait<dtype::Quantized4Asymm>::name,
  196. {{"scale", PyFloat_FromDouble(param.scale)},
  197. {"zero_point", PyLong_FromLong(param.zero_point)}});
  198. break;
  199. }
  200. case DTypeEnum::QuantizedS4: {
  201. auto& param = dtype.param<dtype::QuantizedS4>();
  202. type_descr = PyArray_DescrNewFromType(NPY_INT8);
  203. type_descr->metadata = build_mgb_dtype_dict(
  204. DTypeTrait<dtype::QuantizedS4>::name,
  205. {{"scale", PyFloat_FromDouble(param.scale)}});
  206. break;
  207. }
  208. case DTypeEnum::Quantized8Asymm: {
  209. auto& param = dtype.param<dtype::Quantized8Asymm>();
  210. type_descr = PyArray_DescrNewFromType(NPY_UINT8);
  211. type_descr->metadata = build_mgb_dtype_dict(
  212. DTypeTrait<dtype::Quantized8Asymm>::name,
  213. {{"scale", PyFloat_FromDouble(param.scale)},
  214. {"zero_point", PyLong_FromLong(param.zero_point)}});
  215. break;
  216. }
  217. case DTypeEnum::QuantizedS8: {
  218. auto& param = dtype.param<dtype::QuantizedS8>();
  219. type_descr = PyArray_DescrNewFromType(NPY_INT8);
  220. type_descr->metadata = build_mgb_dtype_dict(
  221. DTypeTrait<dtype::QuantizedS8>::name,
  222. {{"scale", PyFloat_FromDouble(param.scale)}});
  223. break;
  224. }
  225. case DTypeEnum::QuantizedS32: {
  226. auto& param = dtype.param<dtype::QuantizedS32>();
  227. type_descr = PyArray_DescrNewFromType(NPY_INT32);
  228. type_descr->metadata = build_mgb_dtype_dict(
  229. DTypeTrait<dtype::QuantizedS32>::name,
  230. {{"scale", PyFloat_FromDouble(param.scale)}});
  231. break;
  232. }
  233. default:
  234. mgb_throw(ConversionError, "unhandled parameterized DType %s",
  235. dtype.name());
  236. }
  237. return std::unique_ptr<PyArray_Descr, PyArrayDescrDeleter>(type_descr);
  238. }
  239. PyArray_Descr* basic_descr = PyArray_DescrFromType(dtype_mgb2np_raw(dtype));
  240. mgb_assert(basic_descr != nullptr,
  241. "failed to convert expected dtype to numpy type descriptor");
  242. return std::unique_ptr<PyArray_Descr, PyArrayDescrDeleter>(basic_descr);
  243. }
  244. DType dtype_np2mgb_raw(int npt) {
  245. switch (npt) {
  246. #define cb(_m, _n) \
  247. case _n: \
  248. return dtype::_m();
  249. FOREACH_NPY_DTYPE_PAIR(cb)
  250. #undef cb
  251. }
  252. #define cb(_m, _n) \
  253. if (_n == npt) return dtype::_m();
  254. FOREACH_MGB_DTYPE_PAIR(cb)
  255. #undef cb
  256. PYTHON_GIL;
  257. std::string msg;
  258. auto py_obj = PyArray_TypeObjectFromType(npt);
  259. if (!py_obj) {
  260. msg = ssprintf("unknown numpy dtype enum %d", npt);
  261. } else {
  262. msg = ssprintf("unsupported numpy dtype %s",
  263. repr_pyobj(py_obj).c_str());
  264. }
  265. Py_DECREF(py_obj);
  266. throw ConversionError(msg);
  267. }
  268. DType dtype_np2mgb_descr(PyArray_Descr* descr) {
  269. PYTHON_GIL;
  270. auto handle_parameterized_dtype = [](PyObject* metadata) -> DType {
  271. mgb_assert(PyDict_Check(metadata),
  272. "Invalid parameterized DType metadata: should be a dict");
  273. PyObject* dtype_name_py = PyDict_GetItemString(metadata, "name");
  274. mgb_assert(
  275. PyUnicode_Check(dtype_name_py),
  276. "Invalid parameterized DType metadata: name should be a str");
  277. std::string dtype_name(PyUnicode_AsUTF8(dtype_name_py));
  278. if (dtype_name == "Quantized8Asymm") {
  279. PyObject* scale_py = PyDict_GetItemString(metadata, "scale");
  280. PyObject* zero_point_py =
  281. PyDict_GetItemString(metadata, "zero_point");
  282. mgb_assert(scale_py && zero_point_py,
  283. "Invalid Quantized8Asymm metadata: missing scale or "
  284. "zero_point.");
  285. mgb_assert(
  286. PyFloat_Check(scale_py),
  287. "Invalid Quantized8Asymm metadata: scale should be float");
  288. mgb_assert(PyLong_Check(zero_point_py),
  289. "Invalid Quantized8Asymm metadata: zero_point should be "
  290. "integer");
  291. auto zero_point = PyLong_AS_LONG(zero_point_py);
  292. mgb_assert(zero_point >= 0 && zero_point < 256,
  293. "Invalid Quantized8Asymm metadata: zero_point should be "
  294. "in [0, 256)");
  295. return dtype::Quantized8Asymm(
  296. static_cast<float>(PyFloat_AS_DOUBLE(scale_py)),
  297. static_cast<uint8_t>(zero_point));
  298. }
  299. if (dtype_name == "Quantized4Asymm") {
  300. PyObject* scale_py = PyDict_GetItemString(metadata, "scale");
  301. PyObject* zero_point_py =
  302. PyDict_GetItemString(metadata, "zero_point");
  303. mgb_assert(scale_py && zero_point_py,
  304. "Invalid Quantized4Asymm metadata: missing scale or "
  305. "zero_point.");
  306. mgb_assert(
  307. PyFloat_Check(scale_py),
  308. "Invalid Quantized4Asymm metadata: scale should be float");
  309. mgb_assert(PyLong_Check(zero_point_py),
  310. "Invalid Quantized4Asymm metadata: zero_point should be "
  311. "integer");
  312. auto zero_point = PyLong_AS_LONG(zero_point_py);
  313. mgb_assert(zero_point >= 0 && zero_point < 15,
  314. "Invalid Quantized4Asymm metadata: zero_point should be "
  315. "in [0, 15)");
  316. return dtype::Quantized4Asymm(
  317. static_cast<float>(PyFloat_AS_DOUBLE(scale_py)),
  318. static_cast<uint8_t>(zero_point));
  319. }
  320. if (dtype_name == "QuantizedS32" || dtype_name == "QuantizedS8" ||
  321. dtype_name == "QuantizedS4") {
  322. PyObject* scale_py = PyDict_GetItemString(metadata, "scale");
  323. mgb_assert(scale_py, "Invalid metadata: missing scale");
  324. mgb_assert(PyFloat_Check(scale_py),
  325. "Invalid metadata: scale should be float");
  326. float scale = static_cast<float>(PyFloat_AS_DOUBLE(scale_py));
  327. if (dtype_name == "QuantizedS32") {
  328. return dtype::QuantizedS32(scale);
  329. } else if (dtype_name == "QuantizedS8"){
  330. return dtype::QuantizedS8(scale);
  331. } else {
  332. return dtype::QuantizedS4(scale);
  333. }
  334. }
  335. throw ConversionError(
  336. ssprintf("Unknown parameterized DType: %s", dtype_name.c_str())
  337. .c_str());
  338. };
  339. PyObject* dtype_metadata;
  340. if (descr->metadata && PyDict_Check(descr->metadata) &&
  341. (dtype_metadata = PyDict_GetItemString(descr->metadata, "mgb_dtype"))) {
  342. return handle_parameterized_dtype(dtype_metadata);
  343. }
  344. return dtype_np2mgb_raw(descr->type_num);
  345. }
  346. HostTensorND lowbit_ndarray_to_host_tensor(
  347. CompNode comp_node, TensorLayout &layout, PyArrayObject *input) {
  348. auto src_ptr = reinterpret_cast<dt_byte*>(PyArray_DATA(input));
  349. if (!layout.ndim) {
  350. // numpy scalar
  351. mgb_assert(src_ptr, "can not convert from null numpy array");
  352. layout.init_contiguous_stride({1});
  353. } else {
  354. mgb_assert(layout.ndim && layout.ndim <= TensorShape::MAX_NDIM,
  355. "unsupported ndim %zu", layout.ndim);
  356. for (size_t i = 0; i < layout.ndim; ++ i) {
  357. layout.shape[i] = PyArray_SHAPE(input)[i];
  358. layout.stride[i] = PyArray_STRIDE(input, i);
  359. mgb_assert(layout.shape[i], "zero shape not supported");
  360. }
  361. mgb_assert(layout.is_contiguous());
  362. }
  363. HostTensorND ret{comp_node, layout};
  364. lowbit_memcpy_byte2compact(layout.dtype, ret.raw_ptr(), src_ptr,
  365. layout.total_nr_elems());
  366. return ret;
  367. }
  368. /*!
  369. * \brief convert a python object to tensor and try to borrow memory if the
  370. * original object is a contiguous numpy array
  371. * \param dtype see np2tensor
  372. * \return the megbrain tensor, and whether memory is borrowed
  373. */
  374. std::pair<HostTensorND, bool> np2tensor_try_borrow(
  375. PyObject *obj, const npy::Meth& meth, DType dtype) {
  376. auto dest_cn = meth.dest_cn_;
  377. mgb_assert(dest_cn.valid());
  378. PYTHON_GIL;
  379. PyArray_Descr* expected_descr = nullptr;
  380. if (dtype.valid()) {
  381. // The reference to expected_descr will be stealed later.
  382. expected_descr = dtype_mgb2np_descr(dtype).release();
  383. }
  384. // make result from PyArrayObject; its reference may be stolen
  385. auto make_from_arr = [&](PyArrayObject *input, bool allow_borrow) {
  386. TensorLayout layout;
  387. layout.dtype = dtype_np2mgb_descr(PyArray_DESCR(input));
  388. if (dtype.valid())
  389. mgb_assert(dtype == layout.dtype);
  390. layout.ndim = PyArray_NDIM(input);
  391. if (layout.dtype.is_low_bit()) {
  392. auto ret = lowbit_ndarray_to_host_tensor(dest_cn, layout, input);
  393. if (meth.dest_tensor_) {
  394. meth.dest_tensor_->copy_from(ret);
  395. ret = *meth.dest_tensor_;
  396. }
  397. return std::make_pair(ret, false);
  398. }
  399. auto data = reinterpret_cast<dt_byte*>(PyArray_DATA(input));
  400. if (!layout.ndim) {
  401. // numpy scalar
  402. mgb_assert(data, "can not convert from null numpy array");
  403. layout.init_contiguous_stride({1});
  404. } else {
  405. mgb_assert(layout.ndim && layout.ndim <= TensorShape::MAX_NDIM,
  406. "unsupported ndim %zu", layout.ndim);
  407. auto dsize = layout.dtype.size();
  408. bool is_empty = false;
  409. for (size_t i = 0; i < layout.ndim; ++ i) {
  410. layout.shape[i] = PyArray_SHAPE(input)[i];
  411. layout.stride[i] = PyArray_STRIDE(input, i);
  412. if (!layout.shape[i]) {
  413. is_empty = true;
  414. }
  415. mgb_assert(layout.stride[i] % dsize == 0,
  416. "bad stride %zd", layout.stride[i]);
  417. layout.stride[i] /= dsize;
  418. }
  419. mgb_assert(is_empty || layout.is_contiguous());
  420. }
  421. if (!meth.dest_tensor_ && allow_borrow) {
  422. Py_INCREF(input);
  423. PyObjRefKeeper ref_obj_cvt{reinterpret_cast<PyObject*>(input)};
  424. HostTensorStorage storage;
  425. auto input_ptr = ref_obj_cvt.make_shared(data);
  426. storage.reset(dest_cn, layout.span().high_byte, input_ptr);
  427. HostTensorND ret;
  428. ret.reset(storage, layout);
  429. return std::make_pair(ret, true);
  430. } else {
  431. auto storage = HostTensorStorage(dest_cn);
  432. storage.ensure_size(layout.span().dist_byte());
  433. memcpy(storage.ptr(), data, layout.span().dist_byte());
  434. HostTensorND ret{dest_cn, layout.dtype};
  435. if (meth.dest_tensor_) {
  436. meth.dest_tensor_->reset(storage, layout);
  437. return std::make_pair(*meth.dest_tensor_, false);
  438. } else {
  439. HostTensorND ret;
  440. ret.reset(storage, layout);
  441. return std::make_pair(ret, false);
  442. }
  443. }
  444. };
  445. PyArrayObject *obj_as_arr = nullptr;
  446. do {
  447. // check contiguous and dtype, and borrow mem if ok
  448. if (!PyArray_Check(obj))
  449. break;
  450. obj_as_arr = reinterpret_cast<PyArrayObject*>(obj);
  451. int typenum = PyArray_DTYPE(obj_as_arr)->type_num;
  452. // We have to check dtype.valid() and typenum first to avoid
  453. // accidentally trigger ConversionError on incompatible dtypes which can
  454. // be automatically converted into comptaible ones (e.g. float64).
  455. if (dtype.valid() &&
  456. (expected_descr->type_num != typenum ||
  457. dtype_np2mgb_descr(PyArray_DTYPE(obj_as_arr)) != dtype))
  458. break;
  459. if (typenum != to_mgb_supported_dtype_raw(typenum)) {
  460. mgb_assert(!dtype.valid() && expected_descr == nullptr);
  461. expected_descr =
  462. PyArray_DescrFromType(to_mgb_supported_dtype_raw(typenum));
  463. break;
  464. }
  465. if (PyArray_ISCARRAY_RO(obj_as_arr)) {
  466. return make_from_arr(obj_as_arr, true);
  467. }
  468. } while(0);
  469. constexpr auto NP_FLAGS = NPY_ARRAY_C_CONTIGUOUS | NPY_ARRAY_FORCECAST;
  470. PyObject *obj_cvt;
  471. if (obj_as_arr) {
  472. obj_cvt = PyArray_FromArray(obj_as_arr, expected_descr, NP_FLAGS);
  473. } else {
  474. obj_cvt = PyArray_FromAny(obj, expected_descr, 0, 0, NP_FLAGS, nullptr);
  475. }
  476. if (obj_cvt) {
  477. // convert to mgb supported dtype
  478. auto arr = reinterpret_cast<PyArrayObject*>(obj_cvt);
  479. int dt0 = PyArray_TYPE(arr), dt1 = to_mgb_supported_dtype_raw(dt0);
  480. if (dt0 != dt1) {
  481. mgb_assert(expected_descr == nullptr);
  482. expected_descr = PyArray_DescrFromType(dt1);
  483. mgb_assert(expected_descr);
  484. auto obj_cvt_new = PyArray_FromAny(
  485. obj_cvt, expected_descr, 0, 0, NP_FLAGS, nullptr);
  486. Py_DECREF(obj_cvt);
  487. obj_cvt = obj_cvt_new;
  488. }
  489. }
  490. if (!obj_cvt) {
  491. if (PyErr_Occurred()) {
  492. PyExceptionForward::throw_();
  493. }
  494. throw ConversionError(ssprintf("can not convert to numpy array from %s",
  495. repr_pyobj(obj).c_str()));
  496. }
  497. auto ret = make_from_arr(reinterpret_cast<PyArrayObject*>(obj_cvt), false);
  498. Py_DECREF(obj_cvt);
  499. return ret;
  500. }
  501. //! hold a reference to HostTensorND
  502. class HostTensorNDRefHolder final: public NonCopyableObj {
  503. HostTensorND m_val;
  504. static MemPool<HostTensorNDRefHolder> sm_mem_pool;
  505. friend class MemPool<HostTensorNDRefHolder>;
  506. HostTensorNDRefHolder(const HostTensorND &v):
  507. m_val{v}
  508. {
  509. }
  510. public:
  511. static HostTensorNDRefHolder* alloc(const HostTensorND &v) {
  512. return sm_mem_pool.alloc(v);
  513. }
  514. static void free(HostTensorNDRefHolder *p) {
  515. return sm_mem_pool.free(p);
  516. }
  517. };
  518. MemPool<HostTensorNDRefHolder> HostTensorNDRefHolder::sm_mem_pool;
  519. void ndarray_shared_from_tensor_py_capsule_dtor(PyObject *cap) {
  520. auto ptr = PyCapsule_GetPointer(cap, "HostTensorND");
  521. mgb_assert(ptr, "not a PyCapsule: %s", repr_pyobj(cap).c_str());
  522. HostTensorNDRefHolder::free(static_cast<HostTensorNDRefHolder*>(ptr));
  523. }
  524. PyObject* ndarray_from_tensor(
  525. const HostTensorND &val, ShareType share_type) {
  526. if (!val.layout().is_contiguous() && !val.shape().is_empty()) {
  527. mgb_assert(share_type != ShareType::MUST_SHARE);
  528. HostTensorND contig;
  529. contig.copy_from(val);
  530. return ndarray_from_tensor(contig, ShareType::TRY_SHARE);
  531. }
  532. PYTHON_GIL;
  533. npy_intp dims[TensorLayout::MAX_NDIM];
  534. for (size_t i = 0; i < val.layout().ndim; ++ i)
  535. dims[i] = val.shape()[i];
  536. PyObject* ret = nullptr;
  537. auto alloc_new_ret = [&]() {
  538. mgb_assert(!ret);
  539. ret = PyArray_NewFromDescr(
  540. &PyArray_Type, dtype_mgb2np_descr(val.dtype()).release(),
  541. val.layout().ndim, dims, nullptr, nullptr, 0, nullptr);
  542. mgb_assert(ret, "failed to allocate array");
  543. mgb_assert(PyArray_Check(ret));
  544. return PyArray_DATA(reinterpret_cast<PyArrayObject*>(ret));
  545. };
  546. if (val.dtype().is_low_bit()) {
  547. mgb_assert(share_type != ShareType::MUST_SHARE,
  548. "can not share memory for lowbit dtype");
  549. lowbit_memcpy_compact2byte(val.dtype(), alloc_new_ret(), val.raw_ptr(),
  550. val.layout().total_nr_elems());
  551. } else if (share_type == ShareType::MUST_UNSHARE) {
  552. memcpy(alloc_new_ret(), val.raw_ptr(), val.layout().span().dist_byte());
  553. } else {
  554. // share data
  555. ret = PyArray_NewFromDescr(
  556. &PyArray_Type, dtype_mgb2np_descr(val.dtype()).release(),
  557. val.layout().ndim, dims, nullptr,
  558. const_cast<dt_byte*>(val.raw_ptr()), 0, nullptr);
  559. mgb_assert(ret, "failed to alloc ndarray");
  560. auto capsule = PyCapsule_New(HostTensorNDRefHolder::alloc(val),
  561. "HostTensorND", ndarray_shared_from_tensor_py_capsule_dtor);
  562. mgb_assert(capsule, "failed to create PyCapsule");
  563. auto err = PyArray_SetBaseObject(
  564. reinterpret_cast<PyArrayObject*>(ret), capsule);
  565. mgb_assert(!err);
  566. }
  567. return ret;
  568. }
  569. HostTensorND np2tensor(PyObject* obj, const Meth& meth, DType dtype) {
  570. auto ret_full = np2tensor_try_borrow(obj, meth, dtype);
  571. if (meth.must_borrow_) {
  572. mgb_assert(ret_full.second,
  573. "can not borrow from numpy array as contig array with dtype "
  574. "%s; src=%s",
  575. dtype.name(), repr_pyobj(obj).c_str());
  576. }
  577. return ret_full.first;
  578. }
  579. PyObject* dtype_mgb2np(mgb::DType dtype) {
  580. PYTHON_GIL;
  581. // According to
  582. // https://docs.scipy.org/doc/numpy/reference/c-api.array.html#c.PyArray_TypeObjectFromType
  583. // the following is equivalent to PyArray_TypeObjectFromType for built-in
  584. // types.
  585. if(!dtype.valid()){
  586. Py_XINCREF(Py_None);
  587. return Py_None;
  588. }
  589. auto descr = dtype_mgb2np_descr(dtype);
  590. if (descr == nullptr) {
  591. Py_XINCREF(Py_None);
  592. return Py_None;
  593. }
  594. if (dtype.has_param()) {
  595. return reinterpret_cast<PyObject*>(descr.release());
  596. }
  597. PyObject* typeobj = reinterpret_cast<PyObject*>(descr->typeobj);
  598. Py_XINCREF(typeobj);
  599. return typeobj;
  600. }
  601. mgb::DType dtype_np2mgb(PyObject *obj) {
  602. mgb_assert(obj && obj != Py_None,
  603. "can not convert null PyObject to numpy dtype");
  604. // see
  605. // http://stackoverflow.com/questions/8477122/numpy-c-api-convert-type-object-to-type-number
  606. PYTHON_GIL;
  607. PyArray_Descr* dtype;
  608. if(!PyArray_DescrConverter(obj, &dtype)) {
  609. throw ConversionError(ssprintf("can not convert to np.dtype from %s",
  610. repr_pyobj(obj).c_str()));
  611. }
  612. mgb::DType result = dtype_np2mgb_descr(dtype);
  613. Py_DECREF(dtype);
  614. return result;
  615. }
  616. PyObject* to_mgb_supported_dtype(PyObject* dtype) {
  617. PYTHON_GIL;
  618. PyArray_Descr* descr;
  619. if (!PyArray_DescrConverter(dtype, &descr)) {
  620. throw ConversionError(ssprintf("can not convert to np.dtype from %s",
  621. repr_pyobj(dtype).c_str()));
  622. }
  623. mgb_assert(!descr->metadata,
  624. "unexpected metadata in dtype: "
  625. "dtype_obj=%s metadata=%s",
  626. repr_pyobj(dtype).c_str(), repr_pyobj(descr->metadata).c_str());
  627. int type_num = to_mgb_supported_dtype_raw(descr->type_num);
  628. return PyArray_TypeObjectFromType(type_num);
  629. }
  630. TensorShape vec2shape(const std::vector<size_t> &vec) {
  631. TensorShape shape;
  632. mgb_assert(vec.size() <= TensorShape::MAX_NDIM,
  633. "dim too large: %zd (max %zd)",
  634. vec.size(), TensorShape::MAX_NDIM);
  635. shape.ndim = vec.size();
  636. for (size_t i = 0; i < vec.size(); i ++) {
  637. if (!vec[i]) {
  638. shape.ndim = 0;
  639. break;
  640. }
  641. shape[i] = vec[i];
  642. }
  643. mgb_assert(shape.ndim, "shape should not be empty");
  644. return shape;
  645. }
  646. } // namespace npy

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台