You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

helper.cpp 27 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733
  1. /**
  2. * \file imperative/python/src/helper.cpp
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. */
  11. #include "./helper.h"
  12. #include <pybind11/eval.h>
  13. #include "megbrain/graph/cg.h"
  14. #include "megbrain/graph/event.h"
  15. #include "megbrain/graph/exc_extra_info.h"
  16. #include "megbrain/tensor.h"
  17. #include "megbrain/utils/mempool.h"
  18. #include "./numpy_dtypes.h"
  19. namespace py = pybind11;
  20. PyTaskDipatcher py_task_q = {};
  21. py::module submodule(py::module parent, const char* name, const char* doc) {
  22. auto m = parent.def_submodule(name, doc);
  23. m.attr("__package__") = parent.attr("__name__");
  24. m.attr("__builtins__") = py::module::import("builtins");
  25. return m;
  26. }
  27. py::module rel_import(py::str name, py::module m, int level) {
  28. py::object import = py::module::import("builtins").attr("__import__");
  29. return import(name, m.attr("__dict__"), py::arg("level") = level);
  30. }
  31. /*
  32. * demangle typeid, see
  33. * http://stackoverflow.com/questions/281818/unmangling-the-result-of-stdtype-infoname
  34. */
  35. #ifdef __GNUG__
  36. #include <cxxabi.h>
  37. #include <cstdlib>
  38. #include <memory>
  39. namespace {
  40. std::string demangle_typeid(const char* name) {
  41. int status = -4; // some arbitrary value to eliminate the compiler warning
  42. // enable c++11 by passing the flag -std=c++11 to g++
  43. std::unique_ptr<char, void (*)(void*)> res{
  44. abi::__cxa_demangle(name, nullptr, nullptr, &status), std::free};
  45. return (status == 0) ? res.get() : name;
  46. }
  47. } // namespace
  48. #else
  49. namespace {
  50. // does nothing if not g++
  51. std::string demangle_typeid(const char* name) {
  52. return name;
  53. }
  54. } // namespace
  55. #endif
  56. using namespace mgb;
  57. using namespace cg;
  58. namespace {
  59. std::string repr_pyobj(PyObject* obj) {
  60. if (!obj)
  61. return "<null PyObject>";
  62. PYTHON_GIL;
  63. auto str = PyObject_Repr(obj);
  64. if (!str)
  65. return ssprintf("<PyObject at %p (repr failed)>", obj);
  66. std::string ret{PyUnicode_AsUTF8(str)};
  67. Py_DECREF(str);
  68. return ret;
  69. }
  70. template <typename T>
  71. std::string typeid_name(const T& t) {
  72. return demangle_typeid(typeid(t).name());
  73. }
  74. } // anonymous namespace
  75. /* ============== PyExceptionForward ============== */
  76. PyExceptionForward::~PyExceptionForward() {
  77. PYTHON_GIL;
  78. PyObjRefKeeper::deleter(m_type);
  79. PyObjRefKeeper::deleter(m_value);
  80. PyObjRefKeeper::deleter(m_traceback);
  81. }
  82. void PyExceptionForward::restore() {
  83. PyErr_Restore(m_type, m_value, m_traceback);
  84. m_type = m_value = m_traceback = nullptr;
  85. }
  86. void PyExceptionForward::throw_() {
  87. PyObject *etype, *obj, *trace;
  88. PyErr_Fetch(&etype, &obj, &trace);
  89. PyErr_NormalizeException(&etype, &obj, &trace);
  90. std::string msg{"python exception"};
  91. bool succ = false;
  92. if (etype && obj && trace) {
  93. auto run = [&]() {
  94. #define DEF(name, expr) \
  95. PyObjRefKeeper name{expr}; \
  96. if (!name.get()) \
  97. return
  98. DEF(mod, PyImport_ImportModule("traceback"));
  99. DEF(result,
  100. PyObject_CallMethod(
  101. mod.get(), "format_exception", "(OOO)", etype, obj, trace));
  102. if (!PyList_Check(result.get()))
  103. return;
  104. auto size = PyList_Size(result.get());
  105. msg.append(":\n");
  106. for (Py_ssize_t i = 0; i < size; ++i) {
  107. msg.append(" ");
  108. msg.append(PyUnicode_AsUTF8(PyList_GetItem(result.get(), i)));
  109. }
  110. msg.pop_back(); // remove last \n
  111. succ = true;
  112. #undef DEF
  113. };
  114. run();
  115. }
  116. if (!succ) {
  117. PyObject* obj_str_py;
  118. if (obj && (obj_str_py = PyObject_Repr(obj))) {
  119. msg.append(" with message ");
  120. msg.append(PyUnicode_AsUTF8(obj_str_py));
  121. Py_DECREF(obj_str_py);
  122. } else {
  123. msg.append(" with unknown message");
  124. }
  125. }
  126. // throwing exception may cause abort due to unknown reasons; so we first
  127. // log the message
  128. mgb_log_error("caught exception from python callback: %s", msg.c_str());
  129. fflush(stdout);
  130. fflush(stderr);
  131. throw PyExceptionForward{etype, obj, trace, msg};
  132. }
  133. /* ============== namespace npy ============== */
  134. namespace npy {
  135. int to_mgb_supported_dtype_raw(int dtype) {
  136. if (dtype == NPY_INT64)
  137. return NPY_INT32;
  138. if (dtype == NPY_FLOAT64)
  139. return NPY_FLOAT32;
  140. return dtype;
  141. }
  142. #define FOREACH_NPY_DTYPE_PAIR(cb) \
  143. cb(Uint8, NPY_UINT8) cb(Int8, NPY_INT8) cb(Uint16, NPY_UINT16) \
  144. cb(Int16, NPY_INT16) cb(Int32, NPY_INT32) cb(Float16, NPY_FLOAT16) \
  145. cb(Float32, NPY_FLOAT32) cb(Bool, NPY_BOOL)
  146. #define FOREACH_NPY_MGB_DTYPE_PAIR(cb) \
  147. FOREACH_NPY_DTYPE_PAIR(cb) \
  148. FOREACH_MGB_DTYPE_PAIR(cb)
  149. //! convert megbrain dtype to numpy dtype
  150. int dtype_mgb2np_raw(DType dtype) {
  151. mgb_assert(dtype.valid(), "attempt to convert from invalid dtype");
  152. switch (dtype.enumv()) {
  153. #define cb(_m, _n) \
  154. case DTypeEnum::_m: \
  155. return _n;
  156. FOREACH_NPY_MGB_DTYPE_PAIR(cb)
  157. #undef cb
  158. default:
  159. break;
  160. }
  161. throw ConversionError(
  162. ssprintf("can not convert dtype %s to numpy dtype", dtype.name()));
  163. }
  164. //! Convert MegBrain DType to NumPy DType descriptor, the caller receives a new
  165. //! reference to the descriptor.
  166. std::unique_ptr<PyArray_Descr, PyArrayDescrDeleter> dtype_mgb2np_descr(DType dtype) {
  167. PYTHON_GIL;
  168. mgb_assert(dtype.valid(), "attempt to convert from invalid dtype");
  169. auto build_mgb_dtype_dict =
  170. [](const char* name,
  171. const std::vector<std::pair<const char*, PyObject*>>& data) {
  172. PyObject* metadata = PyDict_New();
  173. PyObject* mgb_dtype_metadata = PyDict_New();
  174. PyDict_SetItemString(
  175. mgb_dtype_metadata, "name", PyUnicode_FromString(name));
  176. for (const auto& d : data) {
  177. PyDict_SetItemString(mgb_dtype_metadata, d.first, d.second);
  178. }
  179. PyDict_SetItemString(metadata, "mgb_dtype", mgb_dtype_metadata);
  180. return metadata;
  181. };
  182. if (dtype.has_param()) {
  183. PyArray_Descr* type_descr;
  184. switch (dtype.enumv()) {
  185. case DTypeEnum::QuantizedS1: {
  186. auto& param = dtype.param<dtype::QuantizedS1>();
  187. type_descr = PyArray_DescrNewFromType(NPY_INT8);
  188. type_descr->metadata = build_mgb_dtype_dict(
  189. DTypeTrait<dtype::QuantizedS1>::name,
  190. {{"scale", PyFloat_FromDouble(param.scale)}});
  191. break;
  192. }
  193. case DTypeEnum::Quantized4Asymm: {
  194. auto& param = dtype.param<dtype::Quantized4Asymm>();
  195. type_descr = PyArray_DescrNewFromType(NPY_UINT8);
  196. type_descr->metadata = build_mgb_dtype_dict(
  197. DTypeTrait<dtype::Quantized4Asymm>::name,
  198. {{"scale", PyFloat_FromDouble(param.scale)},
  199. {"zero_point", PyLong_FromLong(param.zero_point)}});
  200. break;
  201. }
  202. case DTypeEnum::QuantizedS4: {
  203. auto& param = dtype.param<dtype::QuantizedS4>();
  204. type_descr = PyArray_DescrNewFromType(NPY_INT8);
  205. type_descr->metadata = build_mgb_dtype_dict(
  206. DTypeTrait<dtype::QuantizedS4>::name,
  207. {{"scale", PyFloat_FromDouble(param.scale)}});
  208. break;
  209. }
  210. case DTypeEnum::Quantized8Asymm: {
  211. auto& param = dtype.param<dtype::Quantized8Asymm>();
  212. type_descr = PyArray_DescrNewFromType(NPY_UINT8);
  213. type_descr->metadata = build_mgb_dtype_dict(
  214. DTypeTrait<dtype::Quantized8Asymm>::name,
  215. {{"scale", PyFloat_FromDouble(param.scale)},
  216. {"zero_point", PyLong_FromLong(param.zero_point)}});
  217. break;
  218. }
  219. case DTypeEnum::QuantizedS8: {
  220. auto& param = dtype.param<dtype::QuantizedS8>();
  221. type_descr = PyArray_DescrNewFromType(NPY_INT8);
  222. type_descr->metadata = build_mgb_dtype_dict(
  223. DTypeTrait<dtype::QuantizedS8>::name,
  224. {{"scale", PyFloat_FromDouble(param.scale)}});
  225. break;
  226. }
  227. case DTypeEnum::QuantizedS32: {
  228. auto& param = dtype.param<dtype::QuantizedS32>();
  229. type_descr = PyArray_DescrNewFromType(NPY_INT32);
  230. type_descr->metadata = build_mgb_dtype_dict(
  231. DTypeTrait<dtype::QuantizedS32>::name,
  232. {{"scale", PyFloat_FromDouble(param.scale)}});
  233. break;
  234. }
  235. default:
  236. mgb_throw(
  237. ConversionError, "unhandled parameterized DType %s",
  238. dtype.name());
  239. }
  240. return std::unique_ptr<PyArray_Descr, PyArrayDescrDeleter>(type_descr);
  241. }
  242. PyArray_Descr* basic_descr = PyArray_DescrFromType(dtype_mgb2np_raw(dtype));
  243. mgb_assert(
  244. basic_descr != nullptr,
  245. "failed to convert expected dtype to numpy type descriptor");
  246. return std::unique_ptr<PyArray_Descr, PyArrayDescrDeleter>(basic_descr);
  247. }
  248. DType dtype_np2mgb_raw(int npt) {
  249. switch (npt) {
  250. #define cb(_m, _n) \
  251. case _n: \
  252. return dtype::_m();
  253. FOREACH_NPY_DTYPE_PAIR(cb)
  254. #undef cb
  255. }
  256. #define cb(_m, _n) \
  257. if (_n == npt) \
  258. return dtype::_m();
  259. FOREACH_MGB_DTYPE_PAIR(cb)
  260. #undef cb
  261. PYTHON_GIL;
  262. std::string msg;
  263. auto py_obj = PyArray_TypeObjectFromType(npt);
  264. if (!py_obj) {
  265. msg = ssprintf("unknown numpy dtype enum %d", npt);
  266. } else {
  267. msg = ssprintf("unsupported numpy dtype %s", repr_pyobj(py_obj).c_str());
  268. }
  269. Py_DECREF(py_obj);
  270. throw ConversionError(msg);
  271. }
  272. DType dtype_np2mgb_descr(PyArray_Descr* descr) {
  273. PYTHON_GIL;
  274. auto handle_parameterized_dtype = [](PyObject* metadata) -> DType {
  275. mgb_assert(
  276. PyDict_Check(metadata),
  277. "Invalid parameterized DType metadata: should be a dict");
  278. PyObject* dtype_name_py = PyDict_GetItemString(metadata, "name");
  279. mgb_assert(
  280. PyUnicode_Check(dtype_name_py),
  281. "Invalid parameterized DType metadata: name should be a str");
  282. std::string dtype_name(PyUnicode_AsUTF8(dtype_name_py));
  283. if (dtype_name == "Quantized8Asymm") {
  284. PyObject* scale_py = PyDict_GetItemString(metadata, "scale");
  285. PyObject* zero_point_py = PyDict_GetItemString(metadata, "zero_point");
  286. mgb_assert(
  287. scale_py && zero_point_py,
  288. "Invalid Quantized8Asymm metadata: missing scale or "
  289. "zero_point.");
  290. mgb_assert(
  291. PyFloat_Check(scale_py),
  292. "Invalid Quantized8Asymm metadata: scale should be float");
  293. mgb_assert(
  294. PyLong_Check(zero_point_py),
  295. "Invalid Quantized8Asymm metadata: zero_point should be "
  296. "integer");
  297. auto zero_point = PyLong_AS_LONG(zero_point_py);
  298. mgb_assert(
  299. zero_point >= 0 && zero_point < 256,
  300. "Invalid Quantized8Asymm metadata: zero_point should be "
  301. "in [0, 256)");
  302. return dtype::Quantized8Asymm(
  303. static_cast<float>(PyFloat_AS_DOUBLE(scale_py)),
  304. static_cast<uint8_t>(zero_point));
  305. }
  306. if (dtype_name == "Quantized4Asymm") {
  307. PyObject* scale_py = PyDict_GetItemString(metadata, "scale");
  308. PyObject* zero_point_py = PyDict_GetItemString(metadata, "zero_point");
  309. mgb_assert(
  310. scale_py && zero_point_py,
  311. "Invalid Quantized4Asymm metadata: missing scale or "
  312. "zero_point.");
  313. mgb_assert(
  314. PyFloat_Check(scale_py),
  315. "Invalid Quantized4Asymm metadata: scale should be float");
  316. mgb_assert(
  317. PyLong_Check(zero_point_py),
  318. "Invalid Quantized4Asymm metadata: zero_point should be "
  319. "integer");
  320. auto zero_point = PyLong_AS_LONG(zero_point_py);
  321. mgb_assert(
  322. zero_point >= 0 && zero_point < 15,
  323. "Invalid Quantized4Asymm metadata: zero_point should be "
  324. "in [0, 15)");
  325. return dtype::Quantized4Asymm(
  326. static_cast<float>(PyFloat_AS_DOUBLE(scale_py)),
  327. static_cast<uint8_t>(zero_point));
  328. }
  329. if (dtype_name == "QuantizedS32" || dtype_name == "QuantizedS8" ||
  330. dtype_name == "QuantizedS4" || dtype_name == "QuantizedS1") {
  331. PyObject* scale_py = PyDict_GetItemString(metadata, "scale");
  332. mgb_assert(scale_py, "Invalid metadata: missing scale");
  333. mgb_assert(
  334. PyFloat_Check(scale_py), "Invalid metadata: scale should be float");
  335. float scale = static_cast<float>(PyFloat_AS_DOUBLE(scale_py));
  336. if (dtype_name == "QuantizedS32") {
  337. return dtype::QuantizedS32(scale);
  338. } else if (dtype_name == "QuantizedS8") {
  339. return dtype::QuantizedS8(scale);
  340. } else if (dtype_name == "QuantizedS4") {
  341. return dtype::QuantizedS4(scale);
  342. } else if (dtype_name == "QuantizedS1") {
  343. return dtype::QuantizedS1(scale);
  344. }
  345. }
  346. throw ConversionError(
  347. ssprintf("Unknown parameterized DType: %s", dtype_name.c_str())
  348. .c_str());
  349. };
  350. PyObject* dtype_metadata;
  351. if (descr->metadata && PyDict_Check(descr->metadata) &&
  352. (dtype_metadata = PyDict_GetItemString(descr->metadata, "mgb_dtype"))) {
  353. return handle_parameterized_dtype(dtype_metadata);
  354. }
  355. return dtype_np2mgb_raw(descr->type_num);
  356. }
  357. HostTensorND lowbit_ndarray_to_host_tensor(
  358. CompNode comp_node, TensorLayout& layout, PyArrayObject* input) {
  359. auto src_ptr = reinterpret_cast<dt_byte*>(PyArray_DATA(input));
  360. if (!layout.ndim) {
  361. // numpy scalar
  362. mgb_assert(src_ptr, "can not convert from null numpy array");
  363. layout.init_contiguous_stride({1});
  364. } else {
  365. mgb_assert(
  366. layout.ndim && layout.ndim <= TensorShape::MAX_NDIM,
  367. "unsupported ndim %zu", layout.ndim);
  368. TensorLayout ly;
  369. ly.ndim = layout.ndim;
  370. for (size_t i = 0; i < layout.ndim; ++i) {
  371. ly.shape[i] = layout.shape[i] = PyArray_SHAPE(input)[i];
  372. ly.stride[i] = PyArray_STRIDE(input, i);
  373. mgb_assert(layout.shape[i], "zero shape not supported");
  374. }
  375. mgb_assert(ly.is_physical_contiguous());
  376. layout.init_contiguous_stride();
  377. }
  378. HostTensorND ret{comp_node, layout};
  379. if (layout.format.is_lowbit_aligned()) {
  380. mgb_assert(layout.is_contiguous());
  381. lowbit_memcpy_byte2aligned(ret.raw_ptr(), src_ptr, layout);
  382. } else {
  383. lowbit_memcpy_byte2compact(
  384. layout.dtype, ret.raw_ptr(), src_ptr, layout.total_nr_elems());
  385. }
  386. return ret;
  387. }
  388. /*!
  389. * \brief convert a python object to tensor and try to borrow memory if the
  390. * original object is a contiguous numpy array
  391. * \param dtype see np2tensor
  392. * \return the megbrain tensor, and whether memory is borrowed
  393. */
  394. std::pair<HostTensorND, bool> np2tensor_try_borrow(
  395. PyObject* obj, const npy::Meth& meth, DType dtype) {
  396. auto dest_cn = meth.dest_cn_;
  397. mgb_assert(dest_cn.valid());
  398. PYTHON_GIL;
  399. PyArray_Descr* expected_descr = nullptr;
  400. if (dtype.valid()) {
  401. // The reference to expected_descr will be stealed later.
  402. expected_descr = dtype_mgb2np_descr(dtype).release();
  403. }
  404. // make result from PyArrayObject; its reference may be stolen
  405. auto make_from_arr = [&](PyArrayObject* input, bool allow_borrow) {
  406. TensorLayout layout{{}, dtype_np2mgb_descr(PyArray_DESCR(input))};
  407. if (dtype.valid())
  408. mgb_assert(dtype == layout.dtype);
  409. layout.ndim = PyArray_NDIM(input);
  410. if (layout.dtype.is_low_bit()) {
  411. auto ret = lowbit_ndarray_to_host_tensor(dest_cn, layout, input);
  412. if (meth.dest_tensor_) {
  413. meth.dest_tensor_->copy_from(ret);
  414. ret = *meth.dest_tensor_;
  415. }
  416. return std::make_pair(ret, false);
  417. }
  418. auto data = reinterpret_cast<dt_byte*>(PyArray_DATA(input));
  419. if (!layout.ndim) {
  420. // numpy scalar
  421. mgb_assert(data, "can not convert from null numpy array");
  422. layout.init_contiguous_stride({1});
  423. } else {
  424. mgb_assert(
  425. layout.ndim && layout.ndim <= TensorShape::MAX_NDIM,
  426. "unsupported ndim %zu", layout.ndim);
  427. auto dsize = layout.dtype.size();
  428. bool is_empty = false;
  429. for (size_t i = 0; i < layout.ndim; ++i) {
  430. layout.shape[i] = PyArray_SHAPE(input)[i];
  431. layout.stride[i] = PyArray_STRIDE(input, i);
  432. if (!layout.shape[i]) {
  433. is_empty = true;
  434. }
  435. mgb_assert(
  436. layout.stride[i] % dsize == 0, "bad stride %zd",
  437. layout.stride[i]);
  438. layout.stride[i] /= dsize;
  439. }
  440. mgb_assert(is_empty || layout.is_contiguous());
  441. }
  442. if (!meth.dest_tensor_ && allow_borrow) {
  443. Py_INCREF(input);
  444. PyObjRefKeeper ref_obj_cvt{reinterpret_cast<PyObject*>(input)};
  445. HostTensorStorage storage;
  446. auto input_ptr = ref_obj_cvt.make_shared(data);
  447. storage.reset(dest_cn, layout.span().high_byte, input_ptr);
  448. HostTensorND ret;
  449. ret.reset(storage, layout);
  450. return std::make_pair(ret, true);
  451. } else {
  452. auto storage = HostTensorStorage(dest_cn);
  453. storage.ensure_size(layout.span().dist_byte());
  454. memcpy(storage.ptr(), data, layout.span().dist_byte());
  455. HostTensorND ret{dest_cn, layout.dtype};
  456. if (meth.dest_tensor_) {
  457. meth.dest_tensor_->reset(storage, layout);
  458. return std::make_pair(*meth.dest_tensor_, false);
  459. } else {
  460. HostTensorND ret;
  461. ret.reset(storage, layout);
  462. return std::make_pair(ret, false);
  463. }
  464. }
  465. };
  466. PyArrayObject* obj_as_arr = nullptr;
  467. do {
  468. // check contiguous and dtype, and borrow mem if ok
  469. if (!PyArray_Check(obj))
  470. break;
  471. obj_as_arr = reinterpret_cast<PyArrayObject*>(obj);
  472. int typenum = PyArray_DTYPE(obj_as_arr)->type_num;
  473. // We have to check dtype.valid() and typenum first to avoid
  474. // accidentally trigger ConversionError on incompatible dtypes which can
  475. // be automatically converted into comptaible ones (e.g. float64).
  476. if (dtype.valid() && (expected_descr->type_num != typenum ||
  477. dtype_np2mgb_descr(PyArray_DTYPE(obj_as_arr)) != dtype))
  478. break;
  479. if (typenum != to_mgb_supported_dtype_raw(typenum)) {
  480. mgb_assert(!dtype.valid() && expected_descr == nullptr);
  481. expected_descr = PyArray_DescrFromType(to_mgb_supported_dtype_raw(typenum));
  482. break;
  483. }
  484. if (PyArray_ISCARRAY_RO(obj_as_arr)) {
  485. return make_from_arr(obj_as_arr, true);
  486. }
  487. } while (0);
  488. constexpr auto NP_FLAGS = NPY_ARRAY_C_CONTIGUOUS | NPY_ARRAY_FORCECAST;
  489. PyObject* obj_cvt;
  490. if (obj_as_arr) {
  491. obj_cvt = PyArray_FromArray(obj_as_arr, expected_descr, NP_FLAGS);
  492. } else {
  493. obj_cvt = PyArray_FromAny(obj, expected_descr, 0, 0, NP_FLAGS, nullptr);
  494. }
  495. if (obj_cvt) {
  496. // convert to mgb supported dtype
  497. auto arr = reinterpret_cast<PyArrayObject*>(obj_cvt);
  498. int dt0 = PyArray_TYPE(arr), dt1 = to_mgb_supported_dtype_raw(dt0);
  499. if (dt0 != dt1) {
  500. mgb_assert(expected_descr == nullptr);
  501. expected_descr = PyArray_DescrFromType(dt1);
  502. mgb_assert(expected_descr);
  503. auto obj_cvt_new =
  504. PyArray_FromAny(obj_cvt, expected_descr, 0, 0, NP_FLAGS, nullptr);
  505. Py_DECREF(obj_cvt);
  506. obj_cvt = obj_cvt_new;
  507. }
  508. }
  509. if (!obj_cvt) {
  510. if (PyErr_Occurred()) {
  511. PyExceptionForward::throw_();
  512. }
  513. throw ConversionError(ssprintf(
  514. "can not convert to numpy array from %s", repr_pyobj(obj).c_str()));
  515. }
  516. auto ret = make_from_arr(reinterpret_cast<PyArrayObject*>(obj_cvt), false);
  517. Py_DECREF(obj_cvt);
  518. return ret;
  519. }
  520. //! hold a reference to HostTensorND
  521. class HostTensorNDRefHolder final : public NonCopyableObj {
  522. HostTensorND m_val;
  523. static MemPool<HostTensorNDRefHolder> sm_mem_pool;
  524. friend class MemPool<HostTensorNDRefHolder>;
  525. HostTensorNDRefHolder(const HostTensorND& v) : m_val{v} {}
  526. public:
  527. static HostTensorNDRefHolder* alloc(const HostTensorND& v) {
  528. return sm_mem_pool.alloc(v);
  529. }
  530. static void free(HostTensorNDRefHolder* p) { return sm_mem_pool.free(p); }
  531. };
  532. MemPool<HostTensorNDRefHolder> HostTensorNDRefHolder::sm_mem_pool;
  533. void ndarray_shared_from_tensor_py_capsule_dtor(PyObject* cap) {
  534. auto ptr = PyCapsule_GetPointer(cap, "HostTensorND");
  535. mgb_assert(ptr, "not a PyCapsule: %s", repr_pyobj(cap).c_str());
  536. HostTensorNDRefHolder::free(static_cast<HostTensorNDRefHolder*>(ptr));
  537. }
  538. PyObject* ndarray_from_tensor(const HostTensorND& val, ShareType share_type) {
  539. if (!val.layout().is_contiguous() && !val.shape().is_empty()) {
  540. mgb_assert(share_type != ShareType::MUST_SHARE);
  541. HostTensorND contig;
  542. contig.copy_from(val);
  543. return ndarray_from_tensor(contig, ShareType::TRY_SHARE);
  544. }
  545. PYTHON_GIL;
  546. npy_intp dims[TensorLayout::MAX_NDIM];
  547. for (size_t i = 0; i < val.layout().ndim; ++i)
  548. dims[i] = val.shape()[i];
  549. PyObject* ret = nullptr;
  550. auto alloc_new_ret = [&]() {
  551. mgb_assert(!ret);
  552. ret = PyArray_NewFromDescr(
  553. &PyArray_Type, dtype_mgb2np_descr(val.dtype()).release(),
  554. val.layout().ndim, dims, nullptr, nullptr, 0, nullptr);
  555. mgb_assert(ret, "failed to allocate array");
  556. mgb_assert(PyArray_Check(ret));
  557. return PyArray_DATA(reinterpret_cast<PyArrayObject*>(ret));
  558. };
  559. if (val.dtype().is_low_bit()) {
  560. mgb_assert(
  561. share_type != ShareType::MUST_SHARE,
  562. "can not share memory for lowbit dtype");
  563. const auto& layout = val.layout();
  564. if (layout.format.is_lowbit_aligned()) {
  565. lowbit_memcpy_aligned2byte(alloc_new_ret(), val.raw_ptr(), val.layout());
  566. } else {
  567. lowbit_memcpy_compact2byte(
  568. val.dtype(), alloc_new_ret(), val.raw_ptr(),
  569. val.layout().total_nr_elems());
  570. }
  571. } else if (share_type == ShareType::MUST_UNSHARE) {
  572. memcpy(alloc_new_ret(), val.raw_ptr(), val.layout().span().dist_byte());
  573. } else {
  574. // share data
  575. ret = PyArray_NewFromDescr(
  576. &PyArray_Type, dtype_mgb2np_descr(val.dtype()).release(),
  577. val.layout().ndim, dims, nullptr, const_cast<dt_byte*>(val.raw_ptr()),
  578. 0, nullptr);
  579. mgb_assert(ret, "failed to alloc ndarray");
  580. auto capsule = PyCapsule_New(
  581. HostTensorNDRefHolder::alloc(val), "HostTensorND",
  582. ndarray_shared_from_tensor_py_capsule_dtor);
  583. mgb_assert(capsule, "failed to create PyCapsule");
  584. auto err =
  585. PyArray_SetBaseObject(reinterpret_cast<PyArrayObject*>(ret), capsule);
  586. mgb_assert(!err);
  587. }
  588. return ret;
  589. }
  590. HostTensorND np2tensor(PyObject* obj, const Meth& meth, DType dtype) {
  591. auto ret_full = np2tensor_try_borrow(obj, meth, dtype);
  592. if (meth.must_borrow_) {
  593. mgb_assert(
  594. ret_full.second,
  595. "can not borrow from numpy array as contig array with dtype "
  596. "%s; src=%s",
  597. dtype.name(), repr_pyobj(obj).c_str());
  598. }
  599. return ret_full.first;
  600. }
  601. PyObject* dtype_mgb2np(mgb::DType dtype) {
  602. PYTHON_GIL;
  603. // According to
  604. // https://docs.scipy.org/doc/numpy/reference/c-api.array.html#c.PyArray_TypeObjectFromType
  605. // the following is equivalent to PyArray_TypeObjectFromType for built-in
  606. // types.
  607. if (!dtype.valid()) {
  608. Py_XINCREF(Py_None);
  609. return Py_None;
  610. }
  611. auto descr = dtype_mgb2np_descr(dtype);
  612. if (descr == nullptr) {
  613. Py_XINCREF(Py_None);
  614. return Py_None;
  615. }
  616. if (dtype.has_param()) {
  617. return reinterpret_cast<PyObject*>(descr.release());
  618. }
  619. PyObject* typeobj = reinterpret_cast<PyObject*>(descr->typeobj);
  620. Py_XINCREF(typeobj);
  621. return typeobj;
  622. }
  623. mgb::DType dtype_np2mgb(PyObject* obj) {
  624. mgb_assert(obj && obj != Py_None, "can not convert null PyObject to numpy dtype");
  625. // see
  626. // http://stackoverflow.com/questions/8477122/numpy-c-api-convert-type-object-to-type-number
  627. PYTHON_GIL;
  628. PyArray_Descr* dtype;
  629. if (!PyArray_DescrConverter(obj, &dtype)) {
  630. throw ConversionError(ssprintf(
  631. "can not convert to np.dtype from %s", repr_pyobj(obj).c_str()));
  632. }
  633. mgb::DType result = dtype_np2mgb_descr(dtype);
  634. Py_DECREF(dtype);
  635. return result;
  636. }
  637. PyObject* to_mgb_supported_dtype(PyObject* dtype) {
  638. PYTHON_GIL;
  639. PyArray_Descr* descr;
  640. if (!PyArray_DescrConverter(dtype, &descr)) {
  641. throw ConversionError(ssprintf(
  642. "can not convert to np.dtype from %s", repr_pyobj(dtype).c_str()));
  643. }
  644. mgb_assert(
  645. !descr->metadata,
  646. "unexpected metadata in dtype: "
  647. "dtype_obj=%s metadata=%s",
  648. repr_pyobj(dtype).c_str(), repr_pyobj(descr->metadata).c_str());
  649. int type_num = to_mgb_supported_dtype_raw(descr->type_num);
  650. return PyArray_TypeObjectFromType(type_num);
  651. }
  652. TensorShape vec2shape(const std::vector<size_t>& vec) {
  653. TensorShape shape;
  654. mgb_assert(
  655. vec.size() <= TensorShape::MAX_NDIM, "dim too large: %zd (max %zd)",
  656. vec.size(), TensorShape::MAX_NDIM);
  657. shape.ndim = vec.size();
  658. for (size_t i = 0; i < vec.size(); i++) {
  659. if (!vec[i]) {
  660. shape.ndim = 0;
  661. break;
  662. }
  663. shape[i] = vec[i];
  664. }
  665. mgb_assert(shape.ndim, "shape should not be empty");
  666. return shape;
  667. }
  668. } // namespace npy