You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

transpose.cpp 1.7 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051
  1. /**
  2. * \file dnn/src/common/transpose.cpp
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. */
  11. #include "megdnn/oprs.h"
  12. #include "src/common/utils.h"
  13. namespace megdnn {
  14. void TransposeForward::deduce_layout(const TensorLayout &src, TensorLayout &dst)
  15. {
  16. dst = src;
  17. dst.dtype = src.dtype;
  18. std::swap(dst.shape[0], dst.shape[1]);
  19. dst.init_contiguous_stride();
  20. }
  21. void TransposeForward::check_exec(const TensorLayout &src,
  22. const TensorLayout &dst,
  23. size_t workspace_in_bytes)
  24. {
  25. // dtype must collide
  26. megdnn_assert(src.dtype == dst.dtype);
  27. // ndim must be 2
  28. megdnn_assert(src.ndim == 2);
  29. megdnn_assert(dst.ndim == 2);
  30. // shapes are swapped
  31. megdnn_assert(src.shape[0] == dst.shape[1]);
  32. megdnn_assert(src.shape[1] == dst.shape[0]);
  33. // last dimension stride must be 1
  34. megdnn_assert(src.stride[1] == 1);
  35. megdnn_assert(dst.stride[1] == 1);
  36. // leading dimension stride must be geq last dimension shape
  37. megdnn_assert(src.stride[0] > 0);
  38. megdnn_assert(dst.stride[0] > 0);
  39. megdnn_assert(static_cast<size_t>(src.stride[0]) >= src.shape[1]);
  40. megdnn_assert(static_cast<size_t>(dst.stride[0]) >= dst.shape[1]);
  41. auto required_workspace_in_bytes = get_workspace_in_bytes(src, dst);
  42. megdnn_assert(workspace_in_bytes >= required_workspace_in_bytes);
  43. }
  44. } // namespace megdnn
  45. // vim: syntax=cpp.doxygen

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台