You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

roi_align.cpp 3.7 kB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889
  1. /**
  2. * \file dnn/src/common/roi_align.cpp
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2020 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. */
  11. #include "megdnn/oprs.h"
  12. #include "src/common/utils.h"
  13. namespace megdnn {
  14. void ROIAlignBase::deduce_layout_fwd(const TensorLayout& src,
  15. const TensorLayout& rois,
  16. TensorLayout& dst, TensorLayout& index) {
  17. megdnn_assert_contiguous(src);
  18. megdnn_assert_contiguous(rois);
  19. megdnn_assert_contiguous(dst);
  20. megdnn_assert_contiguous(index);
  21. auto errmsg = [&]() {
  22. return megdnn_layout_msg(src) + ", " + megdnn_layout_msg(rois) + ", " +
  23. megdnn_layout_msg(dst) + ", " + megdnn_layout_msg(index);
  24. };
  25. MEGDNN_MARK_USED_VAR(errmsg);
  26. using Format = ROIAlignBase::Param::Format;
  27. megdnn_assert(param().format == Format::NCHW);
  28. auto src_dtype = src.dtype, rois_dtype = rois.dtype;
  29. megdnn_assert(src_dtype == rois_dtype &&
  30. src_dtype.category() == DTypeCategory::FLOAT);
  31. megdnn_assert(src.ndim == 4_z, "%s", errmsg().c_str());
  32. size_t channels = src.shape[1];
  33. megdnn_assert(rois.ndim == 2_z, "%s", errmsg().c_str());
  34. // rois shape: bid, x0, y0, x1, y1
  35. megdnn_assert(rois[1] == 5_z, "%s", errmsg().c_str());
  36. size_t M = rois[0];
  37. size_t pooled_height = param().pooled_height;
  38. size_t pooled_width = param().pooled_width;
  39. dst = TensorLayout{{M, channels, pooled_height, pooled_width}, src.dtype};
  40. index = dst;
  41. index.dtype = dtype::Int32();
  42. }
  43. void ROIAlignBase::check_layout_fwd(const TensorLayout& src,
  44. const TensorLayout& rois,
  45. const TensorLayout& dst,
  46. const TensorLayout& index) {
  47. TensorLayout dst_expected, index_expected;
  48. megdnn_assert_eq_dtype(src, dst);
  49. deduce_layout_fwd(src, rois, dst_expected, index_expected);
  50. megdnn_assert_eq_shape(dst_expected, dst);
  51. megdnn_assert_eq_shape(index_expected, index);
  52. megdnn_assert(index.dtype == dtype::Int32());
  53. }
  54. void ROIAlignForward::deduce_layout(const TensorLayout& src,
  55. const TensorLayout& rois, TensorLayout& dst,
  56. TensorLayout& index) {
  57. deduce_layout_fwd(src, rois, dst, index);
  58. }
  59. void ROIAlignForward::check_exec(const TensorLayout& src,
  60. const TensorLayout& rois,
  61. const TensorLayout& dst,
  62. const TensorLayout& index,
  63. size_t workspace_in_bytes) {
  64. check_layout_fwd(src, rois, dst, index);
  65. auto required_workspace_in_bytes =
  66. get_workspace_in_bytes(src, rois, dst, index);
  67. megdnn_assert(workspace_in_bytes >= required_workspace_in_bytes);
  68. }
  69. void ROIAlignBackward::check_exec(const TensorLayout& diff,
  70. const TensorLayout& rois,
  71. const TensorLayout& index,
  72. const TensorLayout& grad,
  73. size_t workspace_in_bytes) {
  74. check_layout_fwd(grad, rois, diff, index);
  75. auto required_workspace_in_bytes =
  76. get_workspace_in_bytes(diff, rois, index, grad);
  77. megdnn_assert(workspace_in_bytes >= required_workspace_in_bytes);
  78. }
  79. } // namespace megdnn
  80. // vim: syntax=cpp.doxygen

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台