You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

reorg.cpp 2.3 kB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283
  1. // Tencent is pleased to support the open source community by making ncnn available.
  2. //
  3. // Copyright (C) 2018 THL A29 Limited, a Tencent company. All rights reserved.
  4. //
  5. // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // https://opensource.org/licenses/BSD-3-Clause
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #include "reorg.h"
  15. namespace ncnn {
  16. Reorg::Reorg()
  17. {
  18. one_blob_only = true;
  19. support_inplace = false;
  20. }
  21. int Reorg::load_param(const ParamDict& pd)
  22. {
  23. stride = pd.get(0, 1);
  24. mode = pd.get(1, 0);
  25. return 0;
  26. }
  27. int Reorg::forward(const Mat& bottom_blob, Mat& top_blob, const Option& opt) const
  28. {
  29. int w = bottom_blob.w;
  30. int h = bottom_blob.h;
  31. int channels = bottom_blob.c;
  32. size_t elemsize = bottom_blob.elemsize;
  33. int outw = w / stride;
  34. int outh = h / stride;
  35. int outc = channels * stride * stride;
  36. top_blob.create(outw, outh, outc, elemsize, opt.blob_allocator);
  37. if (top_blob.empty())
  38. return -100;
  39. #pragma omp parallel for num_threads(opt.num_threads)
  40. for (int q = 0; q < channels; q++)
  41. {
  42. const Mat m = bottom_blob.channel(q);
  43. for (int sh = 0; sh < stride; sh++)
  44. {
  45. for (int sw = 0; sw < stride; sw++)
  46. {
  47. int p;
  48. if (mode == 0)
  49. p = q * stride * stride + sh * stride + sw;
  50. else // if (mode == 1)
  51. p = (sh * stride + sw) * channels + q;
  52. float* outptr = top_blob.channel(p);
  53. for (int i = 0; i < outh; i++)
  54. {
  55. const float* sptr = m.row(i * stride + sh) + sw;
  56. for (int j = 0; j < outw; j++)
  57. {
  58. outptr[0] = sptr[0];
  59. sptr += stride;
  60. outptr++;
  61. }
  62. }
  63. }
  64. }
  65. }
  66. return 0;
  67. }
  68. } // namespace ncnn