You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

reorg.cpp 2.2 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778
  1. // Tencent is pleased to support the open source community by making ncnn available.
  2. //
  3. // Copyright (C) 2018 THL A29 Limited, a Tencent company. All rights reserved.
  4. //
  5. // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // https://opensource.org/licenses/BSD-3-Clause
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #include "reorg.h"
  15. namespace ncnn {
  16. DEFINE_LAYER_CREATOR(Reorg)
  17. Reorg::Reorg()
  18. {
  19. one_blob_only = true;
  20. support_inplace = false;
  21. }
  22. int Reorg::load_param(const ParamDict& pd)
  23. {
  24. stride = pd.get(0, 0);
  25. return 0;
  26. }
  27. int Reorg::forward(const Mat& bottom_blob, Mat& top_blob, const Option& opt) const
  28. {
  29. int w = bottom_blob.w;
  30. int h = bottom_blob.h;
  31. int channels = bottom_blob.c;
  32. size_t elemsize = bottom_blob.elemsize;
  33. int outw = w / stride;
  34. int outh = h / stride;
  35. int outc = channels * stride * stride;
  36. top_blob.create(outw, outh, outc, elemsize, opt.blob_allocator);
  37. if (top_blob.empty())
  38. return -100;
  39. #pragma omp parallel for num_threads(opt.num_threads)
  40. for (int q=0; q<channels; q++)
  41. {
  42. const Mat m = bottom_blob.channel(q);
  43. for (int sh = 0; sh < stride; sh++)
  44. {
  45. for (int sw = 0; sw < stride; sw++)
  46. {
  47. float* outptr = top_blob.channel(q*stride*stride + sh*stride + sw);
  48. for (int i = 0; i < outh; i++)
  49. {
  50. const float* sptr = m.row(i*stride + sh) + sw;
  51. for (int j = 0; j < outw; j++)
  52. {
  53. outptr[0] = sptr[0];
  54. sptr += stride;
  55. outptr++;
  56. }
  57. }
  58. }
  59. }
  60. }
  61. return 0;
  62. }
  63. } // namespace ncnn