You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

test_command.cpp 6.5 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207
  1. // Tencent is pleased to support the open source community by making ncnn available.
  2. //
  3. // Copyright (C) 2021 THL A29 Limited, a Tencent company. All rights reserved.
  4. //
  5. // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // https://opensource.org/licenses/BSD-3-Clause
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #include "command.h"
  15. #include "gpu.h"
  16. #include "mat.h"
  17. #include "testutil.h"
  18. static int test_command_upload_download(const ncnn::Mat& a)
  19. {
  20. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  21. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  22. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  23. ncnn::Option opt;
  24. opt.num_threads = 1;
  25. opt.use_vulkan_compute = true;
  26. opt.blob_vkallocator = blob_allocator;
  27. opt.staging_vkallocator = staging_allocator;
  28. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  29. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  30. ncnn::Mat c;
  31. {
  32. ncnn::VkCompute cmd(vkdev);
  33. ncnn::VkMat b;
  34. cmd.record_upload(a, b, opt);
  35. cmd.record_download(b, c, opt);
  36. cmd.submit_and_wait();
  37. }
  38. vkdev->reclaim_blob_allocator(blob_allocator);
  39. vkdev->reclaim_staging_allocator(staging_allocator);
  40. if (CompareMat(a, c, 0.001) != 0)
  41. {
  42. fprintf(stderr, "test_command_upload_download image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  43. return -1;
  44. }
  45. return 0;
  46. }
  47. static int test_command_clone(const ncnn::Mat& a)
  48. {
  49. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  50. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  51. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  52. ncnn::Option opt;
  53. opt.num_threads = 1;
  54. opt.use_vulkan_compute = true;
  55. opt.blob_vkallocator = blob_allocator;
  56. opt.staging_vkallocator = staging_allocator;
  57. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  58. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  59. ncnn::Mat d;
  60. ncnn::Mat e;
  61. {
  62. ncnn::VkCompute cmd(vkdev);
  63. ncnn::VkMat b1;
  64. ncnn::VkMat b2;
  65. ncnn::VkImageMat b3;
  66. ncnn::VkImageMat c1;
  67. ncnn::VkImageMat c2;
  68. ncnn::VkMat c3;
  69. cmd.record_clone(a, b1, opt);
  70. cmd.record_clone(a, c1, opt);
  71. cmd.record_clone(b1, b2, opt);
  72. cmd.record_clone(c1, c2, opt);
  73. cmd.record_clone(b2, b3, opt);
  74. cmd.record_clone(c2, c3, opt);
  75. cmd.record_clone(b3, d, opt);
  76. cmd.record_clone(c3, e, opt);
  77. cmd.submit_and_wait();
  78. }
  79. vkdev->reclaim_blob_allocator(blob_allocator);
  80. vkdev->reclaim_staging_allocator(staging_allocator);
  81. if (CompareMat(a, d, 0.001) != 0)
  82. {
  83. fprintf(stderr, "test_command_clone buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  84. return -1;
  85. }
  86. if (CompareMat(a, e, 0.001) != 0)
  87. {
  88. fprintf(stderr, "test_command_clone image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  89. return -1;
  90. }
  91. return 0;
  92. }
  93. static int test_command_transfer(const ncnn::Mat& a)
  94. {
  95. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  96. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  97. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  98. ncnn::Option opt;
  99. opt.num_threads = 1;
  100. opt.use_vulkan_compute = true;
  101. opt.blob_vkallocator = blob_allocator;
  102. opt.staging_vkallocator = staging_allocator;
  103. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  104. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  105. ncnn::Mat c;
  106. {
  107. ncnn::VkTransfer cmd1(vkdev);
  108. ncnn::VkMat b;
  109. cmd1.record_upload(a, b, opt, false);
  110. cmd1.submit_and_wait();
  111. ncnn::VkCompute cmd2(vkdev);
  112. cmd2.record_download(b, c, opt);
  113. cmd2.submit_and_wait();
  114. }
  115. vkdev->reclaim_blob_allocator(blob_allocator);
  116. vkdev->reclaim_staging_allocator(staging_allocator);
  117. if (CompareMat(a, c, 0.001) != 0)
  118. {
  119. fprintf(stderr, "test_command_transfer buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  120. return -1;
  121. }
  122. return 0;
  123. }
  124. static int test_command_0()
  125. {
  126. return 0
  127. || test_command_upload_download(RandomMat(5, 7, 24))
  128. || test_command_upload_download(RandomMat(7, 9, 12))
  129. || test_command_upload_download(RandomMat(3, 5, 13))
  130. || test_command_upload_download(RandomMat(15, 24))
  131. || test_command_upload_download(RandomMat(19, 12))
  132. || test_command_upload_download(RandomMat(17, 15))
  133. || test_command_upload_download(RandomMat(128))
  134. || test_command_upload_download(RandomMat(124))
  135. || test_command_upload_download(RandomMat(127));
  136. }
  137. static int test_command_1()
  138. {
  139. return 0
  140. || test_command_clone(RandomMat(5, 7, 24))
  141. || test_command_clone(RandomMat(7, 9, 12))
  142. || test_command_clone(RandomMat(3, 5, 13))
  143. || test_command_clone(RandomMat(15, 24))
  144. || test_command_clone(RandomMat(19, 12))
  145. || test_command_clone(RandomMat(17, 15))
  146. || test_command_clone(RandomMat(128))
  147. || test_command_clone(RandomMat(124))
  148. || test_command_clone(RandomMat(127));
  149. }
  150. static int test_command_2()
  151. {
  152. return 0
  153. || test_command_transfer(RandomMat(5, 7, 24))
  154. || test_command_transfer(RandomMat(7, 9, 12))
  155. || test_command_transfer(RandomMat(3, 5, 13))
  156. || test_command_transfer(RandomMat(15, 24))
  157. || test_command_transfer(RandomMat(19, 12))
  158. || test_command_transfer(RandomMat(17, 15))
  159. || test_command_transfer(RandomMat(128))
  160. || test_command_transfer(RandomMat(124))
  161. || test_command_transfer(RandomMat(127));
  162. }
  163. int main()
  164. {
  165. SRAND(7767517);
  166. return test_command_0() || test_command_1() || test_command_2();
  167. }