You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

test_command.cpp 7.3 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231
  1. // Tencent is pleased to support the open source community by making ncnn available.
  2. //
  3. // Copyright (C) 2021 THL A29 Limited, a Tencent company. All rights reserved.
  4. //
  5. // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // https://opensource.org/licenses/BSD-3-Clause
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #include "command.h"
  15. #include "gpu.h"
  16. #include "mat.h"
  17. #include "testutil.h"
  18. static int test_command_upload_download(const ncnn::Mat& a)
  19. {
  20. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  21. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  22. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  23. ncnn::Option opt;
  24. opt.num_threads = 1;
  25. opt.use_vulkan_compute = true;
  26. opt.blob_vkallocator = blob_allocator;
  27. opt.staging_vkallocator = staging_allocator;
  28. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  29. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  30. ncnn::Mat d;
  31. ncnn::Mat e;
  32. {
  33. ncnn::VkCompute cmd(vkdev);
  34. ncnn::VkMat b1;
  35. ncnn::VkImageMat b2;
  36. ncnn::VkImageMat c1;
  37. ncnn::VkMat c2;
  38. cmd.record_upload(a, b1, opt);
  39. cmd.record_upload(a, c1, opt);
  40. cmd.record_buffer_to_image(b1, b2, opt);
  41. cmd.record_image_to_buffer(c1, c2, opt);
  42. cmd.record_download(b2, d, opt);
  43. cmd.record_download(c2, e, opt);
  44. cmd.submit_and_wait();
  45. }
  46. vkdev->reclaim_blob_allocator(blob_allocator);
  47. vkdev->reclaim_staging_allocator(staging_allocator);
  48. if (CompareMat(a, d, 0.001) != 0)
  49. {
  50. fprintf(stderr, "test_command_upload_download buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  51. return -1;
  52. }
  53. if (CompareMat(a, e, 0.001) != 0)
  54. {
  55. fprintf(stderr, "test_command_upload_download image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  56. return -1;
  57. }
  58. return 0;
  59. }
  60. static int test_command_clone(const ncnn::Mat& a)
  61. {
  62. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  63. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  64. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  65. ncnn::Option opt;
  66. opt.num_threads = 1;
  67. opt.use_vulkan_compute = true;
  68. opt.blob_vkallocator = blob_allocator;
  69. opt.staging_vkallocator = staging_allocator;
  70. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  71. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  72. ncnn::Mat d;
  73. ncnn::Mat e;
  74. {
  75. ncnn::VkCompute cmd(vkdev);
  76. ncnn::VkMat b1;
  77. ncnn::VkMat b2;
  78. ncnn::VkImageMat b3;
  79. ncnn::VkImageMat c1;
  80. ncnn::VkImageMat c2;
  81. ncnn::VkMat c3;
  82. cmd.record_clone(a, b1, opt);
  83. cmd.record_clone(a, c1, opt);
  84. cmd.record_clone(b1, b2, opt);
  85. cmd.record_clone(c1, c2, opt);
  86. cmd.record_clone(b2, b3, opt);
  87. cmd.record_clone(c2, c3, opt);
  88. cmd.record_clone(b3, d, opt);
  89. cmd.record_clone(c3, e, opt);
  90. cmd.submit_and_wait();
  91. }
  92. vkdev->reclaim_blob_allocator(blob_allocator);
  93. vkdev->reclaim_staging_allocator(staging_allocator);
  94. if (CompareMat(a, d, 0.001) != 0)
  95. {
  96. fprintf(stderr, "test_command_clone buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  97. return -1;
  98. }
  99. if (CompareMat(a, e, 0.001) != 0)
  100. {
  101. fprintf(stderr, "test_command_clone image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  102. return -1;
  103. }
  104. return 0;
  105. }
  106. static int test_command_transfer(const ncnn::Mat& a)
  107. {
  108. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  109. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  110. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  111. ncnn::Option opt;
  112. opt.num_threads = 1;
  113. opt.use_vulkan_compute = true;
  114. opt.blob_vkallocator = blob_allocator;
  115. opt.staging_vkallocator = staging_allocator;
  116. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  117. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  118. ncnn::Mat d;
  119. ncnn::Mat e;
  120. {
  121. ncnn::VkTransfer cmd1(vkdev);
  122. ncnn::VkMat b1;
  123. ncnn::VkImageMat c1;
  124. cmd1.record_upload(a, b1, opt, false);
  125. cmd1.record_upload(a, c1, opt);
  126. cmd1.submit_and_wait();
  127. ncnn::VkCompute cmd2(vkdev);
  128. cmd2.record_download(b1, d, opt);
  129. cmd2.record_download(c1, e, opt);
  130. cmd2.submit_and_wait();
  131. }
  132. vkdev->reclaim_blob_allocator(blob_allocator);
  133. vkdev->reclaim_staging_allocator(staging_allocator);
  134. if (CompareMat(a, d, 0.001) != 0)
  135. {
  136. fprintf(stderr, "test_command_transfer buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  137. return -1;
  138. }
  139. if (CompareMat(a, e, 0.001) != 0)
  140. {
  141. fprintf(stderr, "test_command_transfer image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  142. return -1;
  143. }
  144. return 0;
  145. }
  146. static int test_command_0()
  147. {
  148. return 0
  149. || test_command_upload_download(RandomMat(5, 7, 24))
  150. || test_command_upload_download(RandomMat(7, 9, 12))
  151. || test_command_upload_download(RandomMat(3, 5, 13))
  152. || test_command_upload_download(RandomMat(15, 24))
  153. || test_command_upload_download(RandomMat(19, 12))
  154. || test_command_upload_download(RandomMat(17, 15))
  155. || test_command_upload_download(RandomMat(128))
  156. || test_command_upload_download(RandomMat(124))
  157. || test_command_upload_download(RandomMat(127));
  158. }
  159. static int test_command_1()
  160. {
  161. return 0
  162. || test_command_clone(RandomMat(5, 7, 24))
  163. || test_command_clone(RandomMat(7, 9, 12))
  164. || test_command_clone(RandomMat(3, 5, 13))
  165. || test_command_clone(RandomMat(15, 24))
  166. || test_command_clone(RandomMat(19, 12))
  167. || test_command_clone(RandomMat(17, 15))
  168. || test_command_clone(RandomMat(128))
  169. || test_command_clone(RandomMat(124))
  170. || test_command_clone(RandomMat(127));
  171. }
  172. static int test_command_2()
  173. {
  174. return 0
  175. || test_command_transfer(RandomMat(5, 7, 24))
  176. || test_command_transfer(RandomMat(7, 9, 12))
  177. || test_command_transfer(RandomMat(3, 5, 13))
  178. || test_command_transfer(RandomMat(15, 24))
  179. || test_command_transfer(RandomMat(19, 12))
  180. || test_command_transfer(RandomMat(17, 15))
  181. || test_command_transfer(RandomMat(128))
  182. || test_command_transfer(RandomMat(124))
  183. || test_command_transfer(RandomMat(127));
  184. }
  185. int main()
  186. {
  187. SRAND(7767517);
  188. return test_command_0() || test_command_1() || test_command_2();
  189. }