You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

test_command.cpp 7.2 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228
  1. // Tencent is pleased to support the open source community by making ncnn available.
  2. //
  3. // Copyright (C) 2021 THL A29 Limited, a Tencent company. All rights reserved.
  4. //
  5. // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // https://opensource.org/licenses/BSD-3-Clause
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #include "command.h"
  15. #include "gpu.h"
  16. #include "mat.h"
  17. #include "testutil.h"
  18. static int test_command_upload_download(const ncnn::Mat& a)
  19. {
  20. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  21. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  22. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  23. ncnn::Option opt;
  24. opt.use_vulkan_compute = true;
  25. opt.blob_vkallocator = blob_allocator;
  26. opt.staging_vkallocator = staging_allocator;
  27. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  28. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  29. ncnn::Mat d;
  30. ncnn::Mat e;
  31. {
  32. ncnn::VkCompute cmd(vkdev);
  33. ncnn::VkMat b1;
  34. ncnn::VkImageMat b2;
  35. ncnn::VkImageMat c1;
  36. ncnn::VkMat c2;
  37. cmd.record_upload(a, b1, opt);
  38. cmd.record_upload(a, c1, opt);
  39. cmd.record_buffer_to_image(b1, b2, opt);
  40. cmd.record_image_to_buffer(c1, c2, opt);
  41. cmd.record_download(b2, d, opt);
  42. cmd.record_download(c2, e, opt);
  43. cmd.submit_and_wait();
  44. }
  45. vkdev->reclaim_blob_allocator(blob_allocator);
  46. vkdev->reclaim_staging_allocator(staging_allocator);
  47. if (CompareMat(a, d, 0.001) != 0)
  48. {
  49. fprintf(stderr, "test_command_upload_download buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  50. return -1;
  51. }
  52. if (CompareMat(a, e, 0.001) != 0)
  53. {
  54. fprintf(stderr, "test_command_upload_download image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  55. return -1;
  56. }
  57. return 0;
  58. }
  59. static int test_command_clone(const ncnn::Mat& a)
  60. {
  61. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  62. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  63. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  64. ncnn::Option opt;
  65. opt.use_vulkan_compute = true;
  66. opt.blob_vkallocator = blob_allocator;
  67. opt.staging_vkallocator = staging_allocator;
  68. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  69. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  70. ncnn::Mat d;
  71. ncnn::Mat e;
  72. {
  73. ncnn::VkCompute cmd(vkdev);
  74. ncnn::VkMat b1;
  75. ncnn::VkMat b2;
  76. ncnn::VkImageMat b3;
  77. ncnn::VkImageMat c1;
  78. ncnn::VkImageMat c2;
  79. ncnn::VkMat c3;
  80. cmd.record_clone(a, b1, opt);
  81. cmd.record_clone(a, c1, opt);
  82. cmd.record_clone(b1, b2, opt);
  83. cmd.record_clone(c1, c2, opt);
  84. cmd.record_clone(b2, b3, opt);
  85. cmd.record_clone(c2, c3, opt);
  86. cmd.record_clone(b3, d, opt);
  87. cmd.record_clone(c3, e, opt);
  88. cmd.submit_and_wait();
  89. }
  90. vkdev->reclaim_blob_allocator(blob_allocator);
  91. vkdev->reclaim_staging_allocator(staging_allocator);
  92. if (CompareMat(a, d, 0.001) != 0)
  93. {
  94. fprintf(stderr, "test_command_clone buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  95. return -1;
  96. }
  97. if (CompareMat(a, e, 0.001) != 0)
  98. {
  99. fprintf(stderr, "test_command_clone image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  100. return -1;
  101. }
  102. return 0;
  103. }
  104. static int test_command_transfer(const ncnn::Mat& a)
  105. {
  106. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  107. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  108. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  109. ncnn::Option opt;
  110. opt.use_vulkan_compute = true;
  111. opt.blob_vkallocator = blob_allocator;
  112. opt.staging_vkallocator = staging_allocator;
  113. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  114. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  115. ncnn::Mat d;
  116. ncnn::Mat e;
  117. {
  118. ncnn::VkTransfer cmd1(vkdev);
  119. ncnn::VkMat b1;
  120. ncnn::VkImageMat c1;
  121. cmd1.record_upload(a, b1, opt, false);
  122. cmd1.record_upload(a, c1, opt);
  123. cmd1.submit_and_wait();
  124. ncnn::VkCompute cmd2(vkdev);
  125. cmd2.record_download(b1, d, opt);
  126. cmd2.record_download(c1, e, opt);
  127. cmd2.submit_and_wait();
  128. }
  129. vkdev->reclaim_blob_allocator(blob_allocator);
  130. vkdev->reclaim_staging_allocator(staging_allocator);
  131. if (CompareMat(a, d, 0.001) != 0)
  132. {
  133. fprintf(stderr, "test_command_transfer buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  134. return -1;
  135. }
  136. if (CompareMat(a, e, 0.001) != 0)
  137. {
  138. fprintf(stderr, "test_command_transfer image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  139. return -1;
  140. }
  141. return 0;
  142. }
  143. static int test_command_0()
  144. {
  145. return 0
  146. || test_command_upload_download(RandomMat(5, 7, 24))
  147. || test_command_upload_download(RandomMat(7, 9, 12))
  148. || test_command_upload_download(RandomMat(3, 5, 13))
  149. || test_command_upload_download(RandomMat(15, 24))
  150. || test_command_upload_download(RandomMat(19, 12))
  151. || test_command_upload_download(RandomMat(17, 15))
  152. || test_command_upload_download(RandomMat(128))
  153. || test_command_upload_download(RandomMat(124))
  154. || test_command_upload_download(RandomMat(127));
  155. }
  156. static int test_command_1()
  157. {
  158. return 0
  159. || test_command_clone(RandomMat(5, 7, 24))
  160. || test_command_clone(RandomMat(7, 9, 12))
  161. || test_command_clone(RandomMat(3, 5, 13))
  162. || test_command_clone(RandomMat(15, 24))
  163. || test_command_clone(RandomMat(19, 12))
  164. || test_command_clone(RandomMat(17, 15))
  165. || test_command_clone(RandomMat(128))
  166. || test_command_clone(RandomMat(124))
  167. || test_command_clone(RandomMat(127));
  168. }
  169. static int test_command_2()
  170. {
  171. return 0
  172. || test_command_transfer(RandomMat(5, 7, 24))
  173. || test_command_transfer(RandomMat(7, 9, 12))
  174. || test_command_transfer(RandomMat(3, 5, 13))
  175. || test_command_transfer(RandomMat(15, 24))
  176. || test_command_transfer(RandomMat(19, 12))
  177. || test_command_transfer(RandomMat(17, 15))
  178. || test_command_transfer(RandomMat(128))
  179. || test_command_transfer(RandomMat(124))
  180. || test_command_transfer(RandomMat(127));
  181. }
  182. int main()
  183. {
  184. SRAND(7767517);
  185. return test_command_0() || test_command_1() || test_command_2();
  186. }