You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

test_command.cpp 5.8 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196
  1. // Copyright 2021 Tencent
  2. // SPDX-License-Identifier: BSD-3-Clause
  3. #include "command.h"
  4. #include "gpu.h"
  5. #include "mat.h"
  6. #include "testutil.h"
  7. static int test_command_upload_download(const ncnn::Mat& a)
  8. {
  9. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  10. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  11. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  12. ncnn::Option opt;
  13. opt.num_threads = 1;
  14. opt.use_vulkan_compute = true;
  15. opt.blob_vkallocator = blob_allocator;
  16. opt.staging_vkallocator = staging_allocator;
  17. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  18. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  19. ncnn::Mat c;
  20. {
  21. ncnn::VkCompute cmd(vkdev);
  22. ncnn::VkMat b;
  23. cmd.record_upload(a, b, opt);
  24. cmd.record_download(b, c, opt);
  25. cmd.submit_and_wait();
  26. }
  27. vkdev->reclaim_blob_allocator(blob_allocator);
  28. vkdev->reclaim_staging_allocator(staging_allocator);
  29. if (CompareMat(a, c, 0.001) != 0)
  30. {
  31. fprintf(stderr, "test_command_upload_download image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  32. return -1;
  33. }
  34. return 0;
  35. }
  36. static int test_command_clone(const ncnn::Mat& a)
  37. {
  38. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  39. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  40. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  41. ncnn::Option opt;
  42. opt.num_threads = 1;
  43. opt.use_vulkan_compute = true;
  44. opt.blob_vkallocator = blob_allocator;
  45. opt.staging_vkallocator = staging_allocator;
  46. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  47. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  48. ncnn::Mat d;
  49. ncnn::Mat e;
  50. {
  51. ncnn::VkCompute cmd(vkdev);
  52. ncnn::VkMat b1;
  53. ncnn::VkMat b2;
  54. ncnn::VkImageMat b3;
  55. ncnn::VkImageMat c1;
  56. ncnn::VkImageMat c2;
  57. ncnn::VkMat c3;
  58. cmd.record_clone(a, b1, opt);
  59. cmd.record_clone(a, c1, opt);
  60. cmd.record_clone(b1, b2, opt);
  61. cmd.record_clone(c1, c2, opt);
  62. cmd.record_clone(b2, b3, opt);
  63. cmd.record_clone(c2, c3, opt);
  64. cmd.record_clone(b3, d, opt);
  65. cmd.record_clone(c3, e, opt);
  66. cmd.submit_and_wait();
  67. }
  68. vkdev->reclaim_blob_allocator(blob_allocator);
  69. vkdev->reclaim_staging_allocator(staging_allocator);
  70. if (CompareMat(a, d, 0.001) != 0)
  71. {
  72. fprintf(stderr, "test_command_clone buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  73. return -1;
  74. }
  75. if (CompareMat(a, e, 0.001) != 0)
  76. {
  77. fprintf(stderr, "test_command_clone image failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  78. return -1;
  79. }
  80. return 0;
  81. }
  82. static int test_command_transfer(const ncnn::Mat& a)
  83. {
  84. ncnn::VulkanDevice* vkdev = ncnn::get_gpu_device();
  85. ncnn::VkAllocator* blob_allocator = vkdev->acquire_blob_allocator();
  86. ncnn::VkAllocator* staging_allocator = vkdev->acquire_staging_allocator();
  87. ncnn::Option opt;
  88. opt.num_threads = 1;
  89. opt.use_vulkan_compute = true;
  90. opt.blob_vkallocator = blob_allocator;
  91. opt.staging_vkallocator = staging_allocator;
  92. if (!vkdev->info.support_fp16_packed()) opt.use_fp16_packed = false;
  93. if (!vkdev->info.support_fp16_storage()) opt.use_fp16_storage = false;
  94. ncnn::Mat c;
  95. {
  96. ncnn::VkTransfer cmd1(vkdev);
  97. ncnn::VkMat b;
  98. cmd1.record_upload(a, b, opt, false);
  99. cmd1.submit_and_wait();
  100. ncnn::VkCompute cmd2(vkdev);
  101. cmd2.record_download(b, c, opt);
  102. cmd2.submit_and_wait();
  103. }
  104. vkdev->reclaim_blob_allocator(blob_allocator);
  105. vkdev->reclaim_staging_allocator(staging_allocator);
  106. if (CompareMat(a, c, 0.001) != 0)
  107. {
  108. fprintf(stderr, "test_command_transfer buffer failed a.dims=%d a=(%d %d %d)\n", a.dims, a.w, a.h, a.c);
  109. return -1;
  110. }
  111. return 0;
  112. }
  113. static int test_command_0()
  114. {
  115. return 0
  116. || test_command_upload_download(RandomMat(5, 7, 24))
  117. || test_command_upload_download(RandomMat(7, 9, 12))
  118. || test_command_upload_download(RandomMat(3, 5, 13))
  119. || test_command_upload_download(RandomMat(15, 24))
  120. || test_command_upload_download(RandomMat(19, 12))
  121. || test_command_upload_download(RandomMat(17, 15))
  122. || test_command_upload_download(RandomMat(128))
  123. || test_command_upload_download(RandomMat(124))
  124. || test_command_upload_download(RandomMat(127));
  125. }
  126. static int test_command_1()
  127. {
  128. return 0
  129. || test_command_clone(RandomMat(5, 7, 24))
  130. || test_command_clone(RandomMat(7, 9, 12))
  131. || test_command_clone(RandomMat(3, 5, 13))
  132. || test_command_clone(RandomMat(15, 24))
  133. || test_command_clone(RandomMat(19, 12))
  134. || test_command_clone(RandomMat(17, 15))
  135. || test_command_clone(RandomMat(128))
  136. || test_command_clone(RandomMat(124))
  137. || test_command_clone(RandomMat(127));
  138. }
  139. static int test_command_2()
  140. {
  141. return 0
  142. || test_command_transfer(RandomMat(5, 7, 24))
  143. || test_command_transfer(RandomMat(7, 9, 12))
  144. || test_command_transfer(RandomMat(3, 5, 13))
  145. || test_command_transfer(RandomMat(15, 24))
  146. || test_command_transfer(RandomMat(19, 12))
  147. || test_command_transfer(RandomMat(17, 15))
  148. || test_command_transfer(RandomMat(128))
  149. || test_command_transfer(RandomMat(124))
  150. || test_command_transfer(RandomMat(127));
  151. }
  152. int main()
  153. {
  154. SRAND(7767517);
  155. return test_command_0() || test_command_1() || test_command_2();
  156. }