You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

test_convolution_3.cpp 17 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408
  1. // Tencent is pleased to support the open source community by making ncnn available.
  2. //
  3. // Copyright (C) 2019 THL A29 Limited, a Tencent company. All rights reserved.
  4. //
  5. // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // https://opensource.org/licenses/BSD-3-Clause
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #include "layer/convolution.h"
  15. #include "testutil.h"
  16. static int test_convolution_vec(int w, int outch, int kernel, int dilation, int stride, int pad, int bias)
  17. {
  18. ncnn::Mat a = RandomMat(w);
  19. ncnn::ParamDict pd;
  20. pd.set(0, outch); // num_output
  21. pd.set(1, kernel); // kernel_w
  22. pd.set(2, dilation); // dilation_w
  23. pd.set(3, stride); // stride_w
  24. pd.set(4, pad); // pad_w
  25. pd.set(5, bias); // bias_term
  26. pd.set(6, outch * w * kernel * kernel);
  27. int activation_type = RAND() % 7; // 0 1 2 3 4 5 6
  28. ncnn::Mat activation_params(2);
  29. activation_params[0] = (activation_type == 6) ? RandomFloat(0, 1) : RandomFloat(-1, 0); // alpha
  30. activation_params[1] = RandomFloat(0, 1); // beta
  31. pd.set(9, activation_type);
  32. pd.set(10, activation_params);
  33. std::vector<ncnn::Mat> weights(bias ? 2 : 1);
  34. weights[0] = RandomMat(outch * w * kernel * kernel);
  35. if (bias)
  36. weights[1] = RandomMat(outch);
  37. int ret = test_layer<ncnn::Convolution>("Convolution", pd, weights, a);
  38. if (ret != 0)
  39. {
  40. fprintf(stderr, "test_convolution_vec failed w=%d outch=%d kernel=%d dilation=%d stride=%d pad=%d bias=%d act=%d actparams=[%f,%f]\n", w, outch, kernel, dilation, stride, pad, bias, activation_type, activation_params[0], activation_params[1]);
  41. }
  42. return ret;
  43. }
  44. static int test_convolution_2()
  45. {
  46. return 0
  47. || test_convolution_vec(1, 1, 1, 1, 1, 0, 1)
  48. || test_convolution_vec(11, 12, 1, 1, 1, 0, 0)
  49. || test_convolution_vec(20, 15, 1, 1, 1, 0, 1)
  50. || test_convolution_vec(12, 20, 1, 1, 1, 0, 0)
  51. || test_convolution_vec(3, 24, 1, 1, 1, 0, 1)
  52. || test_convolution_vec(24, 5, 1, 1, 1, 0, 0)
  53. || test_convolution_vec(32, 24, 1, 1, 1, 0, 1)
  54. || test_convolution_vec(12, 32, 1, 1, 1, 0, 0)
  55. || test_convolution_vec(64, 20, 1, 1, 1, 0, 1)
  56. || test_convolution_vec(64, 128, 1, 1, 1, 0, 0);
  57. }
  58. static int test_convolution_dynamic(int w, int h, int c, int outch, int kernel, int dilation, int stride, int pad, int bias)
  59. {
  60. ncnn::Mat a = RandomMat(w, h, c);
  61. ncnn::ParamDict pd;
  62. pd.set(0, 0);
  63. pd.set(1, 0);
  64. pd.set(2, dilation);
  65. pd.set(3, stride);
  66. pd.set(4, pad);
  67. pd.set(5, bias);
  68. pd.set(6, 0);
  69. pd.set(19, 1); // dynamic weight
  70. int activation_type = RAND() % 7; // 0 1 2 3 4 5 6
  71. ncnn::Mat activation_params(2);
  72. activation_params[0] = (activation_type == 6) ? RandomFloat(0, 1) : RandomFloat(-1, 0); // alpha
  73. activation_params[1] = RandomFloat(0, 1); // beta
  74. pd.set(9, activation_type);
  75. pd.set(10, activation_params);
  76. std::vector<ncnn::Mat> as(bias ? 3 : 2);
  77. as[0] = a;
  78. as[1] = RandomMat(kernel, kernel, c, outch);
  79. if (bias)
  80. as[2] = RandomMat(outch);
  81. std::vector<ncnn::Mat> weights(0);
  82. int ret = test_layer<ncnn::Convolution>("Convolution", pd, weights, as);
  83. if (ret != 0)
  84. {
  85. fprintf(stderr, "test_convolution_dynamic failed w=%d h=%d c=%d outch=%d kernel=%d dilation=%d stride=%d pad=%d bias=%d act=%d actparams=[%f,%f]\n", w, h, c, outch, kernel, dilation, stride, pad, bias, activation_type, activation_params[0], activation_params[1]);
  86. }
  87. return ret;
  88. }
  89. static int test_convolution_3()
  90. {
  91. static const int kdsp[7][4] = {
  92. {1, 1, 1, 0},
  93. {1, 1, 2, 0},
  94. {2, 1, 1, 1},
  95. {2, 1, 2, -233},
  96. {3, 1, 1, 1},
  97. {3, 1, 2, 1},
  98. {3, 2, 1, -234},
  99. };
  100. for (int i = 0; i < 7; i++)
  101. {
  102. const int k = kdsp[i][0];
  103. const int d = kdsp[i][1];
  104. const int s = kdsp[i][2];
  105. const int p = kdsp[i][3];
  106. int ret = 0
  107. || test_convolution_dynamic(11, 10, 1, 1, k, d, s, p, 1)
  108. || test_convolution_dynamic(11, 10, 4, 13, k, d, s, p, 0)
  109. || test_convolution_dynamic(11, 10, 13, 4, k, d, s, p, 1)
  110. || test_convolution_dynamic(11, 10, 12, 12, k, d, s, p, 0)
  111. || test_convolution_dynamic(11, 10, 8, 12, k, d, s, p, 1)
  112. || test_convolution_dynamic(11, 10, 8, 13, k, d, s, p, 0)
  113. || test_convolution_dynamic(11, 10, 13, 8, k, d, s, p, 1)
  114. || test_convolution_dynamic(11, 10, 12, 16, k, d, s, p, 0)
  115. || test_convolution_dynamic(11, 10, 15, 15, k, d, s, p, 0)
  116. || test_convolution_dynamic(11, 10, 16, 16, k, d, s, p, 0);
  117. if (ret != 0)
  118. return -1;
  119. }
  120. return 0;
  121. }
  122. #if NCNN_INT8
  123. static int test_convolution_int8(int w, int h, int c, int outch, int kernel, int dilation, int stride, int pad, int bias, bool requant = false)
  124. {
  125. ncnn::Mat a = RandomMat(w, h, c);
  126. ncnn::ParamDict pd;
  127. pd.set(0, outch);
  128. pd.set(1, kernel);
  129. pd.set(2, dilation);
  130. pd.set(3, stride);
  131. pd.set(4, pad);
  132. pd.set(5, bias);
  133. pd.set(6, outch * c * kernel * kernel);
  134. pd.set(8, requant ? 101 : 1); // int8_scale_term
  135. int activation_type = RAND() % 7; // 0 1 2 3 4 5 6
  136. ncnn::Mat activation_params(2);
  137. activation_params[0] = (activation_type == 6) ? RandomFloat(0, 1) : RandomFloat(-1, 0); // alpha
  138. activation_params[1] = RandomFloat(0, 1); // beta
  139. pd.set(9, activation_type);
  140. pd.set(10, activation_params);
  141. std::vector<ncnn::Mat> weights(bias ? 5 : 4);
  142. weights[0] = RandomMat(outch * c * kernel * kernel);
  143. ncnn::Mat weight_scales = scales_mat(weights[0], outch, c * kernel * kernel, c * kernel * kernel);
  144. ncnn::Mat input_scales = scales_mat(a, 1, w * h * c, a.cstep);
  145. ncnn::Mat top_scales = requant ? scales_mat(a, 1, w * h * c, a.cstep) : ncnn::Mat();
  146. if (bias)
  147. {
  148. weights[1] = RandomMat(outch);
  149. weights[2] = weight_scales;
  150. weights[3] = input_scales;
  151. weights[4] = top_scales;
  152. }
  153. else
  154. {
  155. weights[1] = weight_scales;
  156. weights[2] = input_scales;
  157. weights[3] = top_scales;
  158. }
  159. int flag = TEST_LAYER_DISABLE_GPU_TESTING;
  160. int ret = test_layer<ncnn::Convolution>("Convolution", pd, weights, a, requant ? 1.0f : 0.001f, 0, flag);
  161. if (ret != 0)
  162. {
  163. fprintf(stderr, "test_convolution_int8 failed w=%d h=%d c=%d outch=%d kernel=%d dilation=%d stride=%d pad=%d bias=%d requant=%d act=%d actparams=[%f,%f]\n", w, h, c, outch, kernel, dilation, stride, pad, bias, requant, activation_type, activation_params[0], activation_params[1]);
  164. return ret;
  165. }
  166. {
  167. ncnn::Option opt;
  168. opt.num_threads = 1;
  169. opt.use_packing_layout = true;
  170. opt.use_fp16_packed = false;
  171. opt.use_fp16_storage = false;
  172. opt.use_fp16_arithmetic = false;
  173. opt.use_bf16_storage = false;
  174. opt.use_shader_pack8 = false;
  175. opt.use_image_storage = false;
  176. opt.use_sgemm_convolution = false;
  177. opt.use_winograd_convolution = false;
  178. ret = test_layer_opt<ncnn::Convolution>("Convolution", pd, weights, opt, a, requant ? 1.0f : 0.001f, 0, flag);
  179. if (ret != 0)
  180. {
  181. fprintf(stderr, "test_convolution_int8 failed w=%d h=%d c=%d outch=%d kernel=%d dilation=%d stride=%d pad=%d bias=%d requant=%d act=%d actparams=[%f,%f]\n", w, h, c, outch, kernel, dilation, stride, pad, bias, requant, activation_type, activation_params[0], activation_params[1]);
  182. return ret;
  183. }
  184. }
  185. {
  186. ncnn::Option opt;
  187. opt.num_threads = 1;
  188. opt.use_packing_layout = true;
  189. opt.use_fp16_packed = true;
  190. opt.use_fp16_storage = true;
  191. opt.use_fp16_arithmetic = true;
  192. opt.use_bf16_storage = true;
  193. opt.use_shader_pack8 = true;
  194. opt.use_image_storage = true;
  195. opt.use_sgemm_convolution = false;
  196. opt.use_winograd_convolution = false;
  197. ret = test_layer_opt<ncnn::Convolution>("Convolution", pd, weights, opt, a, requant ? 1.0f : 0.001f, 0, flag);
  198. if (ret != 0)
  199. {
  200. fprintf(stderr, "test_convolution_int8 failed w=%d h=%d c=%d outch=%d kernel=%d dilation=%d stride=%d pad=%d bias=%d requant=%d act=%d actparams=[%f,%f]\n", w, h, c, outch, kernel, dilation, stride, pad, bias, requant, activation_type, activation_params[0], activation_params[1]);
  201. return ret;
  202. }
  203. }
  204. return ret;
  205. }
  206. static int test_convolution_1()
  207. {
  208. static const int kdsp[16][4] = {
  209. {1, 1, 1, 0},
  210. {1, 1, 2, 0},
  211. {2, 1, 1, 1},
  212. {2, 1, 2, -233},
  213. {3, 1, 1, 1},
  214. {3, 1, 2, 1},
  215. {3, 2, 1, 1},
  216. {4, 1, 1, 2},
  217. {4, 1, 2, -233},
  218. {4, 2, 1, -234},
  219. {5, 1, 1, -234},
  220. {5, 1, 2, 2},
  221. {5, 2, 2, 2},
  222. {7, 1, 1, 3},
  223. {7, 1, 2, 3},
  224. {7, 2, 1, -233},
  225. };
  226. for (int i = 0; i < 16; i++)
  227. {
  228. const int k = kdsp[i][0];
  229. const int d = kdsp[i][1];
  230. const int s = kdsp[i][2];
  231. const int p = kdsp[i][3];
  232. int ret = 0
  233. || test_convolution_int8(9, 7, 1, 1, k, d, s, p, 1)
  234. || test_convolution_int8(9, 7, 2, 2, k, d, s, p, 1)
  235. || test_convolution_int8(9, 7, 3, 3, k, d, s, p, 1)
  236. || test_convolution_int8(9, 7, 4, 4, k, d, s, p, 1)
  237. || test_convolution_int8(9, 7, 7, 7, k, d, s, p, 1)
  238. || test_convolution_int8(9, 7, 8, 8, k, d, s, p, 1)
  239. || test_convolution_int8(9, 7, 15, 15, k, d, s, p, 1)
  240. || test_convolution_int8(9, 7, 16, 15, k, d, s, p, 1)
  241. || test_convolution_int8(9, 7, 15, 16, k, d, s, p, 1)
  242. || test_convolution_int8(9, 7, 16, 16, k, d, s, p, 1);
  243. if (ret != 0)
  244. return -1;
  245. }
  246. for (int i = 0; i < 16; i++)
  247. {
  248. const int k = kdsp[i][0];
  249. const int d = kdsp[i][1];
  250. const int s = kdsp[i][2];
  251. const int p = kdsp[i][3];
  252. int ret = 0
  253. || test_convolution_int8(9, 7, 1, 1, k, d, s, p, 1, true)
  254. || test_convolution_int8(9, 7, 1, 1, k, d, s, p, 1, true)
  255. || test_convolution_int8(9, 7, 2, 2, k, d, s, p, 1, true)
  256. || test_convolution_int8(9, 7, 3, 3, k, d, s, p, 1, true)
  257. || test_convolution_int8(9, 7, 4, 4, k, d, s, p, 1, true)
  258. || test_convolution_int8(9, 7, 7, 7, k, d, s, p, 1, true)
  259. || test_convolution_int8(9, 7, 8, 8, k, d, s, p, 1, true)
  260. || test_convolution_int8(9, 7, 15, 15, k, d, s, p, 1, true)
  261. || test_convolution_int8(9, 7, 16, 15, k, d, s, p, 1, true)
  262. || test_convolution_int8(9, 7, 15, 16, k, d, s, p, 1, true)
  263. || test_convolution_int8(9, 7, 16, 16, k, d, s, p, 1, true);
  264. if (ret != 0)
  265. return -1;
  266. }
  267. return 0
  268. || test_convolution_int8(11, 11, 8, 16, 3, 1, 1, 1, 1)
  269. || test_convolution_int8(13, 16, 16, 24, 3, 1, 1, 1, 1)
  270. || test_convolution_int8(8, 8, 16, 24, 3, 1, 1, 1, 0)
  271. || test_convolution_int8(4, 8, 16, 24, 3, 1, 1, 1, 1)
  272. || test_convolution_int8(4, 20, 16, 24, 3, 1, 1, 1, 0)
  273. || test_convolution_int8(6, 7, 64, 64, 3, 1, 2, 0, 1)
  274. || test_convolution_int8(25, 33, 16, 15, 3, 1, 1, 1, 0)
  275. || test_convolution_int8(7, 7, 15, 12, 3, 1, 1, 1, 0);
  276. }
  277. static int test_convolution_1_2()
  278. {
  279. return 0
  280. || test_convolution_int8(19, 17, 1, 1, 3, 2, 2, 0, 1)
  281. || test_convolution_int8(19, 17, 2, 1, 3, 2, 2, 0, 0)
  282. || test_convolution_int8(19, 17, 7, 1, 3, 2, 2, 0, 1)
  283. || test_convolution_int8(19, 17, 8, 1, 3, 2, 2, 0, 0)
  284. || test_convolution_int8(19, 17, 15, 1, 3, 2, 2, 0, 1)
  285. || test_convolution_int8(19, 17, 16, 1, 3, 2, 2, 0, 0)
  286. || test_convolution_int8(19, 17, 31, 1, 3, 2, 2, 0, 1)
  287. || test_convolution_int8(19, 17, 32, 1, 3, 2, 2, 0, 0)
  288. || test_convolution_int8(19, 17, 1, 2, 5, 2, 2, 0, 1)
  289. || test_convolution_int8(19, 17, 2, 2, 5, 2, 2, 0, 0)
  290. || test_convolution_int8(19, 17, 7, 2, 5, 2, 2, 0, 1)
  291. || test_convolution_int8(19, 17, 8, 2, 5, 2, 2, 0, 0)
  292. || test_convolution_int8(19, 17, 15, 2, 5, 2, 2, 0, 1)
  293. || test_convolution_int8(19, 17, 16, 2, 5, 2, 2, 0, 0)
  294. || test_convolution_int8(19, 17, 31, 2, 5, 2, 2, 0, 1)
  295. || test_convolution_int8(19, 17, 32, 2, 5, 2, 2, 0, 0)
  296. || test_convolution_int8(19, 17, 1, 7, 5, 2, 2, 0, 1)
  297. || test_convolution_int8(19, 17, 2, 7, 5, 2, 2, 0, 0)
  298. || test_convolution_int8(19, 17, 7, 7, 5, 2, 2, 0, 1)
  299. || test_convolution_int8(19, 17, 8, 7, 5, 2, 2, 0, 0)
  300. || test_convolution_int8(19, 17, 15, 7, 5, 2, 2, 0, 1)
  301. || test_convolution_int8(19, 17, 16, 7, 5, 2, 2, 0, 0)
  302. || test_convolution_int8(19, 17, 31, 7, 5, 2, 2, 0, 1)
  303. || test_convolution_int8(19, 17, 32, 7, 5, 2, 2, 0, 0)
  304. || test_convolution_int8(19, 17, 1, 8, 5, 2, 2, 0, 1)
  305. || test_convolution_int8(19, 17, 2, 8, 5, 2, 2, 0, 0)
  306. || test_convolution_int8(19, 17, 7, 8, 5, 2, 2, 0, 1)
  307. || test_convolution_int8(19, 17, 8, 8, 5, 2, 2, 0, 0)
  308. || test_convolution_int8(19, 17, 15, 8, 5, 2, 2, 0, 1)
  309. || test_convolution_int8(19, 17, 16, 8, 5, 2, 2, 0, 0)
  310. || test_convolution_int8(19, 17, 31, 8, 5, 2, 2, 0, 1)
  311. || test_convolution_int8(19, 17, 32, 8, 5, 2, 2, 0, 0)
  312. || test_convolution_int8(19, 17, 1, 15, 5, 2, 2, 0, 1)
  313. || test_convolution_int8(19, 17, 2, 15, 5, 2, 2, 0, 0)
  314. || test_convolution_int8(19, 17, 7, 15, 5, 2, 2, 0, 1)
  315. || test_convolution_int8(19, 17, 8, 15, 5, 2, 2, 0, 0)
  316. || test_convolution_int8(19, 17, 15, 15, 5, 2, 2, 0, 1)
  317. || test_convolution_int8(19, 17, 16, 15, 5, 2, 2, 0, 0)
  318. || test_convolution_int8(19, 17, 31, 15, 5, 2, 2, 0, 1)
  319. || test_convolution_int8(19, 17, 32, 15, 5, 2, 2, 0, 0)
  320. || test_convolution_int8(19, 17, 1, 16, 5, 2, 2, 0, 1)
  321. || test_convolution_int8(19, 17, 2, 16, 5, 2, 2, 0, 0)
  322. || test_convolution_int8(19, 17, 7, 16, 5, 2, 2, 0, 1)
  323. || test_convolution_int8(19, 17, 8, 16, 5, 2, 2, 0, 0)
  324. || test_convolution_int8(19, 17, 15, 16, 5, 2, 2, 0, 1)
  325. || test_convolution_int8(19, 17, 16, 16, 5, 2, 2, 0, 0)
  326. || test_convolution_int8(19, 17, 31, 16, 5, 2, 2, 0, 1)
  327. || test_convolution_int8(19, 17, 32, 16, 5, 2, 2, 0, 0)
  328. || test_convolution_int8(19, 17, 1, 31, 5, 2, 2, 0, 1)
  329. || test_convolution_int8(19, 17, 2, 31, 5, 2, 2, 0, 0)
  330. || test_convolution_int8(19, 17, 7, 31, 5, 2, 2, 0, 1)
  331. || test_convolution_int8(19, 17, 8, 31, 5, 2, 2, 0, 0)
  332. || test_convolution_int8(19, 17, 15, 31, 5, 2, 2, 0, 1)
  333. || test_convolution_int8(19, 17, 16, 31, 5, 2, 2, 0, 0)
  334. || test_convolution_int8(19, 17, 31, 31, 5, 2, 2, 0, 1)
  335. || test_convolution_int8(19, 17, 32, 31, 5, 2, 2, 0, 0)
  336. || test_convolution_int8(19, 17, 1, 32, 5, 2, 2, 0, 1)
  337. || test_convolution_int8(19, 17, 2, 32, 5, 2, 2, 0, 0)
  338. || test_convolution_int8(19, 17, 7, 32, 5, 2, 2, 0, 1)
  339. || test_convolution_int8(19, 17, 8, 32, 5, 2, 2, 0, 0)
  340. || test_convolution_int8(19, 17, 15, 32, 5, 2, 2, 0, 1)
  341. || test_convolution_int8(19, 17, 16, 32, 5, 2, 2, 0, 0)
  342. || test_convolution_int8(19, 17, 31, 32, 5, 2, 2, 0, 1)
  343. || test_convolution_int8(19, 17, 32, 32, 5, 2, 2, 0, 0);
  344. }
  345. #endif // NCNN_INT8
  346. int main()
  347. {
  348. SRAND(7767517);
  349. #if NCNN_INT8
  350. return 0
  351. || test_convolution_1()
  352. || test_convolution_1_2()
  353. || test_convolution_2()
  354. || test_convolution_3();
  355. #else
  356. return 0
  357. || test_convolution_2()
  358. || test_convolution_3();
  359. #endif
  360. }