You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

test_multiheadattention.cpp 5.5 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161
  1. // Tencent is pleased to support the open source community by making ncnn available.
  2. //
  3. // Copyright (C) 2021 THL A29 Limited, a Tencent company. All rights reserved.
  4. //
  5. // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
  6. // in compliance with the License. You may obtain a copy of the License at
  7. //
  8. // https://opensource.org/licenses/BSD-3-Clause
  9. //
  10. // Unless required by applicable law or agreed to in writing, software distributed
  11. // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
  12. // CONDITIONS OF ANY KIND, either express or implied. See the License for the
  13. // specific language governing permissions and limitations under the License.
  14. #include "layer/multiheadattention.h"
  15. #include "testutil.h"
  16. static int test_multiheadattention(const ncnn::Mat& q, const ncnn::Mat& k, const ncnn::Mat& v, int num_heads, int kdim, int vdim)
  17. {
  18. int embed_dim = q.w;
  19. ncnn::ParamDict pd;
  20. pd.set(0, embed_dim);
  21. pd.set(1, num_heads);
  22. pd.set(2, embed_dim * embed_dim);
  23. pd.set(3, kdim);
  24. pd.set(4, vdim);
  25. std::vector<ncnn::Mat> weights(8);
  26. weights[0] = RandomMat(embed_dim * embed_dim);
  27. weights[1] = RandomMat(embed_dim);
  28. weights[2] = RandomMat(embed_dim * kdim);
  29. weights[3] = RandomMat(embed_dim);
  30. weights[4] = RandomMat(embed_dim * vdim);
  31. weights[5] = RandomMat(embed_dim);
  32. weights[6] = RandomMat(embed_dim * embed_dim);
  33. weights[7] = RandomMat(embed_dim);
  34. std::vector<ncnn::Mat> as(3);
  35. as[0] = q;
  36. as[1] = k;
  37. as[2] = v;
  38. float epsilon = 0.005;
  39. int ret = test_layer<ncnn::MultiHeadAttention>("MultiHeadAttention", pd, weights, as, 1, epsilon);
  40. if (ret != 0)
  41. {
  42. fprintf(stderr, "test_multiheadattention failed q=(%d %d) k=(%d %d) v=(%d %d)\n", q.w, q.h, k.w, k.h, v.w, v.h);
  43. }
  44. return ret;
  45. }
  46. static int test_multiheadattention_samekv(const ncnn::Mat& q, const ncnn::Mat& kv, int num_heads, int kvdim)
  47. {
  48. int embed_dim = q.w;
  49. ncnn::ParamDict pd;
  50. pd.set(0, embed_dim);
  51. pd.set(1, num_heads);
  52. pd.set(2, embed_dim * embed_dim);
  53. pd.set(3, kvdim);
  54. pd.set(4, kvdim);
  55. std::vector<ncnn::Mat> weights(8);
  56. weights[0] = RandomMat(embed_dim * embed_dim);
  57. weights[1] = RandomMat(embed_dim);
  58. weights[2] = RandomMat(embed_dim * kvdim);
  59. weights[3] = RandomMat(embed_dim);
  60. weights[4] = RandomMat(embed_dim * kvdim);
  61. weights[5] = RandomMat(embed_dim);
  62. weights[6] = RandomMat(embed_dim * embed_dim);
  63. weights[7] = RandomMat(embed_dim);
  64. std::vector<ncnn::Mat> as(2);
  65. as[0] = q;
  66. as[1] = kv;
  67. float epsilon = 0.005;
  68. int ret = test_layer<ncnn::MultiHeadAttention>("MultiHeadAttention", pd, weights, as, 1, epsilon);
  69. if (ret != 0)
  70. {
  71. fprintf(stderr, "test_multiheadattention_samekv failed q=(%d %d) kv=(%d %d)\n", q.w, q.h, kv.w, kv.h);
  72. }
  73. return ret;
  74. }
  75. static int test_multiheadattention_sameqkv(const ncnn::Mat& a, int num_heads)
  76. {
  77. int embed_dim = a.w;
  78. ncnn::ParamDict pd;
  79. pd.set(0, embed_dim);
  80. pd.set(1, num_heads);
  81. pd.set(2, embed_dim * embed_dim);
  82. std::vector<ncnn::Mat> weights(8);
  83. weights[0] = RandomMat(embed_dim * embed_dim);
  84. weights[1] = RandomMat(embed_dim);
  85. weights[2] = RandomMat(embed_dim * embed_dim);
  86. weights[3] = RandomMat(embed_dim);
  87. weights[4] = RandomMat(embed_dim * embed_dim);
  88. weights[5] = RandomMat(embed_dim);
  89. weights[6] = RandomMat(embed_dim * embed_dim);
  90. weights[7] = RandomMat(embed_dim);
  91. std::vector<ncnn::Mat> as(1);
  92. as[0] = a;
  93. float epsilon = 0.005;
  94. int ret = test_layer<ncnn::MultiHeadAttention>("MultiHeadAttention", pd, weights, as, 1, epsilon);
  95. if (ret != 0)
  96. {
  97. fprintf(stderr, "test_multiheadattention_sameqkv failed a=(%d %d)\n", a.w, a.h);
  98. }
  99. return ret;
  100. }
  101. static int test_multiheadattention_0()
  102. {
  103. return 0
  104. || test_multiheadattention(RandomMat(64, 128), RandomMat(64, 128), RandomMat(64, 128), 4, 64, 64)
  105. || test_multiheadattention(RandomMat(64, 127), RandomMat(64, 127), RandomMat(64, 127), 16, 64, 64)
  106. || test_multiheadattention(RandomMat(16, 128), RandomMat(44, 128), RandomMat(55, 128), 2, 44, 55)
  107. || test_multiheadattention(RandomMat(16, 128), RandomMat(44, 127), RandomMat(55, 127), 4, 44, 55)
  108. || test_multiheadattention(RandomMat(12, 17), RandomMat(28, 127), RandomMat(32, 127), 3, 28, 32)
  109. || test_multiheadattention(RandomMat(12, 17), RandomMat(28, 32), RandomMat(11, 32), 3, 28, 11);
  110. }
  111. static int test_multiheadattention_1()
  112. {
  113. return 0
  114. || test_multiheadattention_samekv(RandomMat(64, 128), RandomMat(64, 128), 4, 64)
  115. || test_multiheadattention_samekv(RandomMat(64, 127), RandomMat(64, 127), 16, 64)
  116. || test_multiheadattention_samekv(RandomMat(16, 128), RandomMat(44, 128), 2, 44)
  117. || test_multiheadattention_samekv(RandomMat(16, 128), RandomMat(22, 127), 4, 22)
  118. || test_multiheadattention_samekv(RandomMat(12, 17), RandomMat(28, 127), 3, 28)
  119. || test_multiheadattention_samekv(RandomMat(12, 17), RandomMat(11, 32), 3, 11);
  120. }
  121. static int test_multiheadattention_2()
  122. {
  123. return 0
  124. || test_multiheadattention_sameqkv(RandomMat(64, 128), 8)
  125. || test_multiheadattention_sameqkv(RandomMat(64, 127), 32);
  126. }
  127. int main()
  128. {
  129. SRAND(7767517);
  130. return 0
  131. || test_multiheadattention_0()
  132. || test_multiheadattention_1()
  133. || test_multiheadattention_2();
  134. }