// Tencent is pleased to support the open source community by making ncnn available. // // Copyright (C) 2021 THL A29 Limited, a Tencent company. All rights reserved. // // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except // in compliance with the License. You may obtain a copy of the License at // // https://opensource.org/licenses/BSD-3-Clause // // Unless required by applicable law or agreed to in writing, software distributed // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR // CONDITIONS OF ANY KIND, either express or implied. See the License for the // specific language governing permissions and limitations under the License. #include "layer/multiheadattention.h" #include "testutil.h" static int test_multiheadattention(const ncnn::Mat& q, const ncnn::Mat& k, const ncnn::Mat& v, int num_heads, int kdim, int vdim) { int embed_dim = q.w; ncnn::ParamDict pd; pd.set(0, embed_dim); pd.set(1, num_heads); pd.set(2, embed_dim * embed_dim); pd.set(3, kdim); pd.set(4, vdim); std::vector weights(8); weights[0] = RandomMat(embed_dim * embed_dim); weights[1] = RandomMat(embed_dim); weights[2] = RandomMat(embed_dim * kdim); weights[3] = RandomMat(embed_dim); weights[4] = RandomMat(embed_dim * vdim); weights[5] = RandomMat(embed_dim); weights[6] = RandomMat(embed_dim * embed_dim); weights[7] = RandomMat(embed_dim); std::vector as(3); as[0] = q; as[1] = k; as[2] = v; int ret = test_layer("MultiHeadAttention", pd, weights, as); if (ret != 0) { fprintf(stderr, "test_multiheadattention failed q=(%d %d) k=(%d %d) v=(%d %d)\n", q.w, q.h, k.w, k.h, v.w, v.h); } return ret; } static int test_multiheadattention_samekv(const ncnn::Mat& q, const ncnn::Mat& kv, int num_heads, int kvdim) { int embed_dim = q.w; ncnn::ParamDict pd; pd.set(0, embed_dim); pd.set(1, num_heads); pd.set(2, embed_dim * embed_dim); pd.set(3, kvdim); pd.set(4, kvdim); std::vector weights(8); weights[0] = RandomMat(embed_dim * embed_dim); weights[1] = RandomMat(embed_dim); weights[2] = RandomMat(embed_dim * kvdim); weights[3] = RandomMat(embed_dim); weights[4] = RandomMat(embed_dim * kvdim); weights[5] = RandomMat(embed_dim); weights[6] = RandomMat(embed_dim * embed_dim); weights[7] = RandomMat(embed_dim); std::vector as(2); as[0] = q; as[1] = kv; int ret = test_layer("MultiHeadAttention", pd, weights, as); if (ret != 0) { fprintf(stderr, "test_multiheadattention failed q=(%d %d) kv=(%d %d)\n", q.w, q.h, kv.w, kv.h); } return ret; } static int test_multiheadattention_sameqkv(const ncnn::Mat& a, int num_heads) { int embed_dim = a.w; ncnn::ParamDict pd; pd.set(0, embed_dim); pd.set(1, num_heads); pd.set(2, embed_dim * embed_dim); std::vector weights(8); weights[0] = RandomMat(embed_dim * embed_dim); weights[1] = RandomMat(embed_dim); weights[2] = RandomMat(embed_dim * embed_dim); weights[3] = RandomMat(embed_dim); weights[4] = RandomMat(embed_dim * embed_dim); weights[5] = RandomMat(embed_dim); weights[6] = RandomMat(embed_dim * embed_dim); weights[7] = RandomMat(embed_dim); std::vector as(1); as[0] = a; int ret = test_layer("MultiHeadAttention", pd, weights, as); if (ret != 0) { fprintf(stderr, "test_multiheadattention failed a=(%d %d)\n", a.w, a.h); } return ret; } static int test_multiheadattention_0() { return 0 || test_multiheadattention(RandomMat(64, 128), RandomMat(64, 128), RandomMat(64, 128), 4, 64, 64) || test_multiheadattention(RandomMat(64, 127), RandomMat(64, 127), RandomMat(64, 127), 16, 64, 64) || test_multiheadattention(RandomMat(16, 128), RandomMat(44, 128), RandomMat(55, 128), 2, 44, 55) || test_multiheadattention(RandomMat(16, 128), RandomMat(44, 127), RandomMat(55, 127), 4, 44, 55) || test_multiheadattention(RandomMat(12, 17), RandomMat(28, 127), RandomMat(32, 127), 3, 28, 32) || test_multiheadattention(RandomMat(12, 17), RandomMat(28, 32), RandomMat(11, 32), 3, 28, 11); } static int test_multiheadattention_1() { return 0 || test_multiheadattention_samekv(RandomMat(64, 128), RandomMat(64, 128), 4, 64) || test_multiheadattention_samekv(RandomMat(64, 127), RandomMat(64, 127), 16, 64) || test_multiheadattention_samekv(RandomMat(16, 128), RandomMat(44, 128), 2, 44) || test_multiheadattention_samekv(RandomMat(16, 128), RandomMat(22, 127), 4, 22) || test_multiheadattention_samekv(RandomMat(12, 17), RandomMat(28, 127), 3, 28) || test_multiheadattention_samekv(RandomMat(12, 17), RandomMat(11, 32), 3, 11); } static int test_multiheadattention_2() { return 0 || test_multiheadattention_sameqkv(RandomMat(64, 128), 8) || test_multiheadattention_sameqkv(RandomMat(64, 127), 32); } int main() { SRAND(7767517); return 0 || test_multiheadattention_0() || test_multiheadattention_1() || test_multiheadattention_2(); }