From 6dc0c0b9cc5205619824168939f3bc461e6dbc8e Mon Sep 17 00:00:00 2001 From: Megvii Engine Team Date: Thu, 10 Mar 2022 11:50:09 +0800 Subject: [PATCH] fix(dnn): fix the sync problem in some kernels by replacing unchecked cudaMemset with cuda_check(cudaMemsetAsync(..., stream)) GitOrigin-RevId: df3f7dc51bdc1d8ad8073c491b522c769291c5f6 --- .../cuda/convolution3d/backward_filter/inplace_matmul_impl.cu | 3 ++- dnn/src/cuda/padding/padding.cu | 2 +- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/dnn/src/cuda/convolution3d/backward_filter/inplace_matmul_impl.cu b/dnn/src/cuda/convolution3d/backward_filter/inplace_matmul_impl.cu index 9188ff7b..0f06a3fe 100644 --- a/dnn/src/cuda/convolution3d/backward_filter/inplace_matmul_impl.cu +++ b/dnn/src/cuda/convolution3d/backward_filter/inplace_matmul_impl.cu @@ -355,7 +355,8 @@ void convolution3d::exec_inplace_matmul_bwd_filter( } else { BX = BY = 16; } - cudaMemset(grad, 0, OC * IC * FD * FH * FW * sizeof(float)); + cuda_check( + cudaMemsetAsync(grad, 0, OC * IC * FD * FH * FW * sizeof(float), stream)); dim3 blocks(DIVUP(n, 4 * BX), DIVUP(m, 4 * BY), N); dim3 threads(BX, BY); #define DISPATCH_BX_BY(BX, BY) \ diff --git a/dnn/src/cuda/padding/padding.cu b/dnn/src/cuda/padding/padding.cu index 5b4678cd..3e1147ed 100644 --- a/dnn/src/cuda/padding/padding.cu +++ b/dnn/src/cuda/padding/padding.cu @@ -224,7 +224,7 @@ void padding_backward_proxy( params.offsets[i * 2 + 1] = offsets[i * 2 + 1]; } - cudaMemset(dst.raw_ptr(), 0, dst.layout.access_bytes()); + cuda_check(cudaMemsetAsync(dst.raw_ptr(), 0, dst.layout.access_bytes(), stream)); void (*bwd_kern)(const size_t, const size_t, const T* const, T* const, ShapeParams);