|
|
|
@@ -101,7 +101,7 @@ class BiasAddGradGpuKernel : public GpuKernel { |
|
|
|
cudnnSetTensorNdDescriptorEx(db_desc_, CUDNN_TENSOR_NCHW, cudnn_data_type_, SizeToInt(cudnn_dims), db_dims.get()), |
|
|
|
"cudnnSetTensorNdDescriptor failed"); |
|
|
|
CHECK_CUDNN_RET_WITH_EXCEPT( |
|
|
|
cudnnSetReduceTensorDescriptor(op_desc_, CUDNN_REDUCE_TENSOR_ADD, cudnn_data_type_, CUDNN_NOT_PROPAGATE_NAN, |
|
|
|
cudnnSetReduceTensorDescriptor(op_desc_, CUDNN_REDUCE_TENSOR_ADD, CUDNN_DATA_FLOAT, CUDNN_NOT_PROPAGATE_NAN, |
|
|
|
CUDNN_REDUCE_TENSOR_NO_INDICES, CUDNN_32BIT_INDICES), |
|
|
|
"cudnnSetReduceTensorDescriptor failed"); |
|
|
|
|
|
|
|
|