Browse Source

Optimize OpenCL conv2d on Mate40

pull/14399/head
wangdongxu 4 years ago
parent
commit
8c3e9e49d2
1 changed file with 3 additions and 0 deletions
  1. +3
    -0
      mindspore/lite/src/runtime/kernel/opencl/kernel/conv2d.cc

+ 3
- 0
mindspore/lite/src/runtime/kernel/opencl/kernel/conv2d.cc View File

@@ -350,6 +350,9 @@ void Conv2DOpenCLKernel::SetGlobalLocal() {
size_t global_w = UP_DIV(OW_, block_size_.W);
size_t global_c = UP_DIV(CO_SLICES_, block_size_.C);
int local_max = filter_type_ == MemType::IMG ? 64 : 128;
if (ocl_runtime_->DeviceComputeUnits() > 16) {
local_max = 256;
}
const int local_c_max = 16;
const int OH_threshold = 100;
const int OW_threshold = 100;


Loading…
Cancel
Save