|
|
|
@@ -41,10 +41,12 @@ TEST_F(CUDA, BENCHMARK_CONVOLUTION_8X8X32) |
|
|
|
auto time_in_ms_float = benchmarker.set_param(param_float) |
|
|
|
.set_dtype(0, dtype::Float32()) |
|
|
|
.set_dtype(1, dtype::Float32()) |
|
|
|
.set_dtype(2, dtype::Float32()) |
|
|
|
.execs({src_float, filter_float, {}}); |
|
|
|
auto time_in_ms_int = benchmarker.set_param(param_int) |
|
|
|
.set_dtype(0, dtype::Int8()) |
|
|
|
.set_dtype(1, dtype::Int8()) |
|
|
|
.set_dtype(2, dtype::Int32()) |
|
|
|
.execs({src_int, filter_int, {}}); |
|
|
|
std::cout << "1x1: N=" << N << " OC=" << OC << " IC=" << IC |
|
|
|
<< " H=" << H << " W=" << W |
|
|
|
@@ -67,10 +69,12 @@ TEST_F(CUDA, BENCHMARK_CONVOLUTION_8X8X32) |
|
|
|
auto time_in_ms_float = benchmarker.set_param(param_float) |
|
|
|
.set_dtype(0, dtype::Float32()) |
|
|
|
.set_dtype(1, dtype::Float32()) |
|
|
|
.set_dtype(2, dtype::Float32()) |
|
|
|
.execs({src_float, filter_float, {}}); |
|
|
|
auto time_in_ms_int = benchmarker.set_param(param_int) |
|
|
|
.set_dtype(0, dtype::Int8()) |
|
|
|
.set_dtype(1, dtype::Int8()) |
|
|
|
.set_dtype(2, dtype::Int32()) |
|
|
|
.execs({src_int, filter_int, {}}); |
|
|
|
std::cout << "chanwise: N=" << N << " C=" << C |
|
|
|
<< " H=" << H << " W=" << W << " F=" << F |
|
|
|
|