|
|
|
@@ -514,14 +514,15 @@ void MaxPoolingOptInt8(const int8_t *input_ptr, int8_t *output_ptr, PoolingParam |
|
|
|
#ifdef ENABLE_NEON |
|
|
|
int c16 = real_channel / 16 * 16; |
|
|
|
int c8 = real_channel / 8 * 8; |
|
|
|
int8_t *tmp_out_data = out_data; |
|
|
|
for (; j < c16; j += 16) { |
|
|
|
vst1q_s8(out_data, vld1q_s8(out_array + j)); |
|
|
|
out_data += 16; |
|
|
|
vst1q_s8(tmp_out_data, vld1q_s8(out_array + j)); |
|
|
|
tmp_out_data += 16; |
|
|
|
} // 16 channel loop |
|
|
|
|
|
|
|
for (; j < c8; j += 8) { |
|
|
|
vst1_s8(out_data, vld1_s8(out_array + j)); |
|
|
|
out_data += 8; |
|
|
|
vst1_s8(tmp_out_data, vld1_s8(out_array + j)); |
|
|
|
tmp_out_data += 8; |
|
|
|
} // 8 channel loop |
|
|
|
#endif |
|
|
|
for (; j < real_channel; ++j) { |
|
|
|
|