| @@ -514,14 +514,15 @@ void MaxPoolingOptInt8(const int8_t *input_ptr, int8_t *output_ptr, PoolingParam | |||||
| #ifdef ENABLE_NEON | #ifdef ENABLE_NEON | ||||
| int c16 = real_channel / 16 * 16; | int c16 = real_channel / 16 * 16; | ||||
| int c8 = real_channel / 8 * 8; | int c8 = real_channel / 8 * 8; | ||||
| int8_t *tmp_out_data = out_data; | |||||
| for (; j < c16; j += 16) { | for (; j < c16; j += 16) { | ||||
| vst1q_s8(out_data, vld1q_s8(out_array + j)); | |||||
| out_data += 16; | |||||
| vst1q_s8(tmp_out_data, vld1q_s8(out_array + j)); | |||||
| tmp_out_data += 16; | |||||
| } // 16 channel loop | } // 16 channel loop | ||||
| for (; j < c8; j += 8) { | for (; j < c8; j += 8) { | ||||
| vst1_s8(out_data, vld1_s8(out_array + j)); | |||||
| out_data += 8; | |||||
| vst1_s8(tmp_out_data, vld1_s8(out_array + j)); | |||||
| tmp_out_data += 8; | |||||
| } // 8 channel loop | } // 8 channel loop | ||||
| #endif | #endif | ||||
| for (; j < real_channel; ++j) { | for (; j < real_channel; ++j) { | ||||