|
|
|
@@ -33,7 +33,7 @@ void MatMul16x8(const float16_t *a, const float16_t *b, float16_t *dst, const fl |
|
|
|
int deep, int row, int col, int stride, bool write_nhwc); |
|
|
|
|
|
|
|
void MatMulFp16(const float16_t *a, const float16_t *b, float16_t *c, const float16_t *bias, ActType act_type, |
|
|
|
int depth, int row, int col, int stride, bool write_nhwc); |
|
|
|
int depth, int row, int col, int stride, int out_type); |
|
|
|
|
|
|
|
void ColMajor2Row8MajorFp16(void *src_ptr, float16_t *dst_ptr, size_t row, size_t col, bool src_float16); |
|
|
|
|
|
|
|
@@ -43,7 +43,7 @@ void MatmulFp16Neon64(const float16_t *a, const float16_t *b, float16_t *c, cons |
|
|
|
size_t depth, size_t row, size_t col, size_t stride, bool write_nhwc); |
|
|
|
|
|
|
|
void MatmulFp16Neon64Opt(const float16_t *a, const float16_t *b, float16_t *c, const float16_t *bias, int act_type, |
|
|
|
size_t depth, size_t row, size_t col, size_t stride, int write_nhwc); |
|
|
|
size_t depth, size_t row, size_t col, size_t stride, size_t write_nhwc); |
|
|
|
|
|
|
|
void RowMajor2Col16MajorFp16(void *src, float16_t *dst, int row, int col, bool is_fp32_src); |
|
|
|
|
|
|
|
|