|
|
|
@ -33,7 +33,7 @@ void MatMul16x8(const float16_t *a, const float16_t *b, float16_t *dst, const fl
|
|
|
|
|
int deep, int row, int col, int stride, bool write_nhwc);
|
|
|
|
|
|
|
|
|
|
void MatMulFp16(const float16_t *a, const float16_t *b, float16_t *c, const float16_t *bias, ActType act_type,
|
|
|
|
|
int depth, int row, int col, int stride, bool write_nhwc);
|
|
|
|
|
int depth, int row, int col, int stride, int out_type);
|
|
|
|
|
|
|
|
|
|
void ColMajor2Row8MajorFp16(void *src_ptr, float16_t *dst_ptr, size_t row, size_t col, bool src_float16);
|
|
|
|
|
|
|
|
|
@ -43,7 +43,7 @@ void MatmulFp16Neon64(const float16_t *a, const float16_t *b, float16_t *c, cons
|
|
|
|
|
size_t depth, size_t row, size_t col, size_t stride, bool write_nhwc);
|
|
|
|
|
|
|
|
|
|
void MatmulFp16Neon64Opt(const float16_t *a, const float16_t *b, float16_t *c, const float16_t *bias, int act_type,
|
|
|
|
|
size_t depth, size_t row, size_t col, size_t stride, int write_nhwc);
|
|
|
|
|
size_t depth, size_t row, size_t col, size_t stride, size_t write_nhwc);
|
|
|
|
|
|
|
|
|
|
void RowMajor2Col16MajorFp16(void *src, float16_t *dst, int row, int col, bool is_fp32_src);
|
|
|
|
|
|
|
|
|
|