|
|
|
@ -39,6 +39,11 @@ void ConvDwInt8PostAlign4(int8_t *dst, int32_t *buffer, int num_pixels, int32_t
|
|
|
|
|
int32_t left_shift, int32_t right_shift, int32_t acc_min, int32_t acc_max);
|
|
|
|
|
void IndirectGemmInt16to32_8x4(int32_t *dst, const int16_t *src, const int16_t *weight, size_t ksize, size_t ic8,
|
|
|
|
|
size_t oc4, size_t offset);
|
|
|
|
|
void ConvDwInt8Center(int8_t *dst, const int8_t *src, const int16_t *weight, const int32_t *bias, size_t height,
|
|
|
|
|
size_t width, size_t kernel_h, size_t kernel_w, size_t out_h_step, size_t block_channel,
|
|
|
|
|
size_t in_sh_step, size_t in_sw_step, size_t in_kh_step, size_t in_kw_step, int8_t *in_zp,
|
|
|
|
|
int32_t *out_zp, int32_t *out_multiplier, int32_t *left_shift, int32_t *right_shift,
|
|
|
|
|
int32_t *acc_min, int32_t *acc_max);
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#ifdef ENABLE_ARM32
|
|
|
|
@ -59,11 +64,6 @@ void IndirectGemmInt8_4x4(int8_t *output, const int8_t *input, const int8_t *wei
|
|
|
|
|
void DeconvDwInt8Center(int32_t *dst, const int16_t *src, const int16_t *weight, size_t height, size_t width,
|
|
|
|
|
size_t kernel_h, size_t kernel_w, size_t out_h_step, size_t block_channel, size_t in_sh_step,
|
|
|
|
|
size_t in_sw_step, size_t in_kh_step, size_t in_kw_step);
|
|
|
|
|
void ConvDwInt8Center(int8_t *dst, const int8_t *src, const int16_t *weight, const int32_t *bias, size_t height,
|
|
|
|
|
size_t width, size_t kernel_h, size_t kernel_w, size_t out_h_step, size_t block_channel,
|
|
|
|
|
size_t in_sh_step, size_t in_sw_step, size_t in_kh_step, size_t in_kw_step, int8_t *in_zp,
|
|
|
|
|
int32_t *out_zp, int32_t *out_multiplier, int32_t *left_shift, int32_t *right_shift,
|
|
|
|
|
int32_t *acc_min, int32_t *acc_max);
|
|
|
|
|
void ConvDwInt8PostAlign4PerChannel(int8_t *dst, int32_t *buffer, int channel4, int32_t output_zp,
|
|
|
|
|
int32_t *out_multiplier, int32_t *left_shift, int32_t *right_shift, int32_t acc_min,
|
|
|
|
|
int32_t acc_max);
|
|
|
|
|