|
|
|
@ -151,9 +151,9 @@ void Row8x8Major2RowMajor(float *src_ptr, float *dst_ptr, size_t row, size_t col
|
|
|
|
|
"mov x10, %[src_c] \n"
|
|
|
|
|
"mov x11, %[dst_c] \n"
|
|
|
|
|
|
|
|
|
|
"Loop8x8: \n"
|
|
|
|
|
"1: \n"
|
|
|
|
|
"cmp x0, x1 \n"
|
|
|
|
|
"beq End \n"
|
|
|
|
|
"beq 2f \n"
|
|
|
|
|
|
|
|
|
|
"ld1 {v0.4s}, [x10], #16\n"
|
|
|
|
|
"ld1 {v1.4s}, [x10], #16\n"
|
|
|
|
@ -190,9 +190,9 @@ void Row8x8Major2RowMajor(float *src_ptr, float *dst_ptr, size_t row, size_t col
|
|
|
|
|
"st1 {v13.4s}, [x11], %[offset]\n"
|
|
|
|
|
"st1 {v14.4s}, [x11], #16\n"
|
|
|
|
|
"st1 {v15.4s}, [x11], %[offset]\n"
|
|
|
|
|
"b Loop8x8\n"
|
|
|
|
|
"b 1b\n"
|
|
|
|
|
|
|
|
|
|
"End:\n"
|
|
|
|
|
"2:\n"
|
|
|
|
|
|
|
|
|
|
:
|
|
|
|
|
: [ dst_c ] "r"(dst_c), [ src_c ] "r"(src_c), [ offset ] "r"(offset), [ row_8div ] "r"(row_8div)
|
|
|
|
|