resample: load more data per instruction on aarch64 (four-register ld1, 64 bytes per load instead of two 32-byte loads) because we can

This commit is contained in:
Wim Taymans 2020-06-19 11:47:57 +02:00
parent ecead2b7e4
commit 4be29c1124

View file

@ -43,10 +43,8 @@ static void inner_product_neon(float *d, const float * SPA_RESTRICT s,
" bne 4f\n" " bne 4f\n"
" b 5f\n" " b 5f\n"
"1:" "1:"
" ld1 {v4.4s, v5.4s}, [%[taps]], #32\n" " ld1 {v4.4s, v5.4s, v6.4s, v7.4s}, [%[taps]], #64\n"
" ld1 {v8.4s, v9.4s}, [%[s]], #32\n" " ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [%[s]], #64\n"
" ld1 {v6.4s, v7.4s}, [%[taps]], #32\n"
" ld1 {v10.4s, v11.4s}, [%[s]], #32\n"
" subs %[n_taps], %[n_taps], #16\n" " subs %[n_taps], %[n_taps], #16\n"
" fmul v0.4s, v4.4s, v8.4s\n" " fmul v0.4s, v4.4s, v8.4s\n"
" fmul v1.4s, v5.4s, v9.4s\n" " fmul v1.4s, v5.4s, v9.4s\n"
@ -54,10 +52,8 @@ static void inner_product_neon(float *d, const float * SPA_RESTRICT s,
" fmul v3.4s, v7.4s, v11.4s\n" " fmul v3.4s, v7.4s, v11.4s\n"
" beq 3f\n" " beq 3f\n"
"2:" "2:"
" ld1 { v4.4s, v5.4s}, [%[taps]], #32\n" " ld1 {v4.4s, v5.4s, v6.4s, v7.4s}, [%[taps]], #64\n"
" ld1 { v8.4s, v9.4s}, [%[s]], #32\n" " ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [%[s]], #64\n"
" ld1 { v6.4s, v7.4s}, [%[taps]], #32\n"
" ld1 { v10.4s, v11.4s}, [%[s]], #32\n"
" subs %[n_taps], %[n_taps], #16\n" " subs %[n_taps], %[n_taps], #16\n"
" fmla v0.4s, v4.4s, v8.4s\n" " fmla v0.4s, v4.4s, v8.4s\n"
" fmla v1.4s, v5.4s, v9.4s\n" " fmla v1.4s, v5.4s, v9.4s\n"