2009-08-25 12:27:32 +02:00
|
|
|
/***
  This file is part of PulseAudio.

  Copyright 2004-2006 Lennart Poettering
  Copyright 2009 Wim Taymans <wim.taymans@collabora.co.uk.com>

  PulseAudio is free software; you can redistribute it and/or modify
  it under the terms of the GNU Lesser General Public License as published
  by the Free Software Foundation; either version 2.1 of the License,
  or (at your option) any later version.

  PulseAudio is distributed in the hope that it will be useful, but
  WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  General Public License for more details.

  You should have received a copy of the GNU Lesser General Public License
  along with PulseAudio; if not, see <http://www.gnu.org/licenses/>.
***/
|
|
|
|
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
|
|
|
#include <config.h>
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#include <pulse/sample.h>
|
2013-03-28 14:46:49 +01:00
|
|
|
#include <pulse/volume.h>
|
2009-08-25 12:27:32 +02:00
|
|
|
#include <pulsecore/log.h>
|
|
|
|
|
#include <pulsecore/macro.h>
|
|
|
|
|
|
|
|
|
|
#include "cpu-x86.h"
|
|
|
|
|
#include "remap.h"
|
|
|
|
|
|
|
|
|
|
/* Inline-asm fragment: load 64 bytes of input.
 *
 * Reads four unaligned 16-byte vectors from the address in operand %1
 * (offsets 0, 16, 32 and 48) into xmm0, xmm2, xmm4 and xmm6, then copies
 * each of them into the following odd-numbered register (xmm1, xmm3, xmm5,
 * xmm7). After this fragment every loaded vector exists twice, so one copy
 * can be used for the low-half unpack and the other for the high-half
 * unpack. Operand %1 itself is not modified here. */
#define LOAD_SAMPLES \
    " movdqu (%1), %%xmm0 \n\t" \
    " movdqu 16(%1), %%xmm2 \n\t" \
    " movdqu 32(%1), %%xmm4 \n\t" \
    " movdqu 48(%1), %%xmm6 \n\t" \
    " movdqa %%xmm0, %%xmm1 \n\t" \
    " movdqa %%xmm2, %%xmm3 \n\t" \
    " movdqa %%xmm4, %%xmm5 \n\t" \
    " movdqa %%xmm6, %%xmm7 \n\t"
|
|
|
|
|
|
|
|
|
|
/* Inline-asm fragment: duplicate every element of xmm0..xmm7 in place.
 *
 * 's' is the punpck suffix selecting the element width ("wd" or "dq" in
 * this file). Each register is unpacked with itself, so every element ends
 * up twice in a row. Even-numbered registers take the low half of their
 * vector (punpckl), odd-numbered registers take the high half (punpckh);
 * together a register pair holds the doubled form of one 16-byte input
 * vector. */
#define UNPACK_SAMPLES(s) \
    " punpckl"#s" %%xmm0, %%xmm0 \n\t" \
    " punpckh"#s" %%xmm1, %%xmm1 \n\t" \
    " punpckl"#s" %%xmm2, %%xmm2 \n\t" \
    " punpckh"#s" %%xmm3, %%xmm3 \n\t" \
    " punpckl"#s" %%xmm4, %%xmm4 \n\t" \
    " punpckh"#s" %%xmm5, %%xmm5 \n\t" \
    " punpckl"#s" %%xmm6, %%xmm6 \n\t" \
    " punpckh"#s" %%xmm7, %%xmm7 \n\t"
|
2009-08-25 12:27:32 +02:00
|
|
|
|
|
|
|
|
/* Inline-asm fragment: store 128 bytes of output and advance both pointers.
 *
 * Writes xmm0..xmm7, in register order, as eight unaligned 16-byte vectors
 * to the address in operand %0 (offsets 0..112). Afterwards operand %1 is
 * advanced by 64 bytes and operand %0 by 128 bytes, i.e. the output grows
 * twice as fast as the input is consumed. */
#define STORE_SAMPLES \
    " movdqu %%xmm0, (%0) \n\t" \
    " movdqu %%xmm1, 16(%0) \n\t" \
    " movdqu %%xmm2, 32(%0) \n\t" \
    " movdqu %%xmm3, 48(%0) \n\t" \
    " movdqu %%xmm4, 64(%0) \n\t" \
    " movdqu %%xmm5, 80(%0) \n\t" \
    " movdqu %%xmm6, 96(%0) \n\t" \
    " movdqu %%xmm7, 112(%0) \n\t" \
    " add $64, %1 \n\t" \
    " add $128, %0 \n\t"
|
|
|
|
|
|
2009-08-29 12:22:42 +02:00
|
|
|
/* Inline-asm fragment: duplicate one 32-bit sample.
 *
 * Loads 4 bytes from the address in operand %1 into xmm0, doubles the value
 * with punpckldq, and stores the resulting 8 bytes to the address in
 * operand %0. Operand %1 is then advanced by 4 bytes and operand %0 by
 * 8 bytes. */
#define HANDLE_SINGLE_dq() \
    " movd (%1), %%xmm0 \n\t" \
    " punpckldq %%xmm0, %%xmm0 \n\t" \
    " movq %%xmm0, (%0) \n\t" \
    " add $4, %1 \n\t" \
    " add $8, %0 \n\t"
|
|
|
|
|
|
2009-08-29 12:22:42 +02:00
|
|
|
/* Inline-asm fragment: duplicate one 16-bit sample.
 *
 * Loads 2 bytes from the address in operand %1 into the low word of the
 * scratch general-purpose register operand %3, moves that register into
 * xmm0, doubles the low word with punpcklwd, and stores the resulting
 * 4 bytes to the address in operand %0. Only the low 32 bits of xmm0 are
 * stored, so whatever the upper bits of %3 held does not reach the output.
 * Operand %1 is then advanced by 2 bytes and operand %0 by 4 bytes. */
#define HANDLE_SINGLE_wd() \
    " movw (%1), %w3 \n\t" \
    " movd %3, %%xmm0 \n\t" \
    " punpcklwd %%xmm0, %%xmm0 \n\t" \
    " movd %%xmm0, (%0) \n\t" \
    " add $2, %1 \n\t" \
    " add $4, %0 \n\t"
|
|
|
|
|
|
2009-09-03 00:13:21 +02:00
|
|
|
/* Inline-asm body that duplicates every input sample into two output samples.
 *
 * Parameters:
 *   s      punpck suffix / element width selector ("wd" or "dq"); also
 *          selects the matching HANDLE_SINGLE_<s>() tail handler.
 *   shift  log2 of the number of samples consumed by one 64-byte vector
 *          iteration (the sample count is shifted right by this amount).
 *   mask   (1 << shift) - 1; selects the samples left over after the
 *          vector loop.
 *
 * Operand layout expected from the enclosing asm statement, as used by the
 * callers in this file:
 *   %0  destination pointer (read/write, advanced)
 *   %1  source pointer (read/write, advanced)
 *   %2  scratch register used as the loop counter
 *   %3  scratch register (used by HANDLE_SINGLE_wd)
 *   %4  number of input samples
 *
 * Local labels:
 *   1:  vector loop, 64 input bytes -> 128 output bytes per iteration
 *   2:  start of the remainder handling
 *   3:  one-sample-at-a-time loop for the remaining (n & mask) samples
 *   4:  done
 */
#define MONO_TO_STEREO(s,shift,mask) \
    " mov %4, %2 \n\t" \
    " sar $"#shift", %2 \n\t" \
    " cmp $0, %2 \n\t" \
    " je 2f \n\t" \
    "1: \n\t" \
    LOAD_SAMPLES \
    UNPACK_SAMPLES(s) \
    STORE_SAMPLES \
    " dec %2 \n\t" \
    " jne 1b \n\t" \
    "2: \n\t" \
    " mov %4, %2 \n\t" \
    " and $"#mask", %2 \n\t" \
    " je 4f \n\t" \
    "3: \n\t" \
    HANDLE_SINGLE_##s() \
    " dec %2 \n\t" \
    " jne 3b \n\t" \
    "4: \n\t"
|
2009-08-25 12:27:32 +02:00
|
|
|
|
2009-09-03 01:48:30 +02:00
|
|
|
#if defined (__i386__) || defined (__amd64__)
|
2014-04-27 22:22:03 +02:00
|
|
|
/* Duplicate n 16-bit mono samples from src into dst, writing every input
 * sample twice in a row (2 * n output samples in total).
 *
 * m is not used by this implementation. Samples are processed 32 at a time
 * (shift 5, mask 31) with unaligned SSE2 loads/stores, followed by a
 * one-sample loop for the remaining n & 31 samples. */
static void remap_mono_to_stereo_s16ne_sse2(pa_remap_t *m, int16_t *dst, const int16_t *src, unsigned n) {
    pa_reg_x86 temp, temp2;

    /* NOTE(review): xmm0-xmm7 are modified by the asm but are not listed as
     * clobbers; confirm that adding them builds on all supported x86
     * configurations before doing so. */
    __asm__ __volatile__ (
        MONO_TO_STEREO(wd, 5, 31) /* do words to doubles */
        : "+r" (dst), "+r" (src), "=&r" (temp), "=&r" (temp2)
        : "r" ((pa_reg_x86)n)
        /* "memory": the asm reads *src and writes *dst through the pointer
         * operands, which the compiler cannot see from the constraints. */
        : "cc", "memory"
    );
}
|
|
|
|
|
|
2019-03-26 10:35:55 +01:00
|
|
|
/* Works for both S32NE and FLOAT32NE */
|
|
|
|
|
static void remap_mono_to_stereo_any32ne_sse2(pa_remap_t *m, float *dst, const float *src, unsigned n) {
|
2014-04-16 11:58:11 +02:00
|
|
|
pa_reg_x86 temp, temp2;
|
|
|
|
|
|
|
|
|
|
__asm__ __volatile__ (
|
|
|
|
|
MONO_TO_STEREO(dq, 4, 15) /* do doubles to quads */
|
|
|
|
|
: "+r" (dst), "+r" (src), "=&r" (temp), "=&r" (temp2)
|
|
|
|
|
: "r" ((pa_reg_x86)n)
|
|
|
|
|
: "cc"
|
|
|
|
|
);
|
2009-08-25 12:27:32 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* set the function that will execute the remapping based on the matrices */
|
2011-03-02 12:41:26 +01:00
|
|
|
static void init_remap_sse2(pa_remap_t *m) {
|
2009-08-25 12:27:32 +02:00
|
|
|
unsigned n_oc, n_ic;
|
|
|
|
|
|
2014-04-16 11:25:58 +02:00
|
|
|
n_oc = m->o_ss.channels;
|
|
|
|
|
n_ic = m->i_ss.channels;
|
2009-08-25 12:27:32 +02:00
|
|
|
|
|
|
|
|
/* find some common channel remappings, fall back to full matrix operation. */
|
|
|
|
|
if (n_ic == 1 && n_oc == 2 &&
|
2014-04-16 19:24:01 +02:00
|
|
|
m->map_table_i[0][0] == 0x10000 && m->map_table_i[1][0] == 0x10000) {
|
2014-04-16 11:58:11 +02:00
|
|
|
|
2013-01-30 11:03:58 +01:00
|
|
|
pa_log_info("Using SSE2 mono to stereo remapping");
|
2014-04-27 22:22:03 +02:00
|
|
|
pa_set_remap_func(m, (pa_do_remap_func_t) remap_mono_to_stereo_s16ne_sse2,
|
2019-03-26 10:35:55 +01:00
|
|
|
(pa_do_remap_func_t) remap_mono_to_stereo_any32ne_sse2,
|
|
|
|
|
(pa_do_remap_func_t) remap_mono_to_stereo_any32ne_sse2);
|
2009-08-25 12:27:32 +02:00
|
|
|
}
|
|
|
|
|
}
|
2009-09-03 01:48:30 +02:00
|
|
|
#endif /* defined (__i386__) || defined (__amd64__) */
|
2009-08-25 12:27:32 +02:00
|
|
|
|
2011-03-02 12:41:26 +01:00
|
|
|
/* Register the SSE2 remap initialiser when the CPU supports it.
 *
 * flags: detected x86 CPU feature flags. If PA_CPU_X86_SSE2 is set,
 * init_remap_sse2 is installed via pa_set_init_remap_func(). On builds that
 * are neither i386 nor amd64 the body is compiled out and this function
 * does nothing. */
void pa_remap_func_init_sse(pa_cpu_x86_flag_t flags) {
#if defined (__i386__) || defined (__amd64__)

    if (flags & PA_CPU_X86_SSE2) {
        pa_log_info("Initialising SSE2 optimized remappers.");
        pa_set_init_remap_func ((pa_init_remap_func_t) init_remap_sse2);
    }

#endif /* defined (__i386__) || defined (__amd64__) */
}
|