/* pulseaudio/src/pulsecore/remap_sse.c (159 lines, 6.3 KiB, C) */

/***
This file is part of PulseAudio.
Copyright 2004-2006 Lennart Poettering
Copyright 2009 Wim Taymans <wim.taymans@collabora.co.uk.com>
PulseAudio is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published
by the Free Software Foundation; either version 2.1 of the License,
or (at your option) any later version.
PulseAudio is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
General Public License for more details.
You should have received a copy of the GNU Lesser General Public License
along with PulseAudio; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
USA.
***/
#ifdef HAVE_CONFIG_H
#include <config.h>
#endif
#include <pulse/sample.h>
#include <pulse/volume.h>
#include <pulsecore/log.h>
#include <pulsecore/macro.h>
#include "cpu-x86.h"
#include "remap.h"
/* Asm fragment: load 64 bytes from the source pointer (operand %1) with four
 * unaligned 16-byte loads into xmm0/xmm2/xmm4/xmm6, then copy each of them
 * into the next odd register (xmm1/xmm3/xmm5/xmm7). The copies let
 * UNPACK_SAMPLES expand the low half from the even register and the high
 * half from the odd one. */
#define LOAD_SAMPLES \
" movdqu (%1), %%xmm0 \n\t" \
" movdqu 16(%1), %%xmm2 \n\t" \
" movdqu 32(%1), %%xmm4 \n\t" \
" movdqu 48(%1), %%xmm6 \n\t" \
" movdqa %%xmm0, %%xmm1 \n\t" \
" movdqa %%xmm2, %%xmm3 \n\t" \
" movdqa %%xmm4, %%xmm5 \n\t" \
" movdqa %%xmm6, %%xmm7 \n\t"
/* Asm fragment: interleave every register with itself so that each element
 * appears twice in a row. punpckl<s> is applied to the even registers (low
 * half of the loaded data) and punpckh<s> to the odd registers (high half).
 *
 * s - instruction suffix appended to punpckl/punpckh; this file passes `wd`
 *     (words to doubles) and `dq` (doubles to quads).
 *
 * All eight lines must stay joined by backslash continuations; a stray line
 * in the middle ends the macro early and drops the xmm7 unpack. */
#define UNPACK_SAMPLES(s) \
" punpckl"#s" %%xmm0, %%xmm0 \n\t" \
" punpckh"#s" %%xmm1, %%xmm1 \n\t" \
" punpckl"#s" %%xmm2, %%xmm2 \n\t" \
" punpckh"#s" %%xmm3, %%xmm3 \n\t" \
" punpckl"#s" %%xmm4, %%xmm4 \n\t" \
" punpckh"#s" %%xmm5, %%xmm5 \n\t" \
" punpckl"#s" %%xmm6, %%xmm6 \n\t" \
" punpckh"#s" %%xmm7, %%xmm7 \n\t"
/* Asm fragment: write xmm0..xmm7 (8 x 16 = 128 bytes) to the destination
 * pointer (operand %0) with unaligned stores, then advance the source
 * pointer (%1) by the 64 bytes consumed and the destination pointer by the
 * 128 bytes produced. */
#define STORE_SAMPLES \
" movdqu %%xmm0, (%0) \n\t" \
" movdqu %%xmm1, 16(%0) \n\t" \
" movdqu %%xmm2, 32(%0) \n\t" \
" movdqu %%xmm3, 48(%0) \n\t" \
" movdqu %%xmm4, 64(%0) \n\t" \
" movdqu %%xmm5, 80(%0) \n\t" \
" movdqu %%xmm6, 96(%0) \n\t" \
" movdqu %%xmm7, 112(%0) \n\t" \
" add $64, %1 \n\t" \
" add $128, %0 \n\t"
/* Asm fragment: handle one 4-byte sample in the tail loop. Loads 4 bytes
 * from the source pointer (%1) into xmm0, duplicates them with punpckldq,
 * stores the resulting 8 bytes to the destination pointer (%0), then
 * advances the source by 4 and the destination by 8.
 *
 * The body must directly follow the #define through backslash
 * continuations, otherwise the macro expands to nothing useful. */
#define HANDLE_SINGLE_dq() \
" movd (%1), %%xmm0 \n\t" \
" punpckldq %%xmm0, %%xmm0 \n\t" \
" movq %%xmm0, (%0) \n\t" \
" add $4, %1 \n\t" \
" add $8, %0 \n\t"
/* Asm fragment: handle one 2-byte sample in the tail loop. Loads a 16-bit
 * word from the source pointer (%1) into the low word of the scratch
 * operand %3, moves that register into xmm0, duplicates the word with
 * punpcklwd and stores the low 4 bytes to the destination pointer (%0).
 * The source then advances by 2 bytes and the destination by 4. */
#define HANDLE_SINGLE_wd() \
" movw (%1), %w3 \n\t" \
" movd %3, %%xmm0 \n\t" \
" punpcklwd %%xmm0, %%xmm0 \n\t" \
" movd %%xmm0, (%0) \n\t" \
" add $2, %1 \n\t" \
" add $4, %0 \n\t"
/* Complete asm template for duplicating every input sample into two
 * adjacent output samples.
 *
 * Operands: %0 destination pointer, %1 source pointer, %2 loop counter
 * (scratch), %3 second scratch register (used by HANDLE_SINGLE_wd),
 * %4 number of input samples.
 *
 * s     - unpack suffix, also selects HANDLE_SINGLE_<s>() for the tail.
 * shift - log2 of the number of samples consumed per unrolled iteration
 *         (one iteration reads 64 bytes, see STORE_SAMPLES).
 * mask  - (samples per unrolled iteration) - 1; the remainder handled one
 *         sample at a time.
 *
 * Labels: 1 = unrolled loop, 2 = start of tail handling, 3 = tail loop,
 * 4 = exit. Label 4 must be part of the macro because "je 4f" jumps to it
 * when there is no remainder. */
#define MONO_TO_STEREO(s,shift,mask) \
" mov %4, %2 \n\t" \
" sar $"#shift", %2 \n\t" \
" cmp $0, %2 \n\t" \
" je 2f \n\t" \
"1: \n\t" \
LOAD_SAMPLES \
UNPACK_SAMPLES(s) \
STORE_SAMPLES \
" dec %2 \n\t" \
" jne 1b \n\t" \
"2: \n\t" \
" mov %4, %2 \n\t" \
" and $"#mask", %2 \n\t" \
" je 4f \n\t" \
"3: \n\t" \
HANDLE_SINGLE_##s() \
" dec %2 \n\t" \
" jne 3b \n\t" \
"4: \n\t"
#if defined (__i386__) || defined (__amd64__)
/*
 * Expand a mono stream to stereo by writing every input sample twice,
 * using the SSE2 MONO_TO_STEREO assembly template.
 *
 * m   - remap description; only m->format is read here.
 * dst - output buffer, receives two samples for every input sample.
 * src - input buffer holding n samples.
 * n   - number of input samples.
 *
 * Only PA_SAMPLE_FLOAT32NE and PA_SAMPLE_S16NE are handled; any other
 * format reaches pa_assert_not_reached().
 */
static void remap_mono_to_stereo_sse2(pa_remap_t *m, void *dst, const void *src, unsigned n) {
    pa_reg_x86 temp, temp2;

    /* The asm reads through src and writes through dst, which the operand
     * list alone does not express (only the pointer values are operands).
     * The "memory" clobber tells the compiler that memory is accessed, so it
     * must not cache or reorder loads/stores across the statement.
     *
     * NOTE(review): the template also overwrites xmm0-xmm7 without listing
     * them as clobbers. Listing them may not be accepted when the compiler
     * itself is built/run without SSE enabled, so that is left as-is here;
     * confirm against the build flags before adding them. */
    switch (m->format) {
        case PA_SAMPLE_FLOAT32NE:
        {
            /* 64 input bytes per unrolled iteration = 16 four-byte samples */
            __asm__ __volatile__ (
                MONO_TO_STEREO(dq, 4, 15) /* do doubles to quads */
                : "+r" (dst), "+r" (src), "=&r" (temp), "=&r" (temp2)
                : "r" ((pa_reg_x86)n)
                : "cc", "memory"
            );
            break;
        }
        case PA_SAMPLE_S16NE:
        {
            /* 64 input bytes per unrolled iteration = 32 two-byte samples */
            __asm__ __volatile__ (
                MONO_TO_STEREO(wd, 5, 31) /* do words to doubles */
                : "+r" (dst), "+r" (src), "=&r" (temp), "=&r" (temp2)
                : "r" ((pa_reg_x86)n)
                : "cc", "memory"
            );
            break;
        }
        default:
            pa_assert_not_reached();
    }
}
/*
 * Set the function that will execute the remapping based on the matrices.
 *
 * m - remap description; its input/output channel counts and integer map
 *     table are inspected, and m->do_remap is overwritten when the SSE2
 *     mono-to-stereo routine applies. Otherwise m is left unchanged.
 */
static void init_remap_sse2(pa_remap_t *m) {
    unsigned n_oc, n_ic;

    n_oc = m->o_ss.channels;
    n_ic = m->i_ss.channels;

    /* find some common channel remappings, fall back to full matrix operation. */
    /* NOTE(review): 0x10000 presumably is unity gain in the integer map
     * table, i.e. the single input channel is copied unscaled to both
     * outputs; confirm against the definition of map_table_i. */
    if (n_ic == 1 && n_oc == 2 &&
            m->map_table_i[0][0] == 0x10000 && m->map_table_i[1][0] == 0x10000) {
        m->do_remap = (pa_do_remap_func_t) remap_mono_to_stereo_sse2;
        pa_log_info("Using SSE2 mono to stereo remapping");
    }
}
#endif /* defined (__i386__) || defined (__amd64__) */
/*
 * Register the SSE2 remap initialiser when the CPU supports SSE2.
 *
 * flags - CPU feature flags; only PA_CPU_X86_SSE2 is tested.
 *
 * On builds that are neither i386 nor amd64 the body is compiled out and
 * the call does nothing.
 */
void pa_remap_func_init_sse(pa_cpu_x86_flag_t flags) {
#if defined (__i386__) || defined (__amd64__)
    /* nothing to install without SSE2 */
    if (!(flags & PA_CPU_X86_SSE2))
        return;

    pa_log_info("Initialising SSE2 optimized remappers.");
    pa_set_init_remap_func((pa_init_remap_func_t) init_remap_sse2);
#endif /* defined (__i386__) || defined (__amd64__) */
}