endianmacros: Replace borked PA_FLOAT32_SWAP() with PA_READ_FLOAT32RE() / PA_WRITE_FLOAT32RE()

building PA with -O0 leads to test failure in mix-test on i386

issue reported by Felipe, see
http://lists.freedesktop.org/archives/pulseaudio-discuss/2014-August/021406.html

the problem is the value 0xbeffbd7f: when byte-swapped it becomes 0x7fbdffbe and according
to IEEE-754 represents a signalling NaN (starting with s111 1111 10, see http://en.wikipedia.org/wiki/NaN)

when this value is assigned to a floating point register, it becomes 0x7ffdffbe, representing
a quiet NaN (starting with s111 1111 11) -- a signalling NaN is turned into a quiet NaN!

so PA_FLOAT32_SWAP(PA_FLOAT32_SWAP(x)) != x for certain values, uhuh!

the following test code can be used; due to volatile, it will always demonstrate the issue;
without volatile, it depends on the optimization level (i386, 32-bit, gcc 4.9):

// snip

static inline float PA_FLOAT32_SWAP(float x) {
    union {
        float f;
        uint32_t u;
    } t;

    t.f = x;
    t.u = bswap_32(t.u);
    return t.f;
}

int main() {
  unsigned x = 0xbeffbd7f;
  volatile float f = PA_FLOAT32_SWAP(*(float *)&x);
  printf("%08x %08x %08x %f\n", 0xbeffbd7f, *(unsigned *)&f, bswap_32(*(unsigned *)&f), f);
}
// snip

the problem goes away with optimization when no temporary floating point registers are used

the proposed solution is to avoid passing swapped floating point data in a
float; this is done with new functions PA_READ_FLOAT32RE() and PA_WRITE_FLOAT32RE()
which use uint32_t to dereference a pointer and byte-swap the data, hence no temporary
float variable is used

also delete PA_FLOAT32_TO_LE()/_BE(), not used

Signed-off-by: Peter Meerwald <pmeerw@pmeerw.net>
Reported-by: Felipe Sateler <fsateler@debian.org>
This commit is contained in:
Peter Meerwald 2014-09-02 23:53:09 +02:00
parent 5d7b5e509c
commit 293a1739e2
7 changed files with 32 additions and 40 deletions

View file

@ -71,15 +71,24 @@ static inline void PA_WRITE24LE(uint8_t *p, uint32_t u) {
p[0] = (uint8_t) u; p[0] = (uint8_t) u;
} }
static inline float PA_FLOAT32_SWAP(float x) { static inline float PA_READ_FLOAT32RE(const void *p) {
union {
float f;
uint32_t u;
} t;
t.u = PA_UINT32_SWAP(*(uint32_t *) p);
return t.f;
}
static inline void PA_WRITE_FLOAT32RE(void *p, float x) {
union { union {
float f; float f;
uint32_t u; uint32_t u;
} t; } t;
t.f = x; t.f = x;
t.u = PA_UINT32_SWAP(t.u); *(uint32_t *) p = PA_UINT32_SWAP(t.u);
return t.f;
} }
#define PA_MAYBE_INT16_SWAP(c,x) ((c) ? PA_INT16_SWAP(x) : (x)) #define PA_MAYBE_INT16_SWAP(c,x) ((c) ? PA_INT16_SWAP(x) : (x))
@ -88,8 +97,6 @@ static inline float PA_FLOAT32_SWAP(float x) {
#define PA_MAYBE_INT32_SWAP(c,x) ((c) ? PA_INT32_SWAP(x) : (x)) #define PA_MAYBE_INT32_SWAP(c,x) ((c) ? PA_INT32_SWAP(x) : (x))
#define PA_MAYBE_UINT32_SWAP(c,x) ((c) ? PA_UINT32_SWAP(x) : (x)) #define PA_MAYBE_UINT32_SWAP(c,x) ((c) ? PA_UINT32_SWAP(x) : (x))
#define PA_MAYBE_FLOAT32_SWAP(c,x) ((c) ? PA_FLOAT32_SWAP(x) : (x))
#ifdef WORDS_BIGENDIAN #ifdef WORDS_BIGENDIAN
#define PA_INT16_FROM_LE(x) PA_INT16_SWAP(x) #define PA_INT16_FROM_LE(x) PA_INT16_SWAP(x)
#define PA_INT16_FROM_BE(x) ((int16_t)(x)) #define PA_INT16_FROM_BE(x) ((int16_t)(x))
@ -115,9 +122,6 @@ static inline float PA_FLOAT32_SWAP(float x) {
#define PA_UINT32_TO_LE(x) PA_UINT32_SWAP(x) #define PA_UINT32_TO_LE(x) PA_UINT32_SWAP(x)
#define PA_UINT32_TO_BE(x) ((uint32_t)(x)) #define PA_UINT32_TO_BE(x) ((uint32_t)(x))
#define PA_FLOAT32_TO_LE(x) PA_FLOAT32_SWAP(x)
#define PA_FLOAT32_TO_BE(x) ((float) (x))
#define PA_READ24NE(x) PA_READ24BE(x) #define PA_READ24NE(x) PA_READ24BE(x)
#define PA_WRITE24NE(x,y) PA_WRITE24BE((x),(y)) #define PA_WRITE24NE(x,y) PA_WRITE24BE((x),(y))
@ -148,9 +152,6 @@ static inline float PA_FLOAT32_SWAP(float x) {
#define PA_UINT32_TO_LE(x) ((uint32_t)(x)) #define PA_UINT32_TO_LE(x) ((uint32_t)(x))
#define PA_UINT32_TO_BE(x) PA_UINT32_SWAP(x) #define PA_UINT32_TO_BE(x) PA_UINT32_SWAP(x)
#define PA_FLOAT32_TO_LE(x) ((float) (x))
#define PA_FLOAT32_TO_BE(x) PA_FLOAT32_SWAP(x)
#define PA_READ24NE(x) PA_READ24LE(x) #define PA_READ24NE(x) PA_READ24LE(x)
#define PA_WRITE24NE(x,y) PA_WRITE24LE((x),(y)) #define PA_WRITE24NE(x,y) PA_WRITE24LE((x),(y))

View file

@ -576,17 +576,14 @@ static void pa_mix_float32re_c(pa_mix_info streams[], unsigned nstreams, unsigne
for (i = 0; i < nstreams; i++) { for (i = 0; i < nstreams; i++) {
pa_mix_info *m = streams + i; pa_mix_info *m = streams + i;
float v, cv = m->linear[channel].f; float cv = m->linear[channel].f;
if (PA_LIKELY(cv > 0)) { if (PA_LIKELY(cv > 0))
v = PA_FLOAT32_SWAP(*(float*) m->ptr); sum += PA_READ_FLOAT32RE(m->ptr) * cv;
v *= cv;
sum += v;
}
m->ptr = (uint8_t*) m->ptr + sizeof(float); m->ptr = (uint8_t*) m->ptr + sizeof(float);
} }
*data = PA_FLOAT32_SWAP(sum); PA_WRITE_FLOAT32RE(data, sum);
if (PA_UNLIKELY(++channel >= channels)) if (PA_UNLIKELY(++channel >= channels))
channel = 0; channel = 0;

View file

@ -296,9 +296,9 @@ void pa_sample_clamp(pa_sample_format_t format, void *dst, size_t dstr, const vo
for (; n > 0; n--) { for (; n > 0; n--) {
float f; float f;
f = PA_FLOAT32_SWAP(*s); f = PA_READ_FLOAT32RE(s);
f = PA_CLAMP_UNLIKELY(f, -1.0f, 1.0f); f = PA_CLAMP_UNLIKELY(f, -1.0f, 1.0f);
*d = PA_FLOAT32_SWAP(f); PA_WRITE_FLOAT32RE(d, f);
s = (const float*) ((const uint8_t*) s + sstr); s = (const float*) ((const uint8_t*) s + sstr);
d = (float*) ((uint8_t*) d + dstr); d = (float*) ((uint8_t*) d + dstr);

View file

@ -157,8 +157,7 @@ void pa_sconv_s16le_to_float32re(unsigned n, const int16_t *a, float *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int16_t s = *(a++); int16_t s = *(a++);
float k = INT16_FROM(s) * (1.0f / (1 << 15)); float k = INT16_FROM(s) * (1.0f / (1 << 15));
k = PA_FLOAT32_SWAP(k); PA_WRITE_FLOAT32RE(b++, k);
*(b++) = k;
} }
} }
@ -169,8 +168,7 @@ void pa_sconv_s32le_to_float32re(unsigned n, const int32_t *a, float *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int32_t s = *(a++); int32_t s = *(a++);
float k = INT32_FROM(s) * (1.0f / (1U << 31)); float k = INT32_FROM(s) * (1.0f / (1U << 31));
k = PA_FLOAT32_SWAP(k); PA_WRITE_FLOAT32RE(b++, k);
*(b++) = k;
} }
} }
@ -180,8 +178,7 @@ void pa_sconv_s16le_from_float32re(unsigned n, const float *a, int16_t *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int16_t s; int16_t s;
float v = *(a++); float v = PA_READ_FLOAT32RE(a++) * (1 << 15);
v = PA_FLOAT32_SWAP(v) * (1 << 15);
s = (int16_t) PA_CLAMP_UNLIKELY(lrintf(v), -0x8000, 0x7FFF); s = (int16_t) PA_CLAMP_UNLIKELY(lrintf(v), -0x8000, 0x7FFF);
*(b++) = INT16_TO(s); *(b++) = INT16_TO(s);
} }
@ -193,8 +190,7 @@ void pa_sconv_s32le_from_float32re(unsigned n, const float *a, int32_t *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int32_t s; int32_t s;
float v = *(a++); float v = PA_READ_FLOAT32RE(a++) * (1U << 31);
v = PA_FLOAT32_SWAP(v) * (1U << 31);
s = (int32_t) PA_CLAMP_UNLIKELY(llrintf(v), -0x80000000LL, 0x7FFFFFFFLL); s = (int32_t) PA_CLAMP_UNLIKELY(llrintf(v), -0x80000000LL, 0x7FFFFFFFLL);
*(b++) = INT32_TO(s); *(b++) = INT32_TO(s);
} }
@ -325,7 +321,7 @@ void pa_sconv_s24le_to_float32re(unsigned n, const uint8_t *a, float *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int32_t s = READ24(a) << 8; int32_t s = READ24(a) << 8;
float k = s * (1.0f / (1U << 31)); float k = s * (1.0f / (1U << 31));
*b = PA_FLOAT32_SWAP(k); PA_WRITE_FLOAT32RE(b, k);
a += 3; a += 3;
b++; b++;
} }
@ -337,8 +333,7 @@ void pa_sconv_s24le_from_float32re(unsigned n, const float *a, uint8_t *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int32_t s; int32_t s;
float v = *a; float v = PA_READ_FLOAT32RE(a) * (1U << 31);
v = PA_FLOAT32_SWAP(v) * (1U << 31);
s = (int32_t) PA_CLAMP_UNLIKELY(llrint(v), -0x80000000LL, 0x7FFFFFFFLL); s = (int32_t) PA_CLAMP_UNLIKELY(llrint(v), -0x80000000LL, 0x7FFFFFFFLL);
WRITE24(b, ((uint32_t) s) >> 8); WRITE24(b, ((uint32_t) s) >> 8);
a++; a++;
@ -411,7 +406,7 @@ void pa_sconv_s24_32le_to_float32re(unsigned n, const uint32_t *a, float *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int32_t s = (int32_t) (UINT32_FROM(*a) << 8); int32_t s = (int32_t) (UINT32_FROM(*a) << 8);
float k = s * (1.0f / (1U << 31)); float k = s * (1.0f / (1U << 31));
*b = PA_FLOAT32_SWAP(k); PA_WRITE_FLOAT32RE(b, k);
a++; a++;
b++; b++;
} }
@ -437,8 +432,7 @@ void pa_sconv_s24_32le_from_float32re(unsigned n, const float *a, uint32_t *b) {
for (; n > 0; n--) { for (; n > 0; n--) {
int32_t s; int32_t s;
float v = *a; float v = PA_READ_FLOAT32RE(a) * (1U << 31);
v = PA_FLOAT32_SWAP(v) * (1U << 31);
s = (int32_t) PA_CLAMP_UNLIKELY(llrint(v), -0x80000000LL, 0x7FFFFFFFLL); s = (int32_t) PA_CLAMP_UNLIKELY(llrint(v), -0x80000000LL, 0x7FFFFFFFLL);
*b = UINT32_TO(((uint32_t) s) >> 8); *b = UINT32_TO(((uint32_t) s) >> 8);
a++; a++;

View file

@ -125,9 +125,9 @@ static void pa_volume_float32re_c(float *samples, const float *volumes, unsigned
for (channel = 0; length; length--) { for (channel = 0; length; length--) {
float t; float t;
t = PA_FLOAT32_SWAP(*samples); t = PA_READ_FLOAT32RE(samples);
t *= volumes[channel]; t *= volumes[channel];
*samples++ = PA_FLOAT32_SWAP(t); PA_WRITE_FLOAT32RE(samples++, t);
if (PA_UNLIKELY(++channel >= channels)) if (PA_UNLIKELY(++channel >= channels))
channel = 0; channel = 0;

View file

@ -150,7 +150,7 @@ static void compare_block(const pa_sample_spec *ss, const pa_memchunk *chunk, in
float *u = d; float *u = d;
for (i = 0; i < chunk->length / pa_frame_size(ss); i++) { for (i = 0; i < chunk->length / pa_frame_size(ss); i++) {
float uu = PA_MAYBE_FLOAT32_SWAP(ss->format != PA_SAMPLE_FLOAT32NE, *u); float uu = ss->format == PA_SAMPLE_FLOAT32NE ? *u : PA_READ_FLOAT32RE(u);
fail_unless(fabsf(uu - *v) <= 1e-6f, NULL); fail_unless(fabsf(uu - *v) <= 1e-6f, NULL);
++u; ++u;
++v; ++v;
@ -264,7 +264,7 @@ static pa_memblock* generate_block(pa_mempool *pool, const pa_sample_spec *ss) {
if (ss->format == PA_SAMPLE_FLOAT32RE) { if (ss->format == PA_SAMPLE_FLOAT32RE) {
float *u = d; float *u = d;
for (i = 0; i < 10; i++) for (i = 0; i < 10; i++)
u[i] = PA_FLOAT32_SWAP(float32ne_result[0][i]); PA_WRITE_FLOAT32RE(&u[i], float32ne_result[0][i]);
} else } else
memcpy(d, float32ne_result[0], sizeof(float32ne_result[0])); memcpy(d, float32ne_result[0], sizeof(float32ne_result[0]));

View file

@ -98,7 +98,7 @@ static void dump_block(const char *label, const pa_sample_spec *ss, const pa_mem
float *u = d; float *u = d;
for (i = 0; i < chunk->length / pa_frame_size(ss); i++) { for (i = 0; i < chunk->length / pa_frame_size(ss); i++) {
printf("%4.3g ", ss->format == PA_SAMPLE_FLOAT32NE ? *u : PA_FLOAT32_SWAP(*u)); printf("%4.3g ", ss->format == PA_SAMPLE_FLOAT32NE ? *u : PA_READ_FLOAT32RE(u));
u++; u++;
} }
@ -222,7 +222,7 @@ static pa_memblock* generate_block(pa_mempool *pool, const pa_sample_spec *ss) {
if (ss->format == PA_SAMPLE_FLOAT32RE) if (ss->format == PA_SAMPLE_FLOAT32RE)
for (i = 0; i < 10; i++) for (i = 0; i < 10; i++)
u[i] = PA_FLOAT32_SWAP(u[i]); PA_WRITE_FLOAT32RE(&u[i], u[i]);
break; break;
} }