From 9f4f374a19e808ba4f7d4bb04266526bf5ed428b Mon Sep 17 00:00:00 2001 From: Lennart Poettering Date: Thu, 3 Sep 2009 00:17:28 +0200 Subject: remap_sse: fix inner loop increment on SSE In each iteration we can process 2^4 F32NE samples and 2^5 S16NE samples, that's twice as much as in MMX, hence correct the increments. --- src/pulsecore/remap_sse.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/pulsecore/remap_sse.c b/src/pulsecore/remap_sse.c index fa21c6c8..368a3196 100644 --- a/src/pulsecore/remap_sse.c +++ b/src/pulsecore/remap_sse.c @@ -108,7 +108,7 @@ static void remap_mono_to_stereo_sse (pa_remap_t *m, void *dst, const void *src, case PA_SAMPLE_FLOAT32NE: { __asm__ __volatile__ ( - MONO_TO_STEREO(dq,3,7) /* do doubles to quads */ + MONO_TO_STEREO(dq, 4, 15) /* do doubles to quads */ : "+r" (dst), "+r" (src), "=&r" (temp), "=&r" (temp2) : "r" ((pa_reg_x86)n) : "cc" @@ -118,7 +118,7 @@ static void remap_mono_to_stereo_sse (pa_remap_t *m, void *dst, const void *src, case PA_SAMPLE_S16NE: { __asm__ __volatile__ ( - MONO_TO_STEREO(wd,4,15) /* do words to doubles */ + MONO_TO_STEREO(wd, 5, 31) /* do words to doubles */ : "+r" (dst), "+r" (src), "=&r" (temp), "=&r" (temp2) : "r" ((pa_reg_x86)n) : "cc" -- cgit