diff options
author | Arun Raghavan <arun.raghavan@collabora.co.uk> | 2011-04-17 15:28:15 +0530 |
---|---|---|
committer | Colin Guthrie <colin@mageia.org> | 2011-04-18 10:31:51 +0200 |
commit | 0b2457432a95fc3b0ffdca815d14a7576a6d4b67 (patch) | |
tree | 375ad2e18170656878c86a20b34726a3a3cd6819 /src/pulsecore/svolume_sse.c | |
parent | 837e0a960630251ce30c124da5e65079b748d978 (diff) |
volume: Get more data from volume tests
This makes the volume tests run in two nested loops and print the minimum,
maximum and standard deviation of the inner loop's timings, measured once
per outer-loop iteration. This makes it easier to reason about performance
drops (i.e. algorithmic problems vs. other system issues such as processor contention).
Diffstat (limited to 'src/pulsecore/svolume_sse.c')
-rw-r--r-- | src/pulsecore/svolume_sse.c | 46 |
1 files changed, 34 insertions, 12 deletions
diff --git a/src/pulsecore/svolume_sse.c b/src/pulsecore/svolume_sse.c index ef07a243..8fed69b2 100644 --- a/src/pulsecore/svolume_sse.c +++ b/src/pulsecore/svolume_sse.c @@ -253,6 +253,7 @@ static void pa_volume_s16re_sse2(int16_t *samples, int32_t *volumes, unsigned ch #define CHANNELS 2 #define SAMPLES 1022 #define TIMES 1000 +#define TIMES2 100 #define PADDING 16 static void run_test(void) { @@ -263,6 +264,9 @@ static void run_test(void) { int i, j, padding; pa_do_volume_func_t func; pa_usec_t start, stop; + int k; + pa_usec_t min = INT_MAX, max = 0; + double s1 = 0, s2 = 0; func = pa_get_volume_func(PA_SAMPLE_S16NE); @@ -286,21 +290,39 @@ static void run_test(void) { } } - start = pa_rtclock_now(); - for (j = 0; j < TIMES; j++) { - memcpy(samples, samples_orig, sizeof(samples)); - pa_volume_s16ne_sse2(samples, volumes, CHANNELS, sizeof(samples)); + for (k = 0; k < TIMES2; k++) { + start = pa_rtclock_now(); + for (j = 0; j < TIMES; j++) { + memcpy(samples, samples_orig, sizeof(samples)); + pa_volume_s16ne_sse2(samples, volumes, CHANNELS, sizeof(samples)); + } + stop = pa_rtclock_now(); + + if (min > (stop - start)) min = stop - start; + if (max < (stop - start)) max = stop - start; + s1 += stop - start; + s2 += (stop - start) * (stop - start); } - stop = pa_rtclock_now(); - pa_log_info("SSE: %llu usec.", (long long unsigned int)(stop - start)); + pa_log_info("SSE: %llu usec (min = %llu, max = %llu, stddev = %g).", (long long unsigned int)s1, + (long long unsigned int)min, (long long unsigned int)max, sqrt(TIMES2 * s2 - s1 * s1) / TIMES2); + + min = INT_MAX; max = 0; + s1 = s2 = 0; + for (k = 0; k < TIMES2; k++) { + start = pa_rtclock_now(); + for (j = 0; j < TIMES; j++) { + memcpy(samples_ref, samples_orig, sizeof(samples)); + func(samples_ref, volumes, CHANNELS, sizeof(samples)); + } + stop = pa_rtclock_now(); - start = pa_rtclock_now(); - for (j = 0; j < TIMES; j++) { - memcpy(samples_ref, samples_orig, sizeof(samples)); - func(samples_ref, volumes, CHANNELS, 
sizeof (samples)); + if (min > (stop - start)) min = stop - start; + if (max < (stop - start)) max = stop - start; + s1 += stop - start; + s2 += (stop - start) * (stop - start); } - stop = pa_rtclock_now(); - pa_log_info("ref: %llu usec.", (long long unsigned int)(stop - start)); + pa_log_info("ref: %llu usec (min = %llu, max = %llu, stddev = %g).", (long long unsigned int)s1, + (long long unsigned int)min, (long long unsigned int)max, sqrt(TIMES2 * s2 - s1 * s1) / TIMES2); pa_assert_se(memcmp(samples_ref, samples, sizeof(samples)) == 0); } |