summary refs log tree commit diff stats
path: root/src/pulsecore/svolume_mmx.c
diff options
context:
space:
mode:
author Arun Raghavan <arun.raghavan@collabora.co.uk> 2011-04-17 15:28:15 +0530
committer Colin Guthrie <colin@mageia.org> 2011-04-18 10:31:51 +0200
commit 0b2457432a95fc3b0ffdca815d14a7576a6d4b67 (patch)
tree 375ad2e18170656878c86a20b34726a3a3cd6819 /src/pulsecore/svolume_mmx.c
parent 837e0a960630251ce30c124da5e65079b748d978 (diff)
volume: Get more data from volume tests
This makes the volume tests run in two nested loops: the outer loop times each complete run of the inner loop, and the test prints the total time along with the minimum, maximum and standard deviation of those per-run timings. This makes it easier to reason about performance drops (i.e. algorithmic problems vs. other system issues such as processor contention).
Diffstat (limited to 'src/pulsecore/svolume_mmx.c')
-rw-r--r-- src/pulsecore/svolume_mmx.c 46
1 files changed, 34 insertions, 12 deletions
diff --git a/src/pulsecore/svolume_mmx.c b/src/pulsecore/svolume_mmx.c
index 421156ea..7286b4a2 100644
--- a/src/pulsecore/svolume_mmx.c
+++ b/src/pulsecore/svolume_mmx.c
@@ -241,6 +241,7 @@ static void pa_volume_s16re_mmx(int16_t *samples, int32_t *volumes, unsigned cha
#define CHANNELS 2
#define SAMPLES 1022
#define TIMES 1000
+#define TIMES2 100
#define PADDING 16
static void run_test(void) {
@@ -251,6 +252,9 @@ static void run_test(void) {
int i, j, padding;
pa_do_volume_func_t func;
pa_usec_t start, stop;
+ int k;
+ pa_usec_t min = INT_MAX, max = 0;
+ double s1 = 0, s2 = 0;
func = pa_get_volume_func(PA_SAMPLE_S16NE);
@@ -277,21 +281,39 @@ static void run_test(void) {
}
}
- start = pa_rtclock_now();
- for (j = 0; j < TIMES; j++) {
- memcpy(samples, samples_orig, sizeof(samples));
- pa_volume_s16ne_mmx(samples, volumes, CHANNELS, sizeof(samples));
+ for (k = 0; k < TIMES2; k++) {
+ start = pa_rtclock_now();
+ for (j = 0; j < TIMES; j++) {
+ memcpy(samples, samples_orig, sizeof(samples));
+ pa_volume_s16ne_mmx(samples, volumes, CHANNELS, sizeof(samples));
+ }
+ stop = pa_rtclock_now();
+
+ if (min > (stop - start)) min = stop - start;
+ if (max < (stop - start)) max = stop - start;
+ s1 += stop - start;
+ s2 += (stop - start) * (stop - start);
}
- stop = pa_rtclock_now();
- pa_log_info("MMX: %llu usec.", (long long unsigned int)(stop - start));
+ pa_log_info("MMX: %llu usec (min = %llu, max = %llu, stddev = %g).", (long long unsigned int)s1,
+ (long long unsigned int)min, (long long unsigned int)max, sqrt(TIMES2 * s2 - s1 * s1) / TIMES2);
+
+ min = INT_MAX; max = 0;
+ s1 = s2 = 0;
+ for (k = 0; k < TIMES2; k++) {
+ start = pa_rtclock_now();
+ for (j = 0; j < TIMES; j++) {
+ memcpy(samples_ref, samples_orig, sizeof(samples));
+ func(samples_ref, volumes, CHANNELS, sizeof(samples));
+ }
+ stop = pa_rtclock_now();
- start = pa_rtclock_now();
- for (j = 0; j < TIMES; j++) {
- memcpy(samples_ref, samples_orig, sizeof(samples));
- func(samples_ref, volumes, CHANNELS, sizeof(samples));
+ if (min > (stop - start)) min = stop - start;
+ if (max < (stop - start)) max = stop - start;
+ s1 += stop - start;
+ s2 += (stop - start) * (stop - start);
}
- stop = pa_rtclock_now();
- pa_log_info("ref: %llu usec.", (long long unsigned int)(stop - start));
+ pa_log_info("ref: %llu usec (min = %llu, max = %llu, stddev = %g).", (long long unsigned int)s1,
+ (long long unsigned int)min, (long long unsigned int)max, sqrt(TIMES2 * s2 - s1 * s1) / TIMES2);
pa_assert_se(memcmp(samples_ref, samples, sizeof(samples)) == 0);
}