blob: 24d3917b115f320ebac4b991e31a25dacdc8ff6c [file] [log] [blame]
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +00001/*
2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11#include <math.h>
12
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +000013#include "testing/gtest/include/gtest/gtest.h"
14#include "webrtc/voice_engine/output_mixer.h"
15#include "webrtc/voice_engine/output_mixer_internal.h"
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +000016
17namespace webrtc {
18namespace voe {
19namespace {
20
21class OutputMixerTest : public ::testing::Test {
22 protected:
23 OutputMixerTest() {
24 src_frame_.sample_rate_hz_ = 16000;
25 src_frame_.samples_per_channel_ = src_frame_.sample_rate_hz_ / 100;
26 src_frame_.num_channels_ = 1;
andrew@webrtc.orgae1a58b2013-01-22 04:44:30 +000027 dst_frame_.CopyFrom(src_frame_);
28 golden_frame_.CopyFrom(src_frame_);
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +000029 }
30
31 void RunResampleTest(int src_channels, int src_sample_rate_hz,
32 int dst_channels, int dst_sample_rate_hz);
33
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +000034 PushResampler resampler_;
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +000035 AudioFrame src_frame_;
36 AudioFrame dst_frame_;
37 AudioFrame golden_frame_;
38};
39
40// Sets the signal value to increase by |data| with every sample. Floats are
41// used so non-integer values result in rounding error, but not an accumulating
42// error.
43void SetMonoFrame(AudioFrame* frame, float data, int sample_rate_hz) {
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +000044 memset(frame->data_, 0, sizeof(frame->data_));
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +000045 frame->num_channels_ = 1;
46 frame->sample_rate_hz_ = sample_rate_hz;
47 frame->samples_per_channel_ = sample_rate_hz / 100;
48 for (int i = 0; i < frame->samples_per_channel_; i++) {
49 frame->data_[i] = data * i;
50 }
51}
52
53// Keep the existing sample rate.
54void SetMonoFrame(AudioFrame* frame, float data) {
55 SetMonoFrame(frame, data, frame->sample_rate_hz_);
56}
57
58// Sets the signal value to increase by |left| and |right| with every sample in
59// each channel respectively.
60void SetStereoFrame(AudioFrame* frame, float left, float right,
61 int sample_rate_hz) {
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +000062 memset(frame->data_, 0, sizeof(frame->data_));
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +000063 frame->num_channels_ = 2;
64 frame->sample_rate_hz_ = sample_rate_hz;
65 frame->samples_per_channel_ = sample_rate_hz / 100;
66 for (int i = 0; i < frame->samples_per_channel_; i++) {
67 frame->data_[i * 2] = left * i;
68 frame->data_[i * 2 + 1] = right * i;
69 }
70}
71
72// Keep the existing sample rate.
73void SetStereoFrame(AudioFrame* frame, float left, float right) {
74 SetStereoFrame(frame, left, right, frame->sample_rate_hz_);
75}
76
77void VerifyParams(const AudioFrame& ref_frame, const AudioFrame& test_frame) {
78 EXPECT_EQ(ref_frame.num_channels_, test_frame.num_channels_);
79 EXPECT_EQ(ref_frame.samples_per_channel_, test_frame.samples_per_channel_);
80 EXPECT_EQ(ref_frame.sample_rate_hz_, test_frame.sample_rate_hz_);
81}
82
83// Computes the best SNR based on the error between |ref_frame| and
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +000084// |test_frame|. It allows for up to a |max_delay| in samples between the
85// signals to compensate for the resampling delay.
86float ComputeSNR(const AudioFrame& ref_frame, const AudioFrame& test_frame,
87 int max_delay) {
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +000088 VerifyParams(ref_frame, test_frame);
89 float best_snr = 0;
90 int best_delay = 0;
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +000091 for (int delay = 0; delay <= max_delay; delay++) {
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +000092 float mse = 0;
93 float variance = 0;
94 for (int i = 0; i < ref_frame.samples_per_channel_ *
95 ref_frame.num_channels_ - delay; i++) {
96 int error = ref_frame.data_[i] - test_frame.data_[i + delay];
97 mse += error * error;
98 variance += ref_frame.data_[i] * ref_frame.data_[i];
99 }
100 float snr = 100; // We assign 100 dB to the zero-error case.
101 if (mse > 0)
102 snr = 10 * log10(variance / mse);
103 if (snr > best_snr) {
104 best_snr = snr;
105 best_delay = delay;
106 }
107 }
108 printf("SNR=%.1f dB at delay=%d\n", best_snr, best_delay);
109 return best_snr;
110}
111
112void VerifyFramesAreEqual(const AudioFrame& ref_frame,
113 const AudioFrame& test_frame) {
114 VerifyParams(ref_frame, test_frame);
115 for (int i = 0; i < ref_frame.samples_per_channel_ * ref_frame.num_channels_;
116 i++) {
117 EXPECT_EQ(ref_frame.data_[i], test_frame.data_[i]);
118 }
119}
120
121void OutputMixerTest::RunResampleTest(int src_channels,
122 int src_sample_rate_hz,
123 int dst_channels,
124 int dst_sample_rate_hz) {
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000125 PushResampler resampler; // Create a new one with every test.
126 const int16_t kSrcLeft = 30; // Shouldn't overflow for any used sample rate.
127 const int16_t kSrcRight = 15;
128 const float resampling_factor = (1.0 * src_sample_rate_hz) /
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000129 dst_sample_rate_hz;
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000130 const float dst_left = resampling_factor * kSrcLeft;
131 const float dst_right = resampling_factor * kSrcRight;
132 const float dst_mono = (dst_left + dst_right) / 2;
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000133 if (src_channels == 1)
134 SetMonoFrame(&src_frame_, kSrcLeft, src_sample_rate_hz);
135 else
136 SetStereoFrame(&src_frame_, kSrcLeft, kSrcRight, src_sample_rate_hz);
137
138 if (dst_channels == 1) {
139 SetMonoFrame(&dst_frame_, 0, dst_sample_rate_hz);
140 if (src_channels == 1)
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000141 SetMonoFrame(&golden_frame_, dst_left, dst_sample_rate_hz);
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000142 else
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000143 SetMonoFrame(&golden_frame_, dst_mono, dst_sample_rate_hz);
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000144 } else {
145 SetStereoFrame(&dst_frame_, 0, 0, dst_sample_rate_hz);
146 if (src_channels == 1)
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000147 SetStereoFrame(&golden_frame_, dst_left, dst_left, dst_sample_rate_hz);
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000148 else
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000149 SetStereoFrame(&golden_frame_, dst_left, dst_right, dst_sample_rate_hz);
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000150 }
151
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000152 // The sinc resampler has a known delay, which we compute here. Multiplying by
153 // two gives us a crude maximum for any resampling, as the old resampler
154 // typically (but not always) has lower delay.
155 static const int kInputKernelDelaySamples = 16;
156 const int max_delay = static_cast<double>(dst_sample_rate_hz)
157 / src_sample_rate_hz * kInputKernelDelaySamples * dst_channels * 2;
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000158 printf("(%d, %d Hz) -> (%d, %d Hz) ", // SNR reported on the same line later.
159 src_channels, src_sample_rate_hz, dst_channels, dst_sample_rate_hz);
160 EXPECT_EQ(0, RemixAndResample(src_frame_, &resampler, &dst_frame_));
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000161 EXPECT_GT(ComputeSNR(golden_frame_, dst_frame_, max_delay), 39.0f);
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000162}
163
164TEST_F(OutputMixerTest, RemixAndResampleCopyFrameSucceeds) {
165 // Stereo -> stereo.
166 SetStereoFrame(&src_frame_, 10, 10);
167 SetStereoFrame(&dst_frame_, 0, 0);
168 EXPECT_EQ(0, RemixAndResample(src_frame_, &resampler_, &dst_frame_));
169 VerifyFramesAreEqual(src_frame_, dst_frame_);
170
171 // Mono -> mono.
172 SetMonoFrame(&src_frame_, 20);
173 SetMonoFrame(&dst_frame_, 0);
174 EXPECT_EQ(0, RemixAndResample(src_frame_, &resampler_, &dst_frame_));
175 VerifyFramesAreEqual(src_frame_, dst_frame_);
176}
177
178TEST_F(OutputMixerTest, RemixAndResampleMixingOnlySucceeds) {
179 // Stereo -> mono.
180 SetStereoFrame(&dst_frame_, 0, 0);
181 SetMonoFrame(&src_frame_, 10);
182 SetStereoFrame(&golden_frame_, 10, 10);
183 EXPECT_EQ(0, RemixAndResample(src_frame_, &resampler_, &dst_frame_));
184 VerifyFramesAreEqual(dst_frame_, golden_frame_);
185
186 // Mono -> stereo.
187 SetMonoFrame(&dst_frame_, 0);
188 SetStereoFrame(&src_frame_, 10, 20);
189 SetMonoFrame(&golden_frame_, 15);
190 EXPECT_EQ(0, RemixAndResample(src_frame_, &resampler_, &dst_frame_));
191 VerifyFramesAreEqual(golden_frame_, dst_frame_);
192}
193
194TEST_F(OutputMixerTest, RemixAndResampleSucceeds) {
andrew@webrtc.org50b2efe2013-04-29 17:27:29 +0000195 // TODO(ajm): convert this to the parameterized TEST_P style used in
196 // sinc_resampler_unittest.cc. We can then easily add tighter SNR thresholds.
197 const int kSampleRates[] = {8000, 16000, 32000, 44100, 48000, 96000};
andrew@webrtc.org4ecea3e2012-06-27 03:25:31 +0000198 const int kSampleRatesSize = sizeof(kSampleRates) / sizeof(*kSampleRates);
199 const int kChannels[] = {1, 2};
200 const int kChannelsSize = sizeof(kChannels) / sizeof(*kChannels);
201 for (int src_rate = 0; src_rate < kSampleRatesSize; src_rate++) {
202 for (int dst_rate = 0; dst_rate < kSampleRatesSize; dst_rate++) {
203 for (int src_channel = 0; src_channel < kChannelsSize; src_channel++) {
204 for (int dst_channel = 0; dst_channel < kChannelsSize; dst_channel++) {
205 RunResampleTest(kChannels[src_channel], kSampleRates[src_rate],
206 kChannels[dst_channel], kSampleRates[dst_rate]);
207 }
208 }
209 }
210 }
211}
212
213} // namespace
214} // namespace voe
215} // namespace webrtc