blob: 95a2134e314345ace9b5b8173c6d7692a654c402 [file] [log] [blame]
/*
 *  Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/audio_processing/aec3/aec_state.h"
peah522d71b2017-02-23 05:16:26 -080012
Per Åhgren8ba58612017-12-01 23:01:44 +010013#include "modules/audio_processing/aec3/aec3_fft.h"
14#include "modules/audio_processing/aec3/render_delay_buffer.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020015#include "modules/audio_processing/logging/apm_data_dumper.h"
Sam Zackrisson8f736c02019-10-01 12:47:53 +020016#include "rtc_base/strings/string_builder.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020017#include "test/gtest.h"
peah522d71b2017-02-23 05:16:26 -080018
19namespace webrtc {
Sam Zackrisson8f736c02019-10-01 12:47:53 +020020namespace {
21std::string ProduceDebugText(size_t num_render_channels,
22 size_t num_capture_channels) {
23 rtc::StringBuilder ss;
24 ss << "Render channels: " << num_render_channels;
25 ss << ", Capture channels: " << num_capture_channels;
26 return ss.Release();
27}
peah522d71b2017-02-23 05:16:26 -080028
Sam Zackrisson8f736c02019-10-01 12:47:53 +020029void RunNormalUsageTest(size_t num_render_channels,
30 size_t num_capture_channels) {
31 // TODO(bugs.webrtc.org/10913): Test with different content in different
32 // channels.
Per Åhgrence202a02019-09-02 17:01:19 +020033 constexpr int kSampleRateHz = 48000;
34 constexpr size_t kNumBands = NumBandsForRate(kSampleRateHz);
peah522d71b2017-02-23 05:16:26 -080035 ApmDataDumper data_dumper(42);
Per Åhgren8ba58612017-12-01 23:01:44 +010036 EchoCanceller3Config config;
Sam Zackrisson8f736c02019-10-01 12:47:53 +020037 AecState state(config, num_capture_channels);
Danil Chapovalovdb9f7ab2018-06-19 10:50:11 +020038 absl::optional<DelayEstimate> delay_estimate =
Per Åhgren5c532d32018-03-22 00:29:25 +010039 DelayEstimate(DelayEstimate::Quality::kRefined, 10);
Per Åhgren8ba58612017-12-01 23:01:44 +010040 std::unique_ptr<RenderDelayBuffer> render_delay_buffer(
Sam Zackrisson8f736c02019-10-01 12:47:53 +020041 RenderDelayBuffer::Create(config, kSampleRateHz, num_render_channels));
peah86afe9d2017-04-06 15:45:32 -070042 std::array<float, kFftLengthBy2Plus1> E2_main = {};
43 std::array<float, kFftLengthBy2Plus1> Y2 = {};
Per Åhgrence202a02019-09-02 17:01:19 +020044 std::vector<std::vector<std::vector<float>>> x(
45 kNumBands, std::vector<std::vector<float>>(
Sam Zackrisson8f736c02019-10-01 12:47:53 +020046 num_render_channels, std::vector<float>(kBlockSize, 0.f)));
Per Åhgren8ba58612017-12-01 23:01:44 +010047 EchoPathVariability echo_path_variability(
48 false, EchoPathVariability::DelayAdjustment::kNone, false);
Sam Zackrisson8f736c02019-10-01 12:47:53 +020049 std::vector<std::array<float, kBlockSize>> y(num_capture_channels);
50 std::vector<SubtractorOutput> subtractor_output(num_capture_channels);
51 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
52 subtractor_output[ch].Reset();
53 subtractor_output[ch].s_main.fill(100.f);
54 subtractor_output[ch].e_main.fill(100.f);
55 y[ch].fill(1000.f);
56 }
Per Åhgren8ba58612017-12-01 23:01:44 +010057 Aec3Fft fft;
Sam Zackrisson46b01402019-10-08 16:17:48 +020058 std::vector<std::vector<std::array<float, kFftLengthBy2Plus1>>>
59 converged_filter_frequency_response(
60 num_capture_channels,
61 std::vector<std::array<float, kFftLengthBy2Plus1>>(10));
62 for (auto& v_ch : converged_filter_frequency_response) {
63 for (auto& v : v_ch) {
64 v.fill(0.01f);
65 }
peah522d71b2017-02-23 05:16:26 -080066 }
Sam Zackrisson46b01402019-10-08 16:17:48 +020067 std::vector<std::vector<std::array<float, kFftLengthBy2Plus1>>>
peah522d71b2017-02-23 05:16:26 -080068 diverged_filter_frequency_response = converged_filter_frequency_response;
Sam Zackrisson46b01402019-10-08 16:17:48 +020069 converged_filter_frequency_response[0][2].fill(100.f);
70 converged_filter_frequency_response[0][2][0] = 1.f;
71 std::vector<std::vector<float>> impulse_response(
72 num_capture_channels,
73 std::vector<float>(GetTimeDomainLength(config.filter.main.length_blocks),
74 0.f));
peah29103572017-07-11 02:54:02 -070075
peah522d71b2017-02-23 05:16:26 -080076 // Verify that linear AEC usability is true when the filter is converged
Per Åhgrence202a02019-09-02 17:01:19 +020077 for (size_t band = 0; band < kNumBands; ++band) {
Sam Zackrisson8f736c02019-10-01 12:47:53 +020078 for (size_t ch = 0; ch < num_render_channels; ++ch) {
79 std::fill(x[band][ch].begin(), x[band][ch].end(), 101.f);
Per Åhgrence202a02019-09-02 17:01:19 +020080 }
81 }
peah86afe9d2017-04-06 15:45:32 -070082 for (int k = 0; k < 3000; ++k) {
Per Åhgren0e6d2f52017-12-20 22:19:56 +010083 render_delay_buffer->Insert(x);
Sam Zackrisson8f736c02019-10-01 12:47:53 +020084 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
85 subtractor_output[ch].ComputeMetrics(y[ch]);
86 }
Per Åhgren5c532d32018-03-22 00:29:25 +010087 state.Update(delay_estimate, converged_filter_frequency_response,
Per Åhgrenb20b9372018-07-13 00:22:54 +020088 impulse_response, *render_delay_buffer->GetRenderBuffer(),
Sam Zackrisson8f736c02019-10-01 12:47:53 +020089 E2_main, Y2, subtractor_output);
peah522d71b2017-02-23 05:16:26 -080090 }
91 EXPECT_TRUE(state.UsableLinearEstimate());
92
Sam Zackrisson8f736c02019-10-01 12:47:53 +020093 // Verify that linear AEC usability becomes false after an echo path
94 // change is reported
95 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
96 subtractor_output[ch].ComputeMetrics(y[ch]);
97 }
Per Åhgren8ba58612017-12-01 23:01:44 +010098 state.HandleEchoPathChange(EchoPathVariability(
Per Åhgren88cf0502018-07-16 17:08:41 +020099 false, EchoPathVariability::DelayAdjustment::kBufferReadjustment, false));
Per Åhgren3ab308f2018-02-21 08:46:03 +0100100 state.Update(delay_estimate, converged_filter_frequency_response,
Per Åhgrenb20b9372018-07-13 00:22:54 +0200101 impulse_response, *render_delay_buffer->GetRenderBuffer(),
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200102 E2_main, Y2, subtractor_output);
peah522d71b2017-02-23 05:16:26 -0800103 EXPECT_FALSE(state.UsableLinearEstimate());
104
105 // Verify that the active render detection works as intended.
Per Åhgrence202a02019-09-02 17:01:19 +0200106 std::fill(x[0][0].begin(), x[0][0].end(), 101.f);
Per Åhgren0e6d2f52017-12-20 22:19:56 +0100107 render_delay_buffer->Insert(x);
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200108 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
109 subtractor_output[ch].ComputeMetrics(y[ch]);
110 }
Per Åhgren8ba58612017-12-01 23:01:44 +0100111 state.HandleEchoPathChange(EchoPathVariability(
112 true, EchoPathVariability::DelayAdjustment::kNewDetectedDelay, false));
Per Åhgren3ab308f2018-02-21 08:46:03 +0100113 state.Update(delay_estimate, converged_filter_frequency_response,
Per Åhgrenb20b9372018-07-13 00:22:54 +0200114 impulse_response, *render_delay_buffer->GetRenderBuffer(),
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200115 E2_main, Y2, subtractor_output);
peah522d71b2017-02-23 05:16:26 -0800116 EXPECT_FALSE(state.ActiveRender());
117
peah86afe9d2017-04-06 15:45:32 -0700118 for (int k = 0; k < 1000; ++k) {
Per Åhgren0e6d2f52017-12-20 22:19:56 +0100119 render_delay_buffer->Insert(x);
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200120 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
121 subtractor_output[ch].ComputeMetrics(y[ch]);
122 }
Per Åhgren5c532d32018-03-22 00:29:25 +0100123 state.Update(delay_estimate, converged_filter_frequency_response,
Per Åhgrenb20b9372018-07-13 00:22:54 +0200124 impulse_response, *render_delay_buffer->GetRenderBuffer(),
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200125 E2_main, Y2, subtractor_output);
peah86afe9d2017-04-06 15:45:32 -0700126 }
peah522d71b2017-02-23 05:16:26 -0800127 EXPECT_TRUE(state.ActiveRender());
128
peah522d71b2017-02-23 05:16:26 -0800129 // Verify that the ERL is properly estimated
Per Åhgrence202a02019-09-02 17:01:19 +0200130 for (auto& band : x) {
131 for (auto& channel : band) {
132 channel = std::vector<float>(kBlockSize, 0.f);
133 }
peah86afe9d2017-04-06 15:45:32 -0700134 }
135
Per Åhgrence202a02019-09-02 17:01:19 +0200136 x[0][0][0] = 5000.f;
Per Åhgrenc59a5762017-12-11 21:34:19 +0100137 for (size_t k = 0;
Per Åhgrenec22e3f2017-12-20 15:20:37 +0100138 k < render_delay_buffer->GetRenderBuffer()->GetFftBuffer().size(); ++k) {
Per Åhgren8ba58612017-12-01 23:01:44 +0100139 render_delay_buffer->Insert(x);
140 if (k == 0) {
141 render_delay_buffer->Reset();
142 }
Per Åhgrenc59a5762017-12-11 21:34:19 +0100143 render_delay_buffer->PrepareCaptureProcessing();
peah86afe9d2017-04-06 15:45:32 -0700144 }
145
146 Y2.fill(10.f * 10000.f * 10000.f);
147 for (size_t k = 0; k < 1000; ++k) {
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200148 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
149 subtractor_output[ch].ComputeMetrics(y[ch]);
150 }
Per Åhgren5c532d32018-03-22 00:29:25 +0100151 state.Update(delay_estimate, converged_filter_frequency_response,
Per Åhgrenb20b9372018-07-13 00:22:54 +0200152 impulse_response, *render_delay_buffer->GetRenderBuffer(),
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200153 E2_main, Y2, subtractor_output);
peah522d71b2017-02-23 05:16:26 -0800154 }
155
156 ASSERT_TRUE(state.UsableLinearEstimate());
157 const std::array<float, kFftLengthBy2Plus1>& erl = state.Erl();
peah86afe9d2017-04-06 15:45:32 -0700158 EXPECT_EQ(erl[0], erl[1]);
159 for (size_t k = 1; k < erl.size() - 1; ++k) {
160 EXPECT_NEAR(k % 2 == 0 ? 10.f : 1000.f, erl[k], 0.1);
161 }
162 EXPECT_EQ(erl[erl.size() - 2], erl[erl.size() - 1]);
peah522d71b2017-02-23 05:16:26 -0800163
164 // Verify that the ERLE is properly estimated
peah86afe9d2017-04-06 15:45:32 -0700165 E2_main.fill(1.f * 10000.f * 10000.f);
peah522d71b2017-02-23 05:16:26 -0800166 Y2.fill(10.f * E2_main[0]);
peah86afe9d2017-04-06 15:45:32 -0700167 for (size_t k = 0; k < 1000; ++k) {
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200168 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
169 subtractor_output[ch].ComputeMetrics(y[ch]);
170 }
Per Åhgren5c532d32018-03-22 00:29:25 +0100171 state.Update(delay_estimate, converged_filter_frequency_response,
Per Åhgrenb20b9372018-07-13 00:22:54 +0200172 impulse_response, *render_delay_buffer->GetRenderBuffer(),
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200173 E2_main, Y2, subtractor_output);
peah522d71b2017-02-23 05:16:26 -0800174 }
175 ASSERT_TRUE(state.UsableLinearEstimate());
peah86afe9d2017-04-06 15:45:32 -0700176 {
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200177 // Note that the render spectrum is built so it does not have energy in
178 // the odd bands but just in the even bands.
Per Åhgrenb4161d32019-10-08 12:35:47 +0200179 const auto& erle = state.Erle()[0];
peah86afe9d2017-04-06 15:45:32 -0700180 EXPECT_EQ(erle[0], erle[1]);
peah1d680892017-05-23 04:07:10 -0700181 constexpr size_t kLowFrequencyLimit = 32;
Jesús de Vicente Peñae9a7e902018-09-27 11:49:39 +0200182 for (size_t k = 2; k < kLowFrequencyLimit; k = k + 2) {
183 EXPECT_NEAR(4.f, erle[k], 0.1);
peah86afe9d2017-04-06 15:45:32 -0700184 }
Jesús de Vicente Peñae9a7e902018-09-27 11:49:39 +0200185 for (size_t k = kLowFrequencyLimit; k < erle.size() - 1; k = k + 2) {
186 EXPECT_NEAR(1.5f, erle[k], 0.1);
peah1d680892017-05-23 04:07:10 -0700187 }
peah86afe9d2017-04-06 15:45:32 -0700188 EXPECT_EQ(erle[erle.size() - 2], erle[erle.size() - 1]);
189 }
peah522d71b2017-02-23 05:16:26 -0800190
peah86afe9d2017-04-06 15:45:32 -0700191 E2_main.fill(1.f * 10000.f * 10000.f);
peah522d71b2017-02-23 05:16:26 -0800192 Y2.fill(5.f * E2_main[0]);
peah86afe9d2017-04-06 15:45:32 -0700193 for (size_t k = 0; k < 1000; ++k) {
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200194 for (size_t ch = 0; ch < num_capture_channels; ++ch) {
195 subtractor_output[ch].ComputeMetrics(y[ch]);
196 }
Per Åhgren5c532d32018-03-22 00:29:25 +0100197 state.Update(delay_estimate, converged_filter_frequency_response,
Per Åhgrenb20b9372018-07-13 00:22:54 +0200198 impulse_response, *render_delay_buffer->GetRenderBuffer(),
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200199 E2_main, Y2, subtractor_output);
peah522d71b2017-02-23 05:16:26 -0800200 }
peah86afe9d2017-04-06 15:45:32 -0700201
peah522d71b2017-02-23 05:16:26 -0800202 ASSERT_TRUE(state.UsableLinearEstimate());
peah86afe9d2017-04-06 15:45:32 -0700203 {
Per Åhgrenb4161d32019-10-08 12:35:47 +0200204 const auto& erle = state.Erle()[0];
peah86afe9d2017-04-06 15:45:32 -0700205 EXPECT_EQ(erle[0], erle[1]);
peah1d680892017-05-23 04:07:10 -0700206 constexpr size_t kLowFrequencyLimit = 32;
207 for (size_t k = 1; k < kLowFrequencyLimit; ++k) {
Per Åhgren5c532d32018-03-22 00:29:25 +0100208 EXPECT_NEAR(k % 2 == 0 ? 4.f : 1.f, erle[k], 0.1);
peah86afe9d2017-04-06 15:45:32 -0700209 }
peah1d680892017-05-23 04:07:10 -0700210 for (size_t k = kLowFrequencyLimit; k < erle.size() - 1; ++k) {
211 EXPECT_NEAR(k % 2 == 0 ? 1.5f : 1.f, erle[k], 0.1);
212 }
peah86afe9d2017-04-06 15:45:32 -0700213 EXPECT_EQ(erle[erle.size() - 2], erle[erle.size() - 1]);
214 }
peah522d71b2017-02-23 05:16:26 -0800215}
216
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200217} // namespace
218
219// Verify the general functionality of AecState
220TEST(AecState, NormalUsage) {
221 for (size_t num_render_channels : {1, 2, 8}) {
222 for (size_t num_capture_channels : {1, 2, 8}) {
223 SCOPED_TRACE(ProduceDebugText(num_render_channels, num_capture_channels));
224 RunNormalUsageTest(num_render_channels, num_capture_channels);
225 }
226 }
227}
228
peah522d71b2017-02-23 05:16:26 -0800229// Verifies the delay for a converged filter is correctly identified.
230TEST(AecState, ConvergedFilterDelay) {
Per Åhgren5c532d32018-03-22 00:29:25 +0100231 constexpr int kFilterLengthBlocks = 10;
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200232 constexpr size_t kNumCaptureChannels = 1;
Per Åhgren8ba58612017-12-01 23:01:44 +0100233 EchoCanceller3Config config;
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200234 AecState state(config, kNumCaptureChannels);
Per Åhgren8ba58612017-12-01 23:01:44 +0100235 std::unique_ptr<RenderDelayBuffer> render_delay_buffer(
Per Åhgrence202a02019-09-02 17:01:19 +0200236 RenderDelayBuffer::Create(config, 48000, 1));
Danil Chapovalovdb9f7ab2018-06-19 10:50:11 +0200237 absl::optional<DelayEstimate> delay_estimate;
peah522d71b2017-02-23 05:16:26 -0800238 std::array<float, kFftLengthBy2Plus1> E2_main;
peah522d71b2017-02-23 05:16:26 -0800239 std::array<float, kFftLengthBy2Plus1> Y2;
240 std::array<float, kBlockSize> x;
Per Åhgren8ba58612017-12-01 23:01:44 +0100241 EchoPathVariability echo_path_variability(
242 false, EchoPathVariability::DelayAdjustment::kNone, false);
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200243 std::vector<SubtractorOutput> subtractor_output(kNumCaptureChannels);
244 for (auto& output : subtractor_output) {
245 output.Reset();
246 output.s_main.fill(100.f);
247 }
Per Åhgrenb20b9372018-07-13 00:22:54 +0200248 std::array<float, kBlockSize> y;
peah522d71b2017-02-23 05:16:26 -0800249 x.fill(0.f);
Per Åhgrenb20b9372018-07-13 00:22:54 +0200250 y.fill(0.f);
peah522d71b2017-02-23 05:16:26 -0800251
Sam Zackrisson46b01402019-10-08 16:17:48 +0200252 std::vector<std::vector<std::array<float, kFftLengthBy2Plus1>>>
253 frequency_response(
254 kNumCaptureChannels,
255 std::vector<std::array<float, kFftLengthBy2Plus1>>(kFilterLengthBlocks));
256 for (auto& v_ch : frequency_response) {
257 for (auto& v : v_ch) {
258 v.fill(0.01f);
259 }
Per Åhgren5c532d32018-03-22 00:29:25 +0100260 }
peah522d71b2017-02-23 05:16:26 -0800261
Sam Zackrisson46b01402019-10-08 16:17:48 +0200262 std::vector<std::vector<float>> impulse_response(
263 kNumCaptureChannels,
264 std::vector<float>(GetTimeDomainLength(config.filter.main.length_blocks),
265 0.f));
peah29103572017-07-11 02:54:02 -0700266
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200267 // Verify that the filter delay for a converged filter is properly
268 // identified.
Per Åhgren5c532d32018-03-22 00:29:25 +0100269 for (int k = 0; k < kFilterLengthBlocks; ++k) {
Sam Zackrisson46b01402019-10-08 16:17:48 +0200270 for (auto& ir : impulse_response) {
271 std::fill(ir.begin(), ir.end(), 0.f);
272 ir[k * kBlockSize + 1] = 1.f;
273 }
Per Åhgren5c532d32018-03-22 00:29:25 +0100274
peah86afe9d2017-04-06 15:45:32 -0700275 state.HandleEchoPathChange(echo_path_variability);
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200276 subtractor_output[0].ComputeMetrics(y);
Per Åhgrenb20b9372018-07-13 00:22:54 +0200277 state.Update(delay_estimate, frequency_response, impulse_response,
Sam Zackrisson8f736c02019-10-01 12:47:53 +0200278 *render_delay_buffer->GetRenderBuffer(), E2_main, Y2,
279 subtractor_output);
peah522d71b2017-02-23 05:16:26 -0800280 }
281}
282
peah522d71b2017-02-23 05:16:26 -0800283} // namespace webrtc