blob: a0cf4f9a82f36967519e4e77e04541155b000321 [file] [log] [blame]
/*
 *  Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020010#include "modules/audio_processing/aec3/echo_canceller3.h"
peahe0eae3c2016-12-14 01:16:23 -080011
peahd0263542017-01-03 04:20:34 -080012#include <sstream>
13
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020014#include "modules/audio_processing/logging/apm_data_dumper.h"
15#include "rtc_base/atomicops.h"
Per Åhgren251c7352018-03-28 16:31:57 +020016#include "rtc_base/logging.h"
peahe0eae3c2016-12-14 01:16:23 -080017
18namespace webrtc {
19
peahd0263542017-01-03 04:20:34 -080020namespace {
21
// Identifies which API entry point was called. The integer value of the
// enumerator is what gets written to the "aec3_call_order" data dump.
enum class EchoCanceller3ApiCall {
  kCapture,
  kRender
};
23
peahd0263542017-01-03 04:20:34 -080024bool DetectSaturation(rtc::ArrayView<const float> y) {
25 for (auto y_k : y) {
peah522d71b2017-02-23 05:16:26 -080026 if (y_k >= 32700.0f || y_k <= -32700.0f) {
peahd0263542017-01-03 04:20:34 -080027 return true;
28 }
29 }
30 return false;
31}
32
Per Åhgren251c7352018-03-28 16:31:57 +020033// Method for adjusting config parameter dependencies..
34EchoCanceller3Config AdjustConfig(const EchoCanceller3Config& config) {
35 EchoCanceller3Config adjusted_cfg = config;
36
37 // Use customized parameters when the system has clock-drift.
38 if (config.echo_removal_control.has_clock_drift) {
39 RTC_LOG(LS_WARNING)
40 << "Customizing parameters to work well for the clock-drift case.";
41 if (config.ep_strength.bounded_erl) {
42 adjusted_cfg.ep_strength.default_len = 0.85f;
43 adjusted_cfg.ep_strength.lf = 0.01f;
44 adjusted_cfg.ep_strength.mf = 0.01f;
45 adjusted_cfg.ep_strength.hf = 0.01f;
46 adjusted_cfg.echo_model.render_pre_window_size = 1;
47 adjusted_cfg.echo_model.render_post_window_size = 1;
48 adjusted_cfg.echo_model.nonlinear_hold = 3;
49 adjusted_cfg.echo_model.nonlinear_release = 0.001f;
50 } else {
51 adjusted_cfg.ep_strength.bounded_erl = true;
52 adjusted_cfg.delay.down_sampling_factor = 2;
53 adjusted_cfg.ep_strength.default_len = 0.8f;
54 adjusted_cfg.ep_strength.lf = 0.01f;
55 adjusted_cfg.ep_strength.mf = 0.01f;
56 adjusted_cfg.ep_strength.hf = 0.01f;
57 adjusted_cfg.filter.main = {30, 0.1f, 0.8f, 0.001f, 20075344.f};
58 adjusted_cfg.filter.shadow = {30, 0.7f, 20075344.f};
59 adjusted_cfg.filter.main_initial = {30, 0.1f, 1.5f, 0.001f, 20075344.f};
60 adjusted_cfg.filter.shadow_initial = {30, 0.9f, 20075344.f};
61 adjusted_cfg.echo_model.render_pre_window_size = 2;
62 adjusted_cfg.echo_model.render_post_window_size = 2;
63 adjusted_cfg.echo_model.nonlinear_hold = 3;
64 adjusted_cfg.echo_model.nonlinear_release = 0.6f;
65 }
66 }
67 return adjusted_cfg;
68}
69
peahd0263542017-01-03 04:20:34 -080070void FillSubFrameView(AudioBuffer* frame,
71 size_t sub_frame_index,
72 std::vector<rtc::ArrayView<float>>* sub_frame_view) {
73 RTC_DCHECK_GE(1, sub_frame_index);
74 RTC_DCHECK_LE(0, sub_frame_index);
75 RTC_DCHECK_EQ(frame->num_bands(), sub_frame_view->size());
76 for (size_t k = 0; k < sub_frame_view->size(); ++k) {
77 (*sub_frame_view)[k] = rtc::ArrayView<float>(
78 &frame->split_bands_f(0)[k][sub_frame_index * kSubFrameLength],
79 kSubFrameLength);
80 }
81}
82
83void FillSubFrameView(std::vector<std::vector<float>>* frame,
84 size_t sub_frame_index,
85 std::vector<rtc::ArrayView<float>>* sub_frame_view) {
86 RTC_DCHECK_GE(1, sub_frame_index);
87 RTC_DCHECK_EQ(frame->size(), sub_frame_view->size());
88 for (size_t k = 0; k < frame->size(); ++k) {
89 (*sub_frame_view)[k] = rtc::ArrayView<float>(
90 &(*frame)[k][sub_frame_index * kSubFrameLength], kSubFrameLength);
91 }
92}
93
94void ProcessCaptureFrameContent(
95 AudioBuffer* capture,
peah69221db2017-01-27 03:28:19 -080096 bool level_change,
peahd0263542017-01-03 04:20:34 -080097 bool saturated_microphone_signal,
98 size_t sub_frame_index,
99 FrameBlocker* capture_blocker,
100 BlockFramer* output_framer,
101 BlockProcessor* block_processor,
102 std::vector<std::vector<float>>* block,
103 std::vector<rtc::ArrayView<float>>* sub_frame_view) {
104 FillSubFrameView(capture, sub_frame_index, sub_frame_view);
105 capture_blocker->InsertSubFrameAndExtractBlock(*sub_frame_view, block);
peah69221db2017-01-27 03:28:19 -0800106 block_processor->ProcessCapture(level_change, saturated_microphone_signal,
107 block);
peahd0263542017-01-03 04:20:34 -0800108 output_framer->InsertBlockAndExtractSubFrame(*block, sub_frame_view);
109}
110
111void ProcessRemainingCaptureFrameContent(
peah69221db2017-01-27 03:28:19 -0800112 bool level_change,
peahd0263542017-01-03 04:20:34 -0800113 bool saturated_microphone_signal,
114 FrameBlocker* capture_blocker,
115 BlockFramer* output_framer,
116 BlockProcessor* block_processor,
117 std::vector<std::vector<float>>* block) {
118 if (!capture_blocker->IsBlockAvailable()) {
119 return;
120 }
121
122 capture_blocker->ExtractBlock(block);
peah69221db2017-01-27 03:28:19 -0800123 block_processor->ProcessCapture(level_change, saturated_microphone_signal,
124 block);
peahd0263542017-01-03 04:20:34 -0800125 output_framer->InsertBlock(*block);
126}
127
peahcf02cf12017-04-05 14:18:07 -0700128void BufferRenderFrameContent(
peahd0263542017-01-03 04:20:34 -0800129 std::vector<std::vector<float>>* render_frame,
130 size_t sub_frame_index,
131 FrameBlocker* render_blocker,
132 BlockProcessor* block_processor,
133 std::vector<std::vector<float>>* block,
134 std::vector<rtc::ArrayView<float>>* sub_frame_view) {
135 FillSubFrameView(render_frame, sub_frame_index, sub_frame_view);
136 render_blocker->InsertSubFrameAndExtractBlock(*sub_frame_view, block);
peahcf02cf12017-04-05 14:18:07 -0700137 block_processor->BufferRender(*block);
peahd0263542017-01-03 04:20:34 -0800138}
139
peahcf02cf12017-04-05 14:18:07 -0700140void BufferRemainingRenderFrameContent(FrameBlocker* render_blocker,
peahd0263542017-01-03 04:20:34 -0800141 BlockProcessor* block_processor,
142 std::vector<std::vector<float>>* block) {
143 if (!render_blocker->IsBlockAvailable()) {
peahcf02cf12017-04-05 14:18:07 -0700144 return;
peahd0263542017-01-03 04:20:34 -0800145 }
146 render_blocker->ExtractBlock(block);
peahcf02cf12017-04-05 14:18:07 -0700147 block_processor->BufferRender(*block);
peahd0263542017-01-03 04:20:34 -0800148}
149
peahcf02cf12017-04-05 14:18:07 -0700150void CopyBufferIntoFrame(AudioBuffer* buffer,
151 size_t num_bands,
152 size_t frame_length,
153 std::vector<std::vector<float>>* frame) {
peahd0263542017-01-03 04:20:34 -0800154 RTC_DCHECK_EQ(num_bands, frame->size());
peah522d71b2017-02-23 05:16:26 -0800155 RTC_DCHECK_EQ(frame_length, (*frame)[0].size());
peahcf02cf12017-04-05 14:18:07 -0700156 for (size_t k = 0; k < num_bands; ++k) {
157 rtc::ArrayView<float> buffer_view(&buffer->split_bands_f(0)[k][0],
158 frame_length);
159 std::copy(buffer_view.begin(), buffer_view.end(), (*frame)[k].begin());
160 }
peahd0263542017-01-03 04:20:34 -0800161}
162
163// [B,A] = butter(2,100/4000,'high')
164const CascadedBiQuadFilter::BiQuadCoefficients
165 kHighPassFilterCoefficients_8kHz = {{0.94598f, -1.89195f, 0.94598f},
166 {-1.88903f, 0.89487f}};
167const int kNumberOfHighPassBiQuads_8kHz = 1;
168
169// [B,A] = butter(2,100/8000,'high')
170const CascadedBiQuadFilter::BiQuadCoefficients
171 kHighPassFilterCoefficients_16kHz = {{0.97261f, -1.94523f, 0.97261f},
172 {-1.94448f, 0.94598f}};
173const int kNumberOfHighPassBiQuads_16kHz = 1;
174
peahd0263542017-01-03 04:20:34 -0800175} // namespace
176
177class EchoCanceller3::RenderWriter {
178 public:
179 RenderWriter(ApmDataDumper* data_dumper,
180 SwapQueue<std::vector<std::vector<float>>,
181 Aec3RenderQueueItemVerifier>* render_transfer_queue,
182 std::unique_ptr<CascadedBiQuadFilter> render_highpass_filter,
183 int sample_rate_hz,
184 int frame_length,
185 int num_bands);
186 ~RenderWriter();
Alex Loiko890988c2017-08-31 10:25:48 +0200187 void Insert(AudioBuffer* input);
peahd0263542017-01-03 04:20:34 -0800188
189 private:
190 ApmDataDumper* data_dumper_;
191 const int sample_rate_hz_;
192 const size_t frame_length_;
193 const int num_bands_;
194 std::unique_ptr<CascadedBiQuadFilter> render_highpass_filter_;
195 std::vector<std::vector<float>> render_queue_input_frame_;
196 SwapQueue<std::vector<std::vector<float>>, Aec3RenderQueueItemVerifier>*
197 render_transfer_queue_;
198 RTC_DISALLOW_IMPLICIT_CONSTRUCTORS(RenderWriter);
199};
200
201EchoCanceller3::RenderWriter::RenderWriter(
202 ApmDataDumper* data_dumper,
203 SwapQueue<std::vector<std::vector<float>>, Aec3RenderQueueItemVerifier>*
204 render_transfer_queue,
205 std::unique_ptr<CascadedBiQuadFilter> render_highpass_filter,
206 int sample_rate_hz,
207 int frame_length,
208 int num_bands)
209 : data_dumper_(data_dumper),
210 sample_rate_hz_(sample_rate_hz),
211 frame_length_(frame_length),
212 num_bands_(num_bands),
213 render_highpass_filter_(std::move(render_highpass_filter)),
214 render_queue_input_frame_(num_bands_,
215 std::vector<float>(frame_length_, 0.f)),
216 render_transfer_queue_(render_transfer_queue) {
217 RTC_DCHECK(data_dumper);
218}
219
220EchoCanceller3::RenderWriter::~RenderWriter() = default;
221
peahcf02cf12017-04-05 14:18:07 -0700222void EchoCanceller3::RenderWriter::Insert(AudioBuffer* input) {
peahd0263542017-01-03 04:20:34 -0800223 RTC_DCHECK_EQ(1, input->num_channels());
peahd0263542017-01-03 04:20:34 -0800224 RTC_DCHECK_EQ(frame_length_, input->num_frames_per_band());
Gustaf Ullberg7d042782018-01-16 13:39:27 +0100225 RTC_DCHECK_EQ(num_bands_, input->num_bands());
226
227 // TODO(bugs.webrtc.org/8759) Temporary work-around.
228 if (num_bands_ != static_cast<int>(input->num_bands()))
229 return;
230
peahd0263542017-01-03 04:20:34 -0800231 data_dumper_->DumpWav("aec3_render_input", frame_length_,
peahcf02cf12017-04-05 14:18:07 -0700232 &input->split_bands_f(0)[0][0],
peahd0263542017-01-03 04:20:34 -0800233 LowestBandRate(sample_rate_hz_), 1);
234
peahcf02cf12017-04-05 14:18:07 -0700235 CopyBufferIntoFrame(input, num_bands_, frame_length_,
236 &render_queue_input_frame_);
peahd0263542017-01-03 04:20:34 -0800237
238 if (render_highpass_filter_) {
239 render_highpass_filter_->Process(render_queue_input_frame_[0]);
240 }
241
peah925e9d72017-04-10 04:18:38 -0700242 static_cast<void>(render_transfer_queue_->Insert(&render_queue_input_frame_));
peahd0263542017-01-03 04:20:34 -0800243}
244
peahe0eae3c2016-12-14 01:16:23 -0800245int EchoCanceller3::instance_count_ = 0;
246
Gustaf Ullbergbd83b912017-10-18 12:32:42 +0200247EchoCanceller3::EchoCanceller3(const EchoCanceller3Config& config,
248 int sample_rate_hz,
249 bool use_highpass_filter)
Per Åhgren251c7352018-03-28 16:31:57 +0200250 : EchoCanceller3(
251 AdjustConfig(config),
252 sample_rate_hz,
253 use_highpass_filter,
254 std::unique_ptr<BlockProcessor>(
255 BlockProcessor::Create(AdjustConfig(config), sample_rate_hz))) {}
Per Åhgren8ba58612017-12-01 23:01:44 +0100256EchoCanceller3::EchoCanceller3(const EchoCanceller3Config& config,
257 int sample_rate_hz,
peahd0263542017-01-03 04:20:34 -0800258 bool use_highpass_filter,
259 std::unique_ptr<BlockProcessor> block_processor)
260 : data_dumper_(
261 new ApmDataDumper(rtc::AtomicOps::Increment(&instance_count_))),
262 sample_rate_hz_(sample_rate_hz),
263 num_bands_(NumBandsForRate(sample_rate_hz_)),
264 frame_length_(rtc::CheckedDivExact(LowestBandRate(sample_rate_hz_), 100)),
265 output_framer_(num_bands_),
266 capture_blocker_(num_bands_),
267 render_blocker_(num_bands_),
268 render_transfer_queue_(
Per Åhgren8ba58612017-12-01 23:01:44 +0100269 kRenderTransferQueueSizeFrames,
peahd0263542017-01-03 04:20:34 -0800270 std::vector<std::vector<float>>(
271 num_bands_,
272 std::vector<float>(frame_length_, 0.f)),
273 Aec3RenderQueueItemVerifier(num_bands_, frame_length_)),
274 block_processor_(std::move(block_processor)),
275 render_queue_output_frame_(num_bands_,
276 std::vector<float>(frame_length_, 0.f)),
277 block_(num_bands_, std::vector<float>(kBlockSize, 0.f)),
278 sub_frame_view_(num_bands_) {
peah21920892017-02-08 05:08:56 -0800279 RTC_DCHECK(ValidFullBandRate(sample_rate_hz_));
280
peahd0263542017-01-03 04:20:34 -0800281 std::unique_ptr<CascadedBiQuadFilter> render_highpass_filter;
282 if (use_highpass_filter) {
283 render_highpass_filter.reset(new CascadedBiQuadFilter(
284 sample_rate_hz_ == 8000 ? kHighPassFilterCoefficients_8kHz
285 : kHighPassFilterCoefficients_16kHz,
286 sample_rate_hz_ == 8000 ? kNumberOfHighPassBiQuads_8kHz
287 : kNumberOfHighPassBiQuads_16kHz));
288 capture_highpass_filter_.reset(new CascadedBiQuadFilter(
289 sample_rate_hz_ == 8000 ? kHighPassFilterCoefficients_8kHz
290 : kHighPassFilterCoefficients_16kHz,
291 sample_rate_hz_ == 8000 ? kNumberOfHighPassBiQuads_8kHz
292 : kNumberOfHighPassBiQuads_16kHz));
293 }
peahe0eae3c2016-12-14 01:16:23 -0800294
peahd0263542017-01-03 04:20:34 -0800295 render_writer_.reset(
296 new RenderWriter(data_dumper_.get(), &render_transfer_queue_,
297 std::move(render_highpass_filter), sample_rate_hz_,
298 frame_length_, num_bands_));
299
300 RTC_DCHECK_EQ(num_bands_, std::max(sample_rate_hz_, 16000) / 16000);
301 RTC_DCHECK_GE(kMaxNumBands, num_bands_);
peahe0eae3c2016-12-14 01:16:23 -0800302}
303
304EchoCanceller3::~EchoCanceller3() = default;
305
peahcf02cf12017-04-05 14:18:07 -0700306void EchoCanceller3::AnalyzeRender(AudioBuffer* render) {
peahd0263542017-01-03 04:20:34 -0800307 RTC_DCHECK_RUNS_SERIALIZED(&render_race_checker_);
308 RTC_DCHECK(render);
peahcf02cf12017-04-05 14:18:07 -0700309 data_dumper_->DumpRaw("aec3_call_order",
310 static_cast<int>(EchoCanceller3ApiCall::kRender));
311
peahd0263542017-01-03 04:20:34 -0800312 return render_writer_->Insert(render);
peahe0eae3c2016-12-14 01:16:23 -0800313}
314
peahd0263542017-01-03 04:20:34 -0800315void EchoCanceller3::AnalyzeCapture(AudioBuffer* capture) {
316 RTC_DCHECK_RUNS_SERIALIZED(&capture_race_checker_);
317 RTC_DCHECK(capture);
peahebe77782017-02-27 07:29:21 -0800318 data_dumper_->DumpWav("aec3_capture_analyze_input", capture->num_frames(),
peahd0263542017-01-03 04:20:34 -0800319 capture->channels_f()[0], sample_rate_hz_, 1);
320
321 saturated_microphone_signal_ = false;
322 for (size_t k = 0; k < capture->num_channels(); ++k) {
323 saturated_microphone_signal_ |=
324 DetectSaturation(rtc::ArrayView<const float>(capture->channels_f()[k],
325 capture->num_frames()));
326 if (saturated_microphone_signal_) {
327 break;
328 }
329 }
330}
peahe0eae3c2016-12-14 01:16:23 -0800331
peah69221db2017-01-27 03:28:19 -0800332void EchoCanceller3::ProcessCapture(AudioBuffer* capture, bool level_change) {
peahd0263542017-01-03 04:20:34 -0800333 RTC_DCHECK_RUNS_SERIALIZED(&capture_race_checker_);
334 RTC_DCHECK(capture);
peahe0eae3c2016-12-14 01:16:23 -0800335 RTC_DCHECK_EQ(1u, capture->num_channels());
peahd0263542017-01-03 04:20:34 -0800336 RTC_DCHECK_EQ(num_bands_, capture->num_bands());
peahe0eae3c2016-12-14 01:16:23 -0800337 RTC_DCHECK_EQ(frame_length_, capture->num_frames_per_band());
peahcf02cf12017-04-05 14:18:07 -0700338 data_dumper_->DumpRaw("aec3_call_order",
339 static_cast<int>(EchoCanceller3ApiCall::kCapture));
peahd0263542017-01-03 04:20:34 -0800340
341 rtc::ArrayView<float> capture_lower_band =
342 rtc::ArrayView<float>(&capture->split_bands_f(0)[0][0], frame_length_);
343
344 data_dumper_->DumpWav("aec3_capture_input", capture_lower_band,
345 LowestBandRate(sample_rate_hz_), 1);
346
peahcf02cf12017-04-05 14:18:07 -0700347 EmptyRenderQueue();
peahd0263542017-01-03 04:20:34 -0800348
349 if (capture_highpass_filter_) {
350 capture_highpass_filter_->Process(capture_lower_band);
351 }
352
peah69221db2017-01-27 03:28:19 -0800353 ProcessCaptureFrameContent(
354 capture, level_change, saturated_microphone_signal_, 0, &capture_blocker_,
355 &output_framer_, block_processor_.get(), &block_, &sub_frame_view_);
peahd0263542017-01-03 04:20:34 -0800356
357 if (sample_rate_hz_ != 8000) {
358 ProcessCaptureFrameContent(
peah69221db2017-01-27 03:28:19 -0800359 capture, level_change, saturated_microphone_signal_, 1,
peahd0263542017-01-03 04:20:34 -0800360 &capture_blocker_, &output_framer_, block_processor_.get(), &block_,
361 &sub_frame_view_);
362 }
363
364 ProcessRemainingCaptureFrameContent(
peah69221db2017-01-27 03:28:19 -0800365 level_change, saturated_microphone_signal_, &capture_blocker_,
peahd0263542017-01-03 04:20:34 -0800366 &output_framer_, block_processor_.get(), &block_);
367
368 data_dumper_->DumpWav("aec3_capture_output", frame_length_,
369 &capture->split_bands_f(0)[0][0],
370 LowestBandRate(sample_rate_hz_), 1);
peahe0eae3c2016-12-14 01:16:23 -0800371}
372
Gustaf Ullberg332150d2017-11-22 14:17:39 +0100373EchoControl::Metrics EchoCanceller3::GetMetrics() const {
374 RTC_DCHECK_RUNS_SERIALIZED(&capture_race_checker_);
375 Metrics metrics;
376 block_processor_->GetMetrics(&metrics);
377 return metrics;
378}
379
peahcf02cf12017-04-05 14:18:07 -0700380void EchoCanceller3::EmptyRenderQueue() {
peahd0263542017-01-03 04:20:34 -0800381 RTC_DCHECK_RUNS_SERIALIZED(&capture_race_checker_);
peahd0263542017-01-03 04:20:34 -0800382 bool frame_to_buffer =
383 render_transfer_queue_.Remove(&render_queue_output_frame_);
384 while (frame_to_buffer) {
peahcf02cf12017-04-05 14:18:07 -0700385 BufferRenderFrameContent(&render_queue_output_frame_, 0, &render_blocker_,
386 block_processor_.get(), &block_, &sub_frame_view_);
peahd0263542017-01-03 04:20:34 -0800387
388 if (sample_rate_hz_ != 8000) {
peahcf02cf12017-04-05 14:18:07 -0700389 BufferRenderFrameContent(&render_queue_output_frame_, 1, &render_blocker_,
390 block_processor_.get(), &block_,
391 &sub_frame_view_);
peahd0263542017-01-03 04:20:34 -0800392 }
393
peahcf02cf12017-04-05 14:18:07 -0700394 BufferRemainingRenderFrameContent(&render_blocker_, block_processor_.get(),
395 &block_);
peahd0263542017-01-03 04:20:34 -0800396
397 frame_to_buffer =
398 render_transfer_queue_.Remove(&render_queue_output_frame_);
399 }
peahd0263542017-01-03 04:20:34 -0800400}
peahe0eae3c2016-12-14 01:16:23 -0800401} // namespace webrtc