peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 10 | #include "modules/audio_processing/aec3/echo_remover.h" |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 11 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 12 | #include <math.h> |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 13 | #include <stddef.h> |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 14 | #include <algorithm> |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 15 | #include <array> |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 16 | #include <memory> |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 17 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 18 | #include "api/array_view.h" |
| 19 | #include "modules/audio_processing/aec3/aec3_common.h" |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 20 | #include "modules/audio_processing/aec3/aec3_fft.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 21 | #include "modules/audio_processing/aec3/aec_state.h" |
| 22 | #include "modules/audio_processing/aec3/comfort_noise_generator.h" |
| 23 | #include "modules/audio_processing/aec3/echo_path_variability.h" |
| 24 | #include "modules/audio_processing/aec3/echo_remover_metrics.h" |
| 25 | #include "modules/audio_processing/aec3/fft_data.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 26 | #include "modules/audio_processing/aec3/render_buffer.h" |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 27 | #include "modules/audio_processing/aec3/render_signal_analyzer.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 28 | #include "modules/audio_processing/aec3/residual_echo_estimator.h" |
| 29 | #include "modules/audio_processing/aec3/subtractor.h" |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 30 | #include "modules/audio_processing/aec3/subtractor_output.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 31 | #include "modules/audio_processing/aec3/suppression_filter.h" |
| 32 | #include "modules/audio_processing/aec3/suppression_gain.h" |
| 33 | #include "modules/audio_processing/logging/apm_data_dumper.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 34 | #include "rtc_base/atomic_ops.h" |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 35 | #include "rtc_base/checks.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 36 | #include "rtc_base/constructor_magic.h" |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 37 | #include "rtc_base/logging.h" |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 38 | |
| 39 | namespace webrtc { |
| 40 | |
| 41 | namespace { |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 42 | |
| 43 | void LinearEchoPower(const FftData& E, |
| 44 | const FftData& Y, |
| 45 | std::array<float, kFftLengthBy2Plus1>* S2) { |
| 46 | for (size_t k = 0; k < E.re.size(); ++k) { |
| 47 | (*S2)[k] = (Y.re[k] - E.re[k]) * (Y.re[k] - E.re[k]) + |
| 48 | (Y.im[k] - E.im[k]) * (Y.im[k] - E.im[k]); |
| 49 | } |
| 50 | } |
| 51 | |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 52 | // Fades between two input signals using a fix-sized transition. |
| 53 | void SignalTransition(rtc::ArrayView<const float> from, |
| 54 | rtc::ArrayView<const float> to, |
| 55 | rtc::ArrayView<float> out) { |
| 56 | constexpr size_t kTransitionSize = 30; |
Gustaf Ullberg | ddb82a6 | 2018-09-11 12:55:23 +0200 | [diff] [blame] | 57 | constexpr float kOneByTransitionSizePlusOne = 1.f / (kTransitionSize + 1); |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 58 | |
| 59 | RTC_DCHECK_EQ(from.size(), to.size()); |
| 60 | RTC_DCHECK_EQ(from.size(), out.size()); |
| 61 | RTC_DCHECK_LE(kTransitionSize, out.size()); |
| 62 | |
| 63 | for (size_t k = 0; k < kTransitionSize; ++k) { |
Gustaf Ullberg | ddb82a6 | 2018-09-11 12:55:23 +0200 | [diff] [blame] | 64 | float a = (k + 1) * kOneByTransitionSizePlusOne; |
| 65 | out[k] = a * to[k] + (1.f - a) * from[k]; |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 66 | } |
| 67 | |
| 68 | std::copy(to.begin() + kTransitionSize, to.end(), |
| 69 | out.begin() + kTransitionSize); |
| 70 | } |
| 71 | |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 72 | // Computes a windowed (square root Hanning) padded FFT and updates the related |
| 73 | // memory. |
| 74 | void WindowedPaddedFft(const Aec3Fft& fft, |
| 75 | rtc::ArrayView<const float> v, |
| 76 | rtc::ArrayView<float> v_old, |
| 77 | FftData* V) { |
| 78 | fft.PaddedFft(v, v_old, Aec3Fft::Window::kSqrtHanning, V); |
| 79 | std::copy(v.begin(), v.end(), v_old.begin()); |
| 80 | } |
| 81 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 82 | // Class for removing the echo from the capture signal. |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 83 | class EchoRemoverImpl final : public EchoRemover { |
| 84 | public: |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 85 | EchoRemoverImpl(const EchoCanceller3Config& config, int sample_rate_hz); |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 86 | ~EchoRemoverImpl() override; |
| 87 | |
Gustaf Ullberg | 332150d | 2017-11-22 14:17:39 +0100 | [diff] [blame] | 88 | void GetMetrics(EchoControl::Metrics* metrics) const override; |
| 89 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 90 | // Removes the echo from a block of samples from the capture signal. The |
| 91 | // supplied render signal is assumed to be pre-aligned with the capture |
| 92 | // signal. |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 93 | void ProcessCapture(EchoPathVariability echo_path_variability, |
Alex Loiko | 890988c | 2017-08-31 10:25:48 +0200 | [diff] [blame] | 94 | bool capture_signal_saturation, |
Danil Chapovalov | db9f7ab | 2018-06-19 10:50:11 +0200 | [diff] [blame] | 95 | const absl::optional<DelayEstimate>& external_delay, |
Per Åhgren | c59a576 | 2017-12-11 21:34:19 +0100 | [diff] [blame] | 96 | RenderBuffer* render_buffer, |
Alex Loiko | 890988c | 2017-08-31 10:25:48 +0200 | [diff] [blame] | 97 | std::vector<std::vector<float>>* capture) override; |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 98 | |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 99 | // Returns the internal delay estimate in blocks. |
Danil Chapovalov | db9f7ab | 2018-06-19 10:50:11 +0200 | [diff] [blame] | 100 | absl::optional<int> Delay() const override { |
Per Åhgren | e05c43c | 2018-05-09 12:26:51 +0200 | [diff] [blame] | 101 | // TODO(peah): Remove or reactivate this functionality. |
Danil Chapovalov | db9f7ab | 2018-06-19 10:50:11 +0200 | [diff] [blame] | 102 | return absl::nullopt; |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 103 | } |
| 104 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 105 | // Updates the status on whether echo leakage is detected in the output of the |
| 106 | // echo remover. |
| 107 | void UpdateEchoLeakageStatus(bool leakage_detected) override { |
| 108 | echo_leakage_detected_ = leakage_detected; |
| 109 | } |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 110 | |
| 111 | private: |
Per Åhgren | 7802675 | 2018-08-01 16:24:08 +0200 | [diff] [blame] | 112 | // Selects which of the shadow and main linear filter outputs that is most |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 113 | // appropriate to pass to the suppressor and forms the linear filter output by |
| 114 | // smoothly transition between those. |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 115 | void FormLinearFilterOutput(const SubtractorOutput& subtractor_output, |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 116 | rtc::ArrayView<float> output); |
Per Åhgren | 7802675 | 2018-08-01 16:24:08 +0200 | [diff] [blame] | 117 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 118 | static int instance_count_; |
Gustaf Ullberg | bd83b91 | 2017-10-18 12:32:42 +0200 | [diff] [blame] | 119 | const EchoCanceller3Config config_; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 120 | const Aec3Fft fft_; |
| 121 | std::unique_ptr<ApmDataDumper> data_dumper_; |
| 122 | const Aec3Optimization optimization_; |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 123 | const int sample_rate_hz_; |
Per Åhgren | 7802675 | 2018-08-01 16:24:08 +0200 | [diff] [blame] | 124 | const bool use_shadow_filter_output_; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 125 | Subtractor subtractor_; |
| 126 | SuppressionGain suppression_gain_; |
| 127 | ComfortNoiseGenerator cng_; |
| 128 | SuppressionFilter suppression_filter_; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 129 | RenderSignalAnalyzer render_signal_analyzer_; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 130 | ResidualEchoEstimator residual_echo_estimator_; |
| 131 | bool echo_leakage_detected_ = false; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 132 | AecState aec_state_; |
peah | e985b3f | 2017-02-28 22:08:53 -0800 | [diff] [blame] | 133 | EchoRemoverMetrics metrics_; |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 134 | std::array<float, kFftLengthBy2> e_old_; |
| 135 | std::array<float, kFftLengthBy2> x_old_; |
| 136 | std::array<float, kFftLengthBy2> y_old_; |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 137 | size_t block_counter_ = 0; |
| 138 | int gain_change_hangover_ = 0; |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 139 | bool main_filter_output_last_selected_ = true; |
| 140 | bool linear_filter_output_last_selected_ = true; |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 141 | |
| 142 | RTC_DISALLOW_COPY_AND_ASSIGN(EchoRemoverImpl); |
| 143 | }; |
| 144 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 145 | int EchoRemoverImpl::instance_count_ = 0; |
| 146 | |
Gustaf Ullberg | bd83b91 | 2017-10-18 12:32:42 +0200 | [diff] [blame] | 147 | EchoRemoverImpl::EchoRemoverImpl(const EchoCanceller3Config& config, |
| 148 | int sample_rate_hz) |
peah | 8cee56f | 2017-08-24 22:36:53 -0700 | [diff] [blame] | 149 | : config_(config), |
| 150 | fft_(), |
aleloi | 88b82b5 | 2017-02-23 06:27:03 -0800 | [diff] [blame] | 151 | data_dumper_( |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 152 | new ApmDataDumper(rtc::AtomicOps::Increment(&instance_count_))), |
| 153 | optimization_(DetectOptimization()), |
| 154 | sample_rate_hz_(sample_rate_hz), |
Per Åhgren | 2402154 | 2018-08-31 07:34:29 +0200 | [diff] [blame] | 155 | use_shadow_filter_output_( |
Per Åhgren | 2402154 | 2018-08-31 07:34:29 +0200 | [diff] [blame] | 156 | config_.filter.enable_shadow_filter_output_usage), |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 157 | subtractor_(config, data_dumper_.get(), optimization_), |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 158 | suppression_gain_(config_, optimization_, sample_rate_hz), |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 159 | cng_(optimization_), |
Gustaf Ullberg | 83b00f0 | 2018-11-06 16:25:37 +0100 | [diff] [blame] | 160 | suppression_filter_(optimization_, sample_rate_hz_), |
Per Åhgren | 971de07 | 2018-03-14 23:23:47 +0100 | [diff] [blame] | 161 | render_signal_analyzer_(config_), |
peah | 8cee56f | 2017-08-24 22:36:53 -0700 | [diff] [blame] | 162 | residual_echo_estimator_(config_), |
| 163 | aec_state_(config_) { |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 164 | RTC_DCHECK(ValidFullBandRate(sample_rate_hz)); |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 165 | x_old_.fill(0.f); |
| 166 | y_old_.fill(0.f); |
| 167 | e_old_.fill(0.f); |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 168 | } |
| 169 | |
| 170 | EchoRemoverImpl::~EchoRemoverImpl() = default; |
| 171 | |
Gustaf Ullberg | 332150d | 2017-11-22 14:17:39 +0100 | [diff] [blame] | 172 | void EchoRemoverImpl::GetMetrics(EchoControl::Metrics* metrics) const { |
| 173 | // Echo return loss (ERL) is inverted to go from gain to attenuation. |
| 174 | metrics->echo_return_loss = -10.0 * log10(aec_state_.ErlTimeDomain()); |
| 175 | metrics->echo_return_loss_enhancement = |
Jesús de Vicente Peña | e9a7e90 | 2018-09-27 11:49:39 +0200 | [diff] [blame] | 176 | Log2TodB(aec_state_.FullBandErleLog2()); |
Gustaf Ullberg | 332150d | 2017-11-22 14:17:39 +0100 | [diff] [blame] | 177 | } |
| 178 | |
peah | cf02cf1 | 2017-04-05 14:18:07 -0700 | [diff] [blame] | 179 | void EchoRemoverImpl::ProcessCapture( |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 180 | EchoPathVariability echo_path_variability, |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 181 | bool capture_signal_saturation, |
Danil Chapovalov | db9f7ab | 2018-06-19 10:50:11 +0200 | [diff] [blame] | 182 | const absl::optional<DelayEstimate>& external_delay, |
Per Åhgren | c59a576 | 2017-12-11 21:34:19 +0100 | [diff] [blame] | 183 | RenderBuffer* render_buffer, |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 184 | std::vector<std::vector<float>>* capture) { |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 185 | ++block_counter_; |
Per Åhgren | ec22e3f | 2017-12-20 15:20:37 +0100 | [diff] [blame] | 186 | const std::vector<std::vector<float>>& x = render_buffer->Block(0); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 187 | std::vector<std::vector<float>>* y = capture; |
Per Åhgren | c59a576 | 2017-12-11 21:34:19 +0100 | [diff] [blame] | 188 | RTC_DCHECK(render_buffer); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 189 | RTC_DCHECK(y); |
| 190 | RTC_DCHECK_EQ(x.size(), NumBandsForRate(sample_rate_hz_)); |
| 191 | RTC_DCHECK_EQ(y->size(), NumBandsForRate(sample_rate_hz_)); |
| 192 | RTC_DCHECK_EQ(x[0].size(), kBlockSize); |
| 193 | RTC_DCHECK_EQ((*y)[0].size(), kBlockSize); |
| 194 | const std::vector<float>& x0 = x[0]; |
| 195 | std::vector<float>& y0 = (*y)[0]; |
| 196 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 197 | data_dumper_->DumpWav("aec3_echo_remover_capture_input", kBlockSize, &y0[0], |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 198 | LowestBandRate(sample_rate_hz_), 1); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 199 | data_dumper_->DumpWav("aec3_echo_remover_render_input", kBlockSize, &x0[0], |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 200 | LowestBandRate(sample_rate_hz_), 1); |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 201 | data_dumper_->DumpRaw("aec3_echo_remover_capture_input", y0); |
| 202 | data_dumper_->DumpRaw("aec3_echo_remover_render_input", x0); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 203 | |
| 204 | aec_state_.UpdateCaptureSaturation(capture_signal_saturation); |
| 205 | |
| 206 | if (echo_path_variability.AudioPathChanged()) { |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 207 | // Ensure that the gain change is only acted on once per frame. |
| 208 | if (echo_path_variability.gain_change) { |
| 209 | if (gain_change_hangover_ == 0) { |
| 210 | constexpr int kMaxBlocksPerFrame = 3; |
| 211 | gain_change_hangover_ = kMaxBlocksPerFrame; |
| 212 | RTC_LOG(LS_WARNING) |
| 213 | << "Gain change detected at block " << block_counter_; |
| 214 | } else { |
| 215 | echo_path_variability.gain_change = false; |
| 216 | } |
| 217 | } |
| 218 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 219 | subtractor_.HandleEchoPathChange(echo_path_variability); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 220 | aec_state_.HandleEchoPathChange(echo_path_variability); |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 221 | |
| 222 | if (echo_path_variability.delay_change != |
| 223 | EchoPathVariability::DelayAdjustment::kNone) { |
| 224 | suppression_gain_.SetInitialState(true); |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 225 | } |
| 226 | } |
| 227 | if (gain_change_hangover_ > 0) { |
| 228 | --gain_change_hangover_; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 229 | } |
| 230 | |
| 231 | std::array<float, kFftLengthBy2Plus1> Y2; |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 232 | std::array<float, kFftLengthBy2Plus1> E2; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 233 | std::array<float, kFftLengthBy2Plus1> R2; |
| 234 | std::array<float, kFftLengthBy2Plus1> S2_linear; |
| 235 | std::array<float, kFftLengthBy2Plus1> G; |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 236 | float high_bands_gain; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 237 | FftData Y; |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 238 | FftData E; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 239 | FftData comfort_noise; |
| 240 | FftData high_band_comfort_noise; |
| 241 | SubtractorOutput subtractor_output; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 242 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 243 | // Analyze the render signal. |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 244 | render_signal_analyzer_.Update(*render_buffer, |
| 245 | aec_state_.FilterDelayBlocks()); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 246 | |
| 247 | // Perform linear echo cancellation. |
Jesús de Vicente Peña | 02e9e44 | 2018-08-29 13:34:07 +0200 | [diff] [blame] | 248 | if (aec_state_.TransitionTriggered()) { |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 249 | subtractor_.ExitInitialState(); |
Per Åhgren | 5f1a31c | 2018-03-08 15:54:41 +0100 | [diff] [blame] | 250 | suppression_gain_.SetInitialState(false); |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 251 | } |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 252 | |
| 253 | // If the delay is known, use the echo subtractor. |
Per Åhgren | c59a576 | 2017-12-11 21:34:19 +0100 | [diff] [blame] | 254 | subtractor_.Process(*render_buffer, y0, render_signal_analyzer_, aec_state_, |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 255 | &subtractor_output); |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 256 | std::array<float, kBlockSize> e; |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 257 | FormLinearFilterOutput(subtractor_output, e); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 258 | |
| 259 | // Compute spectra. |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 260 | WindowedPaddedFft(fft_, y0, y_old_, &Y); |
| 261 | WindowedPaddedFft(fft_, e, e_old_, &E); |
| 262 | LinearEchoPower(E, Y, &S2_linear); |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 263 | Y.Spectrum(optimization_, Y2); |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 264 | E.Spectrum(optimization_, E2); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 265 | |
| 266 | // Update the AEC state information. |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 267 | aec_state_.Update(external_delay, subtractor_.FilterFrequencyResponse(), |
Per Åhgren | b20b937 | 2018-07-13 00:22:54 +0200 | [diff] [blame] | 268 | subtractor_.FilterImpulseResponse(), *render_buffer, E2, Y2, |
| 269 | subtractor_output, y0); |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 270 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 271 | // Choose the linear output. |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 272 | data_dumper_->DumpWav("aec3_output_linear2", kBlockSize, &e[0], |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 273 | LowestBandRate(sample_rate_hz_), 1); |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 274 | if (aec_state_.UseLinearFilterOutput()) { |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 275 | if (!linear_filter_output_last_selected_) { |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 276 | SignalTransition(y0, e, y0); |
| 277 | } else { |
| 278 | std::copy(e.begin(), e.end(), y0.begin()); |
| 279 | } |
| 280 | } else { |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 281 | if (linear_filter_output_last_selected_) { |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 282 | SignalTransition(e, y0, y0); |
| 283 | } |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 284 | } |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 285 | linear_filter_output_last_selected_ = aec_state_.UseLinearFilterOutput(); |
Per Åhgren | 169c7fd | 2018-04-27 12:04:03 +0200 | [diff] [blame] | 286 | const auto& Y_fft = aec_state_.UseLinearFilterOutput() ? E : Y; |
| 287 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 288 | data_dumper_->DumpWav("aec3_output_linear", kBlockSize, &y0[0], |
| 289 | LowestBandRate(sample_rate_hz_), 1); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 290 | |
| 291 | // Estimate the residual echo power. |
Per Åhgren | c59a576 | 2017-12-11 21:34:19 +0100 | [diff] [blame] | 292 | residual_echo_estimator_.Estimate(aec_state_, *render_buffer, S2_linear, Y2, |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 293 | &R2); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 294 | |
| 295 | // Estimate the comfort noise. |
| 296 | cng_.Compute(aec_state_, Y2, &comfort_noise, &high_band_comfort_noise); |
| 297 | |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 298 | // Compute and apply the suppression gain. |
Per Åhgren | fde4aa9 | 2018-08-27 14:19:35 +0200 | [diff] [blame] | 299 | const auto& echo_spectrum = |
| 300 | aec_state_.UsableLinearEstimate() ? S2_linear : R2; |
Jesús de Vicente Peña | 0faf082 | 2018-09-24 12:48:28 +0200 | [diff] [blame] | 301 | |
| 302 | std::array<float, kFftLengthBy2Plus1> E2_bounded; |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 303 | std::transform(E2.begin(), E2.end(), Y2.begin(), E2_bounded.begin(), |
| 304 | [](float a, float b) { return std::min(a, b); }); |
Jesús de Vicente Peña | 0faf082 | 2018-09-24 12:48:28 +0200 | [diff] [blame] | 305 | |
| 306 | suppression_gain_.GetGain(E2, E2_bounded, echo_spectrum, R2, |
| 307 | cng_.NoiseSpectrum(), E, Y, render_signal_analyzer_, |
| 308 | aec_state_, x, &high_bands_gain, &G); |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 309 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 310 | suppression_filter_.ApplyGain(comfort_noise, high_band_comfort_noise, G, |
Per Åhgren | 47d7fbd | 2018-04-24 12:44:29 +0200 | [diff] [blame] | 311 | high_bands_gain, Y_fft, y); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 312 | |
peah | e985b3f | 2017-02-28 22:08:53 -0800 | [diff] [blame] | 313 | // Update the metrics. |
| 314 | metrics_.Update(aec_state_, cng_.NoiseSpectrum(), G); |
| 315 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 316 | // Debug outputs for the purpose of development and analysis. |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 317 | data_dumper_->DumpWav("aec3_echo_estimate", kBlockSize, |
| 318 | &subtractor_output.s_main[0], |
| 319 | LowestBandRate(sample_rate_hz_), 1); |
| 320 | data_dumper_->DumpRaw("aec3_output", y0); |
peah | 14c11a4 | 2017-07-11 06:13:43 -0700 | [diff] [blame] | 321 | data_dumper_->DumpRaw("aec3_narrow_render", |
| 322 | render_signal_analyzer_.NarrowPeakBand() ? 1 : 0); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 323 | data_dumper_->DumpRaw("aec3_N2", cng_.NoiseSpectrum()); |
| 324 | data_dumper_->DumpRaw("aec3_suppressor_gain", G); |
| 325 | data_dumper_->DumpWav("aec3_output", |
| 326 | rtc::ArrayView<const float>(&y0[0], kBlockSize), |
| 327 | LowestBandRate(sample_rate_hz_), 1); |
| 328 | data_dumper_->DumpRaw("aec3_using_subtractor_output", |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 329 | aec_state_.UseLinearFilterOutput() ? 1 : 0); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 330 | data_dumper_->DumpRaw("aec3_E2", E2); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 331 | data_dumper_->DumpRaw("aec3_S2_linear", S2_linear); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 332 | data_dumper_->DumpRaw("aec3_Y2", Y2); |
Jesús de Vicente Peña | 7682c6e | 2018-03-22 14:53:23 +0100 | [diff] [blame] | 333 | data_dumper_->DumpRaw( |
| 334 | "aec3_X2", render_buffer->Spectrum(aec_state_.FilterDelayBlocks())); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 335 | data_dumper_->DumpRaw("aec3_R2", R2); |
Jesús de Vicente Peña | 075cb2b | 2018-06-13 15:13:55 +0200 | [diff] [blame] | 336 | data_dumper_->DumpRaw("aec3_R2_reverb", |
| 337 | residual_echo_estimator_.GetReverbPowerSpectrum()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 338 | data_dumper_->DumpRaw("aec3_filter_delay", aec_state_.FilterDelayBlocks()); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 339 | data_dumper_->DumpRaw("aec3_capture_saturation", |
| 340 | aec_state_.SaturatedCapture() ? 1 : 0); |
| 341 | } |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 342 | |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 343 | void EchoRemoverImpl::FormLinearFilterOutput( |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 344 | const SubtractorOutput& subtractor_output, |
| 345 | rtc::ArrayView<float> output) { |
| 346 | RTC_DCHECK_EQ(subtractor_output.e_main.size(), output.size()); |
| 347 | RTC_DCHECK_EQ(subtractor_output.e_shadow.size(), output.size()); |
| 348 | bool use_main_output = true; |
| 349 | if (use_shadow_filter_output_) { |
Jesús de Vicente Peña | 02e9e44 | 2018-08-29 13:34:07 +0200 | [diff] [blame] | 350 | // As the output of the main adaptive filter generally should be better |
| 351 | // than the shadow filter output, add a margin and threshold for when |
| 352 | // choosing the shadow filter output. |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 353 | if (subtractor_output.e2_shadow < 0.9f * subtractor_output.e2_main && |
| 354 | subtractor_output.y2 > 30.f * 30.f * kBlockSize && |
| 355 | (subtractor_output.s2_main > 60.f * 60.f * kBlockSize || |
| 356 | subtractor_output.s2_shadow > 60.f * 60.f * kBlockSize)) { |
| 357 | use_main_output = false; |
| 358 | } else { |
| 359 | // If the main filter is diverged, choose the filter output that has the |
| 360 | // lowest power. |
| 361 | if (subtractor_output.e2_shadow < subtractor_output.e2_main && |
| 362 | subtractor_output.y2 < subtractor_output.e2_main) { |
| 363 | use_main_output = false; |
| 364 | } |
| 365 | } |
| 366 | } |
| 367 | |
| 368 | if (use_main_output) { |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 369 | if (!main_filter_output_last_selected_) { |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 370 | SignalTransition(subtractor_output.e_shadow, subtractor_output.e_main, |
| 371 | output); |
| 372 | } else { |
| 373 | std::copy(subtractor_output.e_main.begin(), |
| 374 | subtractor_output.e_main.end(), output.begin()); |
| 375 | } |
| 376 | } else { |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 377 | if (main_filter_output_last_selected_) { |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 378 | SignalTransition(subtractor_output.e_main, subtractor_output.e_shadow, |
| 379 | output); |
| 380 | } else { |
| 381 | std::copy(subtractor_output.e_shadow.begin(), |
| 382 | subtractor_output.e_shadow.end(), output.begin()); |
| 383 | } |
| 384 | } |
| 385 | main_filter_output_last_selected_ = use_main_output; |
| 386 | } |
| 387 | |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 388 | } // namespace |
| 389 | |
Gustaf Ullberg | bd83b91 | 2017-10-18 12:32:42 +0200 | [diff] [blame] | 390 | EchoRemover* EchoRemover::Create(const EchoCanceller3Config& config, |
| 391 | int sample_rate_hz) { |
peah | 697a590 | 2017-06-30 07:06:10 -0700 | [diff] [blame] | 392 | return new EchoRemoverImpl(config, sample_rate_hz); |
peah | 69221db | 2017-01-27 03:28:19 -0800 | [diff] [blame] | 393 | } |
| 394 | |
| 395 | } // namespace webrtc |