peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #include "modules/audio_processing/aec3/aec_state.h" |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 12 | |
| 13 | #include <math.h> |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 14 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 15 | #include <algorithm> |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 16 | #include <numeric> |
| 17 | #include <vector> |
| 18 | |
Jesús de Vicente Peña | 496cedf | 2018-07-04 11:02:09 +0200 | [diff] [blame] | 19 | #include "absl/types/optional.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 20 | #include "api/array_view.h" |
Jesús de Vicente Peña | 496cedf | 2018-07-04 11:02:09 +0200 | [diff] [blame] | 21 | #include "modules/audio_processing/aec3/aec3_common.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 22 | #include "modules/audio_processing/logging/apm_data_dumper.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 23 | #include "rtc_base/atomic_ops.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 24 | #include "rtc_base/checks.h" |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 25 | |
| 26 | namespace webrtc { |
| 27 | namespace { |
| 28 | |
// Start/reset value for TransparentMode::non_converged_sequence_size_.
constexpr size_t kBlocksSinceConvergencedFilterInit = 10000;
// Start value for TransparentMode::active_blocks_since_sane_filter_.
constexpr size_t kBlocksSinceConsistentEstimateInit = 10000;
| 31 | |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 32 | void UpdateAndComputeReverb( |
| 33 | const SpectrumBuffer& spectrum_buffer, |
| 34 | int delay_blocks, |
| 35 | float reverb_decay, |
| 36 | ReverbModel* reverb_model, |
| 37 | rtc::ArrayView<float, kFftLengthBy2Plus1> reverb_power_spectrum) { |
| 38 | RTC_DCHECK(reverb_model); |
| 39 | const size_t num_render_channels = spectrum_buffer.buffer[0].size(); |
| 40 | int idx_at_delay = |
| 41 | spectrum_buffer.OffsetIndex(spectrum_buffer.read, delay_blocks); |
| 42 | int idx_past = spectrum_buffer.IncIndex(idx_at_delay); |
| 43 | |
| 44 | std::array<float, kFftLengthBy2Plus1> X2_data; |
| 45 | rtc::ArrayView<const float> X2; |
| 46 | if (num_render_channels > 1) { |
| 47 | auto sum_channels = |
| 48 | [](size_t num_render_channels, |
| 49 | const std::vector<std::vector<float>>& spectrum_band_0, |
| 50 | rtc::ArrayView<float, kFftLengthBy2Plus1> render_power) { |
| 51 | std::fill(render_power.begin(), render_power.end(), 0.f); |
| 52 | for (size_t ch = 0; ch < num_render_channels; ++ch) { |
| 53 | RTC_DCHECK_EQ(spectrum_band_0[ch].size(), kFftLengthBy2Plus1); |
| 54 | for (size_t k = 0; k < kFftLengthBy2Plus1; ++k) { |
| 55 | render_power[k] += spectrum_band_0[ch][k]; |
| 56 | } |
| 57 | } |
| 58 | }; |
| 59 | sum_channels(num_render_channels, spectrum_buffer.buffer[idx_past], |
| 60 | X2_data); |
| 61 | reverb_model->UpdateReverbNoFreqShaping( |
| 62 | X2_data, /*power_spectrum_scaling=*/1.0f, reverb_decay); |
| 63 | |
| 64 | sum_channels(num_render_channels, spectrum_buffer.buffer[idx_at_delay], |
| 65 | X2_data); |
| 66 | X2 = X2_data; |
| 67 | } else { |
| 68 | reverb_model->UpdateReverbNoFreqShaping( |
| 69 | spectrum_buffer.buffer[idx_past][/*channel=*/0], |
| 70 | /*power_spectrum_scaling=*/1.0f, reverb_decay); |
| 71 | |
| 72 | X2 = spectrum_buffer.buffer[idx_at_delay][/*channel=*/0]; |
| 73 | } |
| 74 | |
| 75 | rtc::ArrayView<const float, kFftLengthBy2Plus1> reverb_power = |
| 76 | reverb_model->reverb(); |
| 77 | for (size_t k = 0; k < X2.size(); ++k) { |
| 78 | reverb_power_spectrum[k] = X2[k] + reverb_power[k]; |
| 79 | } |
| 80 | } |
| 81 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 82 | } // namespace |
| 83 | |
| 84 | int AecState::instance_count_ = 0; |
| 85 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 86 | void AecState::GetResidualEchoScaling( |
| 87 | rtc::ArrayView<float> residual_scaling) const { |
| 88 | bool filter_has_had_time_to_converge; |
| 89 | if (config_.filter.conservative_initial_phase) { |
| 90 | filter_has_had_time_to_converge = |
| 91 | strong_not_saturated_render_blocks_ >= 1.5f * kNumBlocksPerSecond; |
| 92 | } else { |
| 93 | filter_has_had_time_to_converge = |
| 94 | strong_not_saturated_render_blocks_ >= 0.8f * kNumBlocksPerSecond; |
| 95 | } |
| 96 | echo_audibility_.GetResidualEchoScaling(filter_has_had_time_to_converge, |
| 97 | residual_scaling); |
| 98 | } |
| 99 | |
| 100 | absl::optional<float> AecState::ErleUncertainty() const { |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 101 | if (SaturatedEcho()) { |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 102 | return 1.f; |
| 103 | } |
| 104 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 105 | return absl::nullopt; |
| 106 | } |
| 107 | |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 108 | AecState::AecState(const EchoCanceller3Config& config, |
| 109 | size_t num_capture_channels) |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 110 | : data_dumper_( |
| 111 | new ApmDataDumper(rtc::AtomicOps::Increment(&instance_count_))), |
peah | 8cee56f | 2017-08-24 22:36:53 -0700 | [diff] [blame] | 112 | config_(config), |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 113 | initial_state_(config_), |
| 114 | delay_state_(config_), |
| 115 | transparent_state_(config_), |
| 116 | filter_quality_state_(config_), |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 117 | erl_estimator_(2 * kNumBlocksPerSecond), |
Per Åhgren | b4161d3 | 2019-10-08 12:35:47 +0200 | [diff] [blame] | 118 | erle_estimator_(2 * kNumBlocksPerSecond, config_, num_capture_channels), |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 119 | filter_analyzers_(num_capture_channels), |
Jesús de Vicente Peña | 836a7a2 | 2018-08-31 15:03:04 +0200 | [diff] [blame] | 120 | echo_audibility_( |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 121 | config_.echo_audibility.use_stationarity_properties_at_init), |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 122 | reverb_model_estimator_(config_), |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 123 | subtractor_output_analyzers_(num_capture_channels) { |
| 124 | for (size_t ch = 0; ch < num_capture_channels; ++ch) { |
| 125 | filter_analyzers_[ch] = std::make_unique<FilterAnalyzer>(config_); |
| 126 | } |
| 127 | } |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 128 | |
| 129 | AecState::~AecState() = default; |
| 130 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 131 | void AecState::HandleEchoPathChange( |
| 132 | const EchoPathVariability& echo_path_variability) { |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 133 | const auto full_reset = [&]() { |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 134 | for (auto& filter_analyzer : filter_analyzers_) { |
| 135 | filter_analyzer->Reset(); |
| 136 | } |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 137 | capture_signal_saturation_ = false; |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 138 | strong_not_saturated_render_blocks_ = 0; |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 139 | blocks_with_active_render_ = 0; |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 140 | initial_state_.Reset(); |
| 141 | transparent_state_.Reset(); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 142 | erle_estimator_.Reset(true); |
| 143 | erl_estimator_.Reset(); |
Jesús de Vicente Peña | 70a5963 | 2019-04-16 12:32:15 +0200 | [diff] [blame] | 144 | filter_quality_state_.Reset(); |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 145 | }; |
peah | 6d822ad | 2017-04-10 13:52:14 -0700 | [diff] [blame] | 146 | |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 147 | // TODO(peah): Refine the reset scheme according to the type of gain and |
| 148 | // delay adjustment. |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 149 | |
| 150 | if (echo_path_variability.delay_change != |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 151 | EchoPathVariability::DelayAdjustment::kNone) { |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 152 | full_reset(); |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 153 | } else if (echo_path_variability.gain_change) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 154 | erle_estimator_.Reset(false); |
Per Åhgren | d2650d1 | 2018-10-02 17:00:59 +0200 | [diff] [blame] | 155 | } |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 156 | for (auto& analyzer : subtractor_output_analyzers_) { |
| 157 | analyzer.HandleEchoPathChange(); |
| 158 | } |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 159 | } |
| 160 | |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 161 | void AecState::Update( |
Danil Chapovalov | db9f7ab | 2018-06-19 10:50:11 +0200 | [diff] [blame] | 162 | const absl::optional<DelayEstimate>& external_delay, |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 163 | rtc::ArrayView<const std::vector<std::array<float, kFftLengthBy2Plus1>>> |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 164 | adaptive_filter_frequency_response, |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 165 | rtc::ArrayView<const std::vector<float>> adaptive_filter_impulse_response, |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 166 | const RenderBuffer& render_buffer, |
Per Åhgren | f980725 | 2019-10-09 13:57:07 +0200 | [diff] [blame^] | 167 | rtc::ArrayView<const std::array<float, kFftLengthBy2Plus1>> E2_main, |
| 168 | rtc::ArrayView<const std::array<float, kFftLengthBy2Plus1>> Y2, |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 169 | rtc::ArrayView<const SubtractorOutput> subtractor_output) { |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 170 | const size_t num_capture_channels = filter_analyzers_.size(); |
Per Åhgren | f980725 | 2019-10-09 13:57:07 +0200 | [diff] [blame^] | 171 | RTC_DCHECK_EQ(num_capture_channels, E2_main.size()); |
| 172 | RTC_DCHECK_EQ(num_capture_channels, Y2.size()); |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 173 | RTC_DCHECK_EQ(num_capture_channels, subtractor_output.size()); |
| 174 | RTC_DCHECK_EQ(num_capture_channels, subtractor_output_analyzers_.size()); |
| 175 | RTC_DCHECK_EQ(num_capture_channels, |
| 176 | adaptive_filter_frequency_response.size()); |
| 177 | RTC_DCHECK_EQ(num_capture_channels, adaptive_filter_impulse_response.size()); |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 178 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 179 | // Analyze the filter outputs and filters. |
| 180 | bool any_filter_converged = false; |
| 181 | bool all_filters_diverged = true; |
| 182 | bool any_filter_consistent = false; |
Sam Zackrisson | 0169a3e | 2019-10-09 08:00:29 +0200 | [diff] [blame] | 183 | float max_echo_path_gain = 0.f; |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 184 | for (size_t ch = 0; ch < subtractor_output.size(); ++ch) { |
| 185 | subtractor_output_analyzers_[ch].Update(subtractor_output[ch]); |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 186 | any_filter_converged = any_filter_converged || |
| 187 | subtractor_output_analyzers_[ch].ConvergedFilter(); |
| 188 | all_filters_diverged = all_filters_diverged && |
| 189 | subtractor_output_analyzers_[ch].DivergedFilter(); |
Per Åhgren | b20b937 | 2018-07-13 00:22:54 +0200 | [diff] [blame] | 190 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 191 | filter_analyzers_[ch]->Update(adaptive_filter_impulse_response[ch], |
| 192 | render_buffer); |
| 193 | any_filter_consistent = |
| 194 | any_filter_consistent || filter_analyzers_[ch]->Consistent(); |
Sam Zackrisson | 0169a3e | 2019-10-09 08:00:29 +0200 | [diff] [blame] | 195 | max_echo_path_gain = |
| 196 | std::max(max_echo_path_gain, filter_analyzers_[ch]->Gain()); |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 197 | } |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 198 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 199 | // Estimate the direct path delay of the filter. |
Gustaf Ullberg | 9466b66 | 2019-04-15 09:53:03 +0200 | [diff] [blame] | 200 | if (config_.filter.use_linear_filter) { |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 201 | delay_state_.Update(filter_analyzers_, external_delay, |
Gustaf Ullberg | 9466b66 | 2019-04-15 09:53:03 +0200 | [diff] [blame] | 202 | strong_not_saturated_render_blocks_); |
| 203 | } |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 204 | |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 205 | const std::vector<std::vector<float>>& aligned_render_block = |
| 206 | render_buffer.Block(-delay_state_.DirectPathFilterDelay())[0]; |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 207 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 208 | // Update render counters. |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 209 | bool active_render = false; |
| 210 | for (size_t ch = 0; ch < aligned_render_block.size(); ++ch) { |
| 211 | const float render_energy = std::inner_product( |
| 212 | aligned_render_block[ch].begin(), aligned_render_block[ch].end(), |
| 213 | aligned_render_block[ch].begin(), 0.f); |
| 214 | if (render_energy > (config_.render_levels.active_render_limit * |
| 215 | config_.render_levels.active_render_limit) * |
| 216 | kFftLengthBy2) { |
| 217 | active_render = true; |
| 218 | break; |
| 219 | } |
| 220 | } |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 221 | blocks_with_active_render_ += active_render ? 1 : 0; |
| 222 | strong_not_saturated_render_blocks_ += |
| 223 | active_render && !SaturatedCapture() ? 1 : 0; |
Per Åhgren | 0e6d2f5 | 2017-12-20 22:19:56 +0100 | [diff] [blame] | 224 | |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 225 | std::array<float, kFftLengthBy2Plus1> X2_reverb; |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 226 | |
| 227 | UpdateAndComputeReverb(render_buffer.GetSpectrumBuffer(), |
| 228 | delay_state_.DirectPathFilterDelay(), ReverbDecay(), |
| 229 | &reverb_model_, X2_reverb); |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 230 | |
Jesús de Vicente Peña | 70a5963 | 2019-04-16 12:32:15 +0200 | [diff] [blame] | 231 | if (config_.echo_audibility.use_stationarity_properties) { |
Jesús de Vicente Peña | d5cb477 | 2018-04-25 13:58:45 +0200 | [diff] [blame] | 232 | // Update the echo audibility evaluator. |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 233 | echo_audibility_.Update(render_buffer, reverb_model_.reverb(), |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 234 | delay_state_.DirectPathFilterDelay(), |
| 235 | delay_state_.ExternalDelayReported()); |
Jesús de Vicente Peña | d5cb477 | 2018-04-25 13:58:45 +0200 | [diff] [blame] | 236 | } |
| 237 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 238 | // Update the ERL and ERLE measures. |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 239 | if (initial_state_.TransitionTriggered()) { |
| 240 | erle_estimator_.Reset(false); |
Jesús de Vicente Peña | 02e9e44 | 2018-08-29 13:34:07 +0200 | [diff] [blame] | 241 | } |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 242 | |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 243 | // TODO(bugs.webrtc.org/10913): Take all channels into account. |
Sam Zackrisson | a81c09d | 2019-09-05 09:35:10 +0200 | [diff] [blame] | 244 | const auto& X2 = render_buffer.Spectrum(delay_state_.DirectPathFilterDelay(), |
| 245 | /*channel=*/0); |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 246 | const auto& X2_input_erle = X2_reverb; |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 247 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 248 | erle_estimator_.Update(render_buffer, adaptive_filter_frequency_response[0], |
Per Åhgren | f980725 | 2019-10-09 13:57:07 +0200 | [diff] [blame^] | 249 | X2_input_erle, Y2[0], E2_main[0], |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 250 | subtractor_output_analyzers_[0].ConvergedFilter(), |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 251 | config_.erle.onset_detection); |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 252 | |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 253 | erl_estimator_.Update(subtractor_output_analyzers_[0].ConvergedFilter(), X2, |
Per Åhgren | f980725 | 2019-10-09 13:57:07 +0200 | [diff] [blame^] | 254 | Y2[0]); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 255 | |
Per Åhgren | 63b494d | 2017-12-06 11:32:38 +0100 | [diff] [blame] | 256 | // Detect and flag echo saturation. |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 257 | saturation_detector_.Update(aligned_render_block, SaturatedCapture(), |
| 258 | UsableLinearEstimate(), subtractor_output, |
Sam Zackrisson | 0169a3e | 2019-10-09 08:00:29 +0200 | [diff] [blame] | 259 | max_echo_path_gain); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 260 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 261 | // Update the decision on whether to use the initial state parameter set. |
| 262 | initial_state_.Update(active_render, SaturatedCapture()); |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 263 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 264 | // Detect whether the transparent mode should be activated. |
| 265 | transparent_state_.Update(delay_state_.DirectPathFilterDelay(), |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 266 | any_filter_consistent, any_filter_converged, |
| 267 | all_filters_diverged, active_render, |
| 268 | SaturatedCapture()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 269 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 270 | // Analyze the quality of the filter. |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 271 | filter_quality_state_.Update(active_render, TransparentMode(), |
| 272 | SaturatedCapture(), external_delay, |
| 273 | any_filter_converged); |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 274 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 275 | // Update the reverb estimate. |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 276 | const bool stationary_block = |
Jesús de Vicente Peña | 70a5963 | 2019-04-16 12:32:15 +0200 | [diff] [blame] | 277 | config_.echo_audibility.use_stationarity_properties && |
Per Åhgren | f4801a1 | 2018-09-27 13:14:02 +0200 | [diff] [blame] | 278 | echo_audibility_.IsBlockStationary(); |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 279 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 280 | reverb_model_estimator_.Update(filter_analyzers_[0]->GetAdjustedFilter(), |
| 281 | adaptive_filter_frequency_response[0], |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 282 | erle_estimator_.GetInstLinearQualityEstimate(), |
| 283 | delay_state_.DirectPathFilterDelay(), |
| 284 | UsableLinearEstimate(), stationary_block); |
Jesús de Vicente Peña | 075cb2b | 2018-06-13 15:13:55 +0200 | [diff] [blame] | 285 | |
Jesús de Vicente Peña | 496cedf | 2018-07-04 11:02:09 +0200 | [diff] [blame] | 286 | erle_estimator_.Dump(data_dumper_); |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 287 | reverb_model_estimator_.Dump(data_dumper_.get()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 288 | data_dumper_->DumpRaw("aec3_erl", Erl()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 289 | data_dumper_->DumpRaw("aec3_erl_time_domain", ErlTimeDomain()); |
Per Åhgren | b4161d3 | 2019-10-08 12:35:47 +0200 | [diff] [blame] | 290 | data_dumper_->DumpRaw("aec3_erle", Erle()[0]); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 291 | data_dumper_->DumpRaw("aec3_usable_linear_estimate", UsableLinearEstimate()); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 292 | data_dumper_->DumpRaw("aec3_transparent_mode", TransparentMode()); |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 293 | data_dumper_->DumpRaw("aec3_filter_delay", |
| 294 | filter_analyzers_[0]->DelayBlocks()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 295 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 296 | data_dumper_->DumpRaw("aec3_any_filter_consistent", any_filter_consistent); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 297 | data_dumper_->DumpRaw("aec3_initial_state", |
| 298 | initial_state_.InitialStateActive()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 299 | data_dumper_->DumpRaw("aec3_capture_saturation", SaturatedCapture()); |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 300 | data_dumper_->DumpRaw("aec3_echo_saturation", SaturatedEcho()); |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 301 | data_dumper_->DumpRaw("aec3_any_filter_converged", any_filter_converged); |
| 302 | data_dumper_->DumpRaw("aec3_all_filters_diverged", all_filters_diverged); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 303 | |
| 304 | data_dumper_->DumpRaw("aec3_external_delay_avaliable", |
| 305 | external_delay ? 1 : 0); |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 306 | data_dumper_->DumpRaw("aec3_filter_tail_freq_resp_est", |
| 307 | GetReverbFrequencyResponse()); |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 308 | } |
| 309 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 310 | AecState::InitialState::InitialState(const EchoCanceller3Config& config) |
| 311 | : conservative_initial_phase_(config.filter.conservative_initial_phase), |
| 312 | initial_state_seconds_(config.filter.initial_state_seconds) { |
| 313 | Reset(); |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 314 | } |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 315 | void AecState::InitialState::InitialState::Reset() { |
| 316 | initial_state_ = true; |
| 317 | strong_not_saturated_render_blocks_ = 0; |
| 318 | } |
| 319 | void AecState::InitialState::InitialState::Update(bool active_render, |
| 320 | bool saturated_capture) { |
| 321 | strong_not_saturated_render_blocks_ += |
| 322 | active_render && !saturated_capture ? 1 : 0; |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 323 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 324 | // Flag whether the initial state is still active. |
| 325 | bool prev_initial_state = initial_state_; |
| 326 | if (conservative_initial_phase_) { |
| 327 | initial_state_ = |
| 328 | strong_not_saturated_render_blocks_ < 5 * kNumBlocksPerSecond; |
Per Åhgren | 31122d6 | 2018-04-10 16:33:55 +0200 | [diff] [blame] | 329 | } else { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 330 | initial_state_ = strong_not_saturated_render_blocks_ < |
| 331 | initial_state_seconds_ * kNumBlocksPerSecond; |
Per Åhgren | 31122d6 | 2018-04-10 16:33:55 +0200 | [diff] [blame] | 332 | } |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 333 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 334 | // Flag whether the transition from the initial state has started. |
| 335 | transition_triggered_ = !initial_state_ && prev_initial_state; |
| 336 | } |
| 337 | |
| 338 | AecState::FilterDelay::FilterDelay(const EchoCanceller3Config& config) |
Gustaf Ullberg | 9249fbf | 2019-03-14 11:24:54 +0100 | [diff] [blame] | 339 | : delay_headroom_samples_(config.delay.delay_headroom_samples) {} |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 340 | |
| 341 | void AecState::FilterDelay::Update( |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 342 | const std::vector<std::unique_ptr<FilterAnalyzer>>& filter_analyzers, |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 343 | const absl::optional<DelayEstimate>& external_delay, |
| 344 | size_t blocks_with_proper_filter_adaptation) { |
| 345 | // Update the delay based on the external delay. |
| 346 | if (external_delay && |
| 347 | (!external_delay_ || external_delay_->delay != external_delay->delay)) { |
| 348 | external_delay_ = external_delay; |
| 349 | external_delay_reported_ = true; |
| 350 | } |
| 351 | |
| 352 | // Override the estimated delay if it is not certain that the filter has had |
| 353 | // time to converge. |
| 354 | const bool delay_estimator_may_not_have_converged = |
| 355 | blocks_with_proper_filter_adaptation < 2 * kNumBlocksPerSecond; |
| 356 | if (delay_estimator_may_not_have_converged && external_delay_) { |
Gustaf Ullberg | 9249fbf | 2019-03-14 11:24:54 +0100 | [diff] [blame] | 357 | filter_delay_blocks_ = delay_headroom_samples_ / kBlockSize; |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 358 | } else { |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 359 | // Conservatively use the min delay among the filters. |
| 360 | filter_delay_blocks_ = filter_analyzers[0]->DelayBlocks(); |
| 361 | for (size_t ch = 1; ch < filter_analyzers.size(); ++ch) { |
| 362 | filter_delay_blocks_ = |
| 363 | std::min(filter_delay_blocks_, filter_analyzers[ch]->DelayBlocks()); |
| 364 | } |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 365 | } |
| 366 | } |
| 367 | |
| 368 | AecState::TransparentMode::TransparentMode(const EchoCanceller3Config& config) |
| 369 | : bounded_erl_(config.ep_strength.bounded_erl), |
| 370 | linear_and_stable_echo_path_( |
| 371 | config.echo_removal_control.linear_and_stable_echo_path), |
| 372 | active_blocks_since_sane_filter_(kBlocksSinceConsistentEstimateInit), |
| 373 | non_converged_sequence_size_(kBlocksSinceConvergencedFilterInit) {} |
| 374 | |
| 375 | void AecState::TransparentMode::Reset() { |
| 376 | non_converged_sequence_size_ = kBlocksSinceConvergencedFilterInit; |
| 377 | diverged_sequence_size_ = 0; |
| 378 | strong_not_saturated_render_blocks_ = 0; |
| 379 | if (linear_and_stable_echo_path_) { |
| 380 | recent_convergence_during_activity_ = false; |
| 381 | } |
| 382 | } |
| 383 | |
| 384 | void AecState::TransparentMode::Update(int filter_delay_blocks, |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 385 | bool any_filter_consistent, |
| 386 | bool any_filter_converged, |
| 387 | bool all_filters_diverged, |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 388 | bool active_render, |
| 389 | bool saturated_capture) { |
| 390 | ++capture_block_counter_; |
| 391 | strong_not_saturated_render_blocks_ += |
| 392 | active_render && !saturated_capture ? 1 : 0; |
| 393 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 394 | if (any_filter_consistent && filter_delay_blocks < 5) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 395 | sane_filter_observed_ = true; |
| 396 | active_blocks_since_sane_filter_ = 0; |
| 397 | } else if (active_render) { |
| 398 | ++active_blocks_since_sane_filter_; |
| 399 | } |
| 400 | |
| 401 | bool sane_filter_recently_seen; |
| 402 | if (!sane_filter_observed_) { |
| 403 | sane_filter_recently_seen = |
| 404 | capture_block_counter_ <= 5 * kNumBlocksPerSecond; |
| 405 | } else { |
| 406 | sane_filter_recently_seen = |
| 407 | active_blocks_since_sane_filter_ <= 30 * kNumBlocksPerSecond; |
| 408 | } |
| 409 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 410 | if (any_filter_converged) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 411 | recent_convergence_during_activity_ = true; |
| 412 | active_non_converged_sequence_size_ = 0; |
| 413 | non_converged_sequence_size_ = 0; |
| 414 | ++num_converged_blocks_; |
| 415 | } else { |
| 416 | if (++non_converged_sequence_size_ > 20 * kNumBlocksPerSecond) { |
| 417 | num_converged_blocks_ = 0; |
| 418 | } |
| 419 | |
| 420 | if (active_render && |
| 421 | ++active_non_converged_sequence_size_ > 60 * kNumBlocksPerSecond) { |
| 422 | recent_convergence_during_activity_ = false; |
| 423 | } |
| 424 | } |
| 425 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 426 | if (!all_filters_diverged) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 427 | diverged_sequence_size_ = 0; |
| 428 | } else if (++diverged_sequence_size_ >= 60) { |
| 429 | // TODO(peah): Change these lines to ensure proper triggering of usable |
| 430 | // filter. |
| 431 | non_converged_sequence_size_ = kBlocksSinceConvergencedFilterInit; |
| 432 | } |
| 433 | |
| 434 | if (active_non_converged_sequence_size_ > 60 * kNumBlocksPerSecond) { |
| 435 | finite_erl_recently_detected_ = false; |
| 436 | } |
| 437 | if (num_converged_blocks_ > 50) { |
| 438 | finite_erl_recently_detected_ = true; |
| 439 | } |
| 440 | |
| 441 | if (bounded_erl_) { |
| 442 | transparency_activated_ = false; |
| 443 | } else if (finite_erl_recently_detected_) { |
| 444 | transparency_activated_ = false; |
| 445 | } else if (sane_filter_recently_seen && recent_convergence_during_activity_) { |
| 446 | transparency_activated_ = false; |
| 447 | } else { |
| 448 | const bool filter_should_have_converged = |
| 449 | strong_not_saturated_render_blocks_ > 6 * kNumBlocksPerSecond; |
| 450 | transparency_activated_ = filter_should_have_converged; |
| 451 | } |
| 452 | } |
| 453 | |
| 454 | AecState::FilteringQualityAnalyzer::FilteringQualityAnalyzer( |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 455 | const EchoCanceller3Config& config) {} |
| 456 | |
| 457 | void AecState::FilteringQualityAnalyzer::Reset() { |
| 458 | usable_linear_estimate_ = false; |
| 459 | filter_update_blocks_since_reset_ = 0; |
| 460 | } |
| 461 | |
| 462 | void AecState::FilteringQualityAnalyzer::Update( |
| 463 | bool active_render, |
| 464 | bool transparent_mode, |
| 465 | bool saturated_capture, |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 466 | const absl::optional<DelayEstimate>& external_delay, |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 467 | bool any_filter_converged) { |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 468 | // Update blocks counter. |
| 469 | const bool filter_update = active_render && !saturated_capture; |
| 470 | filter_update_blocks_since_reset_ += filter_update ? 1 : 0; |
| 471 | filter_update_blocks_since_start_ += filter_update ? 1 : 0; |
| 472 | |
| 473 | // Store convergence flag when observed. |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 474 | convergence_seen_ = convergence_seen_ || any_filter_converged; |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 475 | |
| 476 | // Verify requirements for achieving a decent filter. The requirements for |
| 477 | // filter adaptation at call startup are more restrictive than after an |
| 478 | // in-call reset. |
| 479 | const bool sufficient_data_to_converge_at_startup = |
| 480 | filter_update_blocks_since_start_ > kNumBlocksPerSecond * 0.4f; |
| 481 | const bool sufficient_data_to_converge_at_reset = |
| 482 | sufficient_data_to_converge_at_startup && |
| 483 | filter_update_blocks_since_reset_ > kNumBlocksPerSecond * 0.2f; |
| 484 | |
| 485 | // The linear filter can only be used it has had time to converge. |
| 486 | usable_linear_estimate_ = sufficient_data_to_converge_at_startup && |
| 487 | sufficient_data_to_converge_at_reset; |
| 488 | |
| 489 | // The linear filter can only be used if an external delay or convergence have |
| 490 | // been identified |
| 491 | usable_linear_estimate_ = |
| 492 | usable_linear_estimate_ && (external_delay || convergence_seen_); |
| 493 | |
| 494 | // If transparent mode is on, deactivate usign the linear filter. |
| 495 | usable_linear_estimate_ = usable_linear_estimate_ && !transparent_mode; |
| 496 | } |
| 497 | |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 498 | void AecState::SaturationDetector::Update( |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 499 | rtc::ArrayView<const std::vector<float>> x, |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 500 | bool saturated_capture, |
| 501 | bool usable_linear_estimate, |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 502 | rtc::ArrayView<const SubtractorOutput> subtractor_output, |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 503 | float echo_path_gain) { |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 504 | saturated_echo_ = false; |
| 505 | if (!saturated_capture) { |
| 506 | return; |
| 507 | } |
| 508 | |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 509 | if (usable_linear_estimate) { |
| 510 | constexpr float kSaturationThreshold = 20000.f; |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 511 | for (size_t ch = 0; ch < subtractor_output.size(); ++ch) { |
| 512 | saturated_echo_ = |
| 513 | saturated_echo_ || |
| 514 | (subtractor_output[ch].s_main_max_abs > kSaturationThreshold || |
| 515 | subtractor_output[ch].s_shadow_max_abs > kSaturationThreshold); |
| 516 | } |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 517 | } else { |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 518 | float max_sample = 0.f; |
| 519 | for (auto& channel : x) { |
| 520 | for (float sample : channel) { |
| 521 | max_sample = std::max(max_sample, fabsf(sample)); |
| 522 | } |
| 523 | } |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 524 | |
| 525 | const float kMargin = 10.f; |
| 526 | float peak_echo_amplitude = max_sample * echo_path_gain * kMargin; |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 527 | saturated_echo_ = saturated_echo_ || peak_echo_amplitude > 32000; |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 528 | } |
| 529 | } |
| 530 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 531 | } // namespace webrtc |