peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #include "modules/audio_processing/aec3/aec_state.h" |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 12 | |
| 13 | #include <math.h> |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 14 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 15 | #include <algorithm> |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 16 | #include <numeric> |
| 17 | #include <vector> |
| 18 | |
Jesús de Vicente Peña | 496cedf | 2018-07-04 11:02:09 +0200 | [diff] [blame] | 19 | #include "absl/types/optional.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 20 | #include "api/array_view.h" |
Jesús de Vicente Peña | 496cedf | 2018-07-04 11:02:09 +0200 | [diff] [blame] | 21 | #include "modules/audio_processing/aec3/aec3_common.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 22 | #include "modules/audio_processing/logging/apm_data_dumper.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 23 | #include "rtc_base/atomic_ops.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 24 | #include "rtc_base/checks.h" |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 25 | |
| 26 | namespace webrtc { |
| 27 | namespace { |
| 28 | |
// Start value for TransparentMode's count of active render blocks since a
// consistent, low-delay filter was last observed.
constexpr size_t kBlocksSinceConsistentEstimateInit = 10000;
// Start value for TransparentMode's count of consecutive blocks without any
// converged filter. The same value is written back after a long run of blocks
// where all filters have diverged.
constexpr size_t kBlocksSinceConvergencedFilterInit = 10000;
| 31 | |
Per Åhgren | 8718afb | 2019-10-15 10:31:35 +0200 | [diff] [blame] | 32 | void ComputeAvgRenderReverb( |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 33 | const SpectrumBuffer& spectrum_buffer, |
| 34 | int delay_blocks, |
| 35 | float reverb_decay, |
| 36 | ReverbModel* reverb_model, |
| 37 | rtc::ArrayView<float, kFftLengthBy2Plus1> reverb_power_spectrum) { |
| 38 | RTC_DCHECK(reverb_model); |
| 39 | const size_t num_render_channels = spectrum_buffer.buffer[0].size(); |
| 40 | int idx_at_delay = |
| 41 | spectrum_buffer.OffsetIndex(spectrum_buffer.read, delay_blocks); |
| 42 | int idx_past = spectrum_buffer.IncIndex(idx_at_delay); |
| 43 | |
| 44 | std::array<float, kFftLengthBy2Plus1> X2_data; |
| 45 | rtc::ArrayView<const float> X2; |
| 46 | if (num_render_channels > 1) { |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 47 | auto average_channels = |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 48 | [](size_t num_render_channels, |
Sam Zackrisson | 98872dc | 2019-10-18 08:20:09 +0200 | [diff] [blame] | 49 | rtc::ArrayView<const std::array<float, kFftLengthBy2Plus1>> |
| 50 | spectrum_band_0, |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 51 | rtc::ArrayView<float, kFftLengthBy2Plus1> render_power) { |
| 52 | std::fill(render_power.begin(), render_power.end(), 0.f); |
| 53 | for (size_t ch = 0; ch < num_render_channels; ++ch) { |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 54 | for (size_t k = 0; k < kFftLengthBy2Plus1; ++k) { |
| 55 | render_power[k] += spectrum_band_0[ch][k]; |
| 56 | } |
| 57 | } |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 58 | const float normalizer = 1.f / num_render_channels; |
| 59 | for (size_t k = 0; k < kFftLengthBy2Plus1; ++k) { |
| 60 | render_power[k] *= normalizer; |
| 61 | } |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 62 | }; |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 63 | average_channels(num_render_channels, spectrum_buffer.buffer[idx_past], |
| 64 | X2_data); |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 65 | reverb_model->UpdateReverbNoFreqShaping( |
| 66 | X2_data, /*power_spectrum_scaling=*/1.0f, reverb_decay); |
| 67 | |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 68 | average_channels(num_render_channels, spectrum_buffer.buffer[idx_at_delay], |
| 69 | X2_data); |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 70 | X2 = X2_data; |
| 71 | } else { |
| 72 | reverb_model->UpdateReverbNoFreqShaping( |
| 73 | spectrum_buffer.buffer[idx_past][/*channel=*/0], |
| 74 | /*power_spectrum_scaling=*/1.0f, reverb_decay); |
| 75 | |
| 76 | X2 = spectrum_buffer.buffer[idx_at_delay][/*channel=*/0]; |
| 77 | } |
| 78 | |
| 79 | rtc::ArrayView<const float, kFftLengthBy2Plus1> reverb_power = |
| 80 | reverb_model->reverb(); |
| 81 | for (size_t k = 0; k < X2.size(); ++k) { |
| 82 | reverb_power_spectrum[k] = X2[k] + reverb_power[k]; |
| 83 | } |
| 84 | } |
| 85 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 86 | } // namespace |
| 87 | |
| 88 | int AecState::instance_count_ = 0; |
| 89 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 90 | void AecState::GetResidualEchoScaling( |
| 91 | rtc::ArrayView<float> residual_scaling) const { |
| 92 | bool filter_has_had_time_to_converge; |
| 93 | if (config_.filter.conservative_initial_phase) { |
| 94 | filter_has_had_time_to_converge = |
| 95 | strong_not_saturated_render_blocks_ >= 1.5f * kNumBlocksPerSecond; |
| 96 | } else { |
| 97 | filter_has_had_time_to_converge = |
| 98 | strong_not_saturated_render_blocks_ >= 0.8f * kNumBlocksPerSecond; |
| 99 | } |
| 100 | echo_audibility_.GetResidualEchoScaling(filter_has_had_time_to_converge, |
| 101 | residual_scaling); |
| 102 | } |
| 103 | |
| 104 | absl::optional<float> AecState::ErleUncertainty() const { |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 105 | if (SaturatedEcho()) { |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 106 | return 1.f; |
| 107 | } |
| 108 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 109 | return absl::nullopt; |
| 110 | } |
| 111 | |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 112 | AecState::AecState(const EchoCanceller3Config& config, |
| 113 | size_t num_capture_channels) |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 114 | : data_dumper_( |
| 115 | new ApmDataDumper(rtc::AtomicOps::Increment(&instance_count_))), |
peah | 8cee56f | 2017-08-24 22:36:53 -0700 | [diff] [blame] | 116 | config_(config), |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 117 | num_capture_channels_(num_capture_channels), |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 118 | initial_state_(config_), |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 119 | delay_state_(config_, num_capture_channels_), |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 120 | transparent_state_(config_), |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 121 | filter_quality_state_(config_, num_capture_channels_), |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 122 | erl_estimator_(2 * kNumBlocksPerSecond), |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 123 | erle_estimator_(2 * kNumBlocksPerSecond, config_, num_capture_channels_), |
| 124 | filter_analyzer_(config_, num_capture_channels_), |
Jesús de Vicente Peña | 836a7a2 | 2018-08-31 15:03:04 +0200 | [diff] [blame] | 125 | echo_audibility_( |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 126 | config_.echo_audibility.use_stationarity_properties_at_init), |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 127 | reverb_model_estimator_(config_, num_capture_channels_), |
| 128 | subtractor_output_analyzer_(num_capture_channels_) {} |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 129 | |
| 130 | AecState::~AecState() = default; |
| 131 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 132 | void AecState::HandleEchoPathChange( |
| 133 | const EchoPathVariability& echo_path_variability) { |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 134 | const auto full_reset = [&]() { |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 135 | filter_analyzer_.Reset(); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 136 | capture_signal_saturation_ = false; |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 137 | strong_not_saturated_render_blocks_ = 0; |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 138 | blocks_with_active_render_ = 0; |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 139 | initial_state_.Reset(); |
| 140 | transparent_state_.Reset(); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 141 | erle_estimator_.Reset(true); |
| 142 | erl_estimator_.Reset(); |
Jesús de Vicente Peña | 70a5963 | 2019-04-16 12:32:15 +0200 | [diff] [blame] | 143 | filter_quality_state_.Reset(); |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 144 | }; |
peah | 6d822ad | 2017-04-10 13:52:14 -0700 | [diff] [blame] | 145 | |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 146 | // TODO(peah): Refine the reset scheme according to the type of gain and |
| 147 | // delay adjustment. |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 148 | |
| 149 | if (echo_path_variability.delay_change != |
Per Åhgren | 88cf050 | 2018-07-16 17:08:41 +0200 | [diff] [blame] | 150 | EchoPathVariability::DelayAdjustment::kNone) { |
Per Åhgren | 8ba5861 | 2017-12-01 23:01:44 +0100 | [diff] [blame] | 151 | full_reset(); |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 152 | } else if (echo_path_variability.gain_change) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 153 | erle_estimator_.Reset(false); |
Per Åhgren | d2650d1 | 2018-10-02 17:00:59 +0200 | [diff] [blame] | 154 | } |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 155 | subtractor_output_analyzer_.HandleEchoPathChange(); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 156 | } |
| 157 | |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 158 | void AecState::Update( |
Danil Chapovalov | db9f7ab | 2018-06-19 10:50:11 +0200 | [diff] [blame] | 159 | const absl::optional<DelayEstimate>& external_delay, |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 160 | rtc::ArrayView<const std::vector<std::array<float, kFftLengthBy2Plus1>>> |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 161 | adaptive_filter_frequency_responses, |
| 162 | rtc::ArrayView<const std::vector<float>> adaptive_filter_impulse_responses, |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 163 | const RenderBuffer& render_buffer, |
Per Åhgren | f980725 | 2019-10-09 13:57:07 +0200 | [diff] [blame] | 164 | rtc::ArrayView<const std::array<float, kFftLengthBy2Plus1>> E2_main, |
| 165 | rtc::ArrayView<const std::array<float, kFftLengthBy2Plus1>> Y2, |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 166 | rtc::ArrayView<const SubtractorOutput> subtractor_output) { |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 167 | RTC_DCHECK_EQ(num_capture_channels_, Y2.size()); |
| 168 | RTC_DCHECK_EQ(num_capture_channels_, subtractor_output.size()); |
| 169 | RTC_DCHECK_EQ(num_capture_channels_, |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 170 | adaptive_filter_frequency_responses.size()); |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 171 | RTC_DCHECK_EQ(num_capture_channels_, |
| 172 | adaptive_filter_impulse_responses.size()); |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 173 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 174 | // Analyze the filter outputs and filters. |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 175 | bool any_filter_converged; |
| 176 | bool all_filters_diverged; |
| 177 | subtractor_output_analyzer_.Update(subtractor_output, &any_filter_converged, |
| 178 | &all_filters_diverged); |
| 179 | |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 180 | bool any_filter_consistent; |
| 181 | float max_echo_path_gain; |
| 182 | filter_analyzer_.Update(adaptive_filter_impulse_responses, render_buffer, |
| 183 | &any_filter_consistent, &max_echo_path_gain); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 184 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 185 | // Estimate the direct path delay of the filter. |
Gustaf Ullberg | 9466b66 | 2019-04-15 09:53:03 +0200 | [diff] [blame] | 186 | if (config_.filter.use_linear_filter) { |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 187 | delay_state_.Update(filter_analyzer_.FilterDelaysBlocks(), external_delay, |
Gustaf Ullberg | 9466b66 | 2019-04-15 09:53:03 +0200 | [diff] [blame] | 188 | strong_not_saturated_render_blocks_); |
| 189 | } |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 190 | |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 191 | const std::vector<std::vector<float>>& aligned_render_block = |
Per Åhgren | 88d662a | 2019-10-16 15:32:39 +0200 | [diff] [blame] | 192 | render_buffer.Block(-delay_state_.MinDirectPathFilterDelay())[0]; |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 193 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 194 | // Update render counters. |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 195 | bool active_render = false; |
| 196 | for (size_t ch = 0; ch < aligned_render_block.size(); ++ch) { |
| 197 | const float render_energy = std::inner_product( |
| 198 | aligned_render_block[ch].begin(), aligned_render_block[ch].end(), |
| 199 | aligned_render_block[ch].begin(), 0.f); |
| 200 | if (render_energy > (config_.render_levels.active_render_limit * |
| 201 | config_.render_levels.active_render_limit) * |
| 202 | kFftLengthBy2) { |
| 203 | active_render = true; |
| 204 | break; |
| 205 | } |
| 206 | } |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 207 | blocks_with_active_render_ += active_render ? 1 : 0; |
| 208 | strong_not_saturated_render_blocks_ += |
| 209 | active_render && !SaturatedCapture() ? 1 : 0; |
Per Åhgren | 0e6d2f5 | 2017-12-20 22:19:56 +0100 | [diff] [blame] | 210 | |
Per Åhgren | 8718afb | 2019-10-15 10:31:35 +0200 | [diff] [blame] | 211 | std::array<float, kFftLengthBy2Plus1> avg_render_spectrum_with_reverb; |
Per Åhgren | 1d3008b | 2019-10-09 12:54:43 +0200 | [diff] [blame] | 212 | |
Per Åhgren | 8718afb | 2019-10-15 10:31:35 +0200 | [diff] [blame] | 213 | ComputeAvgRenderReverb(render_buffer.GetSpectrumBuffer(), |
| 214 | delay_state_.MinDirectPathFilterDelay(), ReverbDecay(), |
| 215 | &avg_render_reverb_, avg_render_spectrum_with_reverb); |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 216 | |
Jesús de Vicente Peña | 70a5963 | 2019-04-16 12:32:15 +0200 | [diff] [blame] | 217 | if (config_.echo_audibility.use_stationarity_properties) { |
Jesús de Vicente Peña | d5cb477 | 2018-04-25 13:58:45 +0200 | [diff] [blame] | 218 | // Update the echo audibility evaluator. |
Per Åhgren | 8718afb | 2019-10-15 10:31:35 +0200 | [diff] [blame] | 219 | echo_audibility_.Update(render_buffer, avg_render_reverb_.reverb(), |
| 220 | delay_state_.MinDirectPathFilterDelay(), |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 221 | delay_state_.ExternalDelayReported()); |
Jesús de Vicente Peña | d5cb477 | 2018-04-25 13:58:45 +0200 | [diff] [blame] | 222 | } |
| 223 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 224 | // Update the ERL and ERLE measures. |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 225 | if (initial_state_.TransitionTriggered()) { |
| 226 | erle_estimator_.Reset(false); |
Jesús de Vicente Peña | 02e9e44 | 2018-08-29 13:34:07 +0200 | [diff] [blame] | 227 | } |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 228 | |
Per Åhgren | 785d4c4 | 2019-10-17 14:40:54 +0200 | [diff] [blame] | 229 | erle_estimator_.Update(render_buffer, adaptive_filter_frequency_responses, |
| 230 | avg_render_spectrum_with_reverb, Y2, E2_main, |
| 231 | subtractor_output_analyzer_.ConvergedFilters()); |
Jesús de Vicente Peña | c98849c | 2018-10-22 11:41:05 +0200 | [diff] [blame] | 232 | |
Sam Zackrisson | 6e5433c | 2019-10-18 16:49:13 +0200 | [diff] [blame] | 233 | erl_estimator_.Update( |
| 234 | subtractor_output_analyzer_.ConvergedFilters(), |
| 235 | render_buffer.Spectrum(delay_state_.MinDirectPathFilterDelay()), Y2); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 236 | |
Per Åhgren | 63b494d | 2017-12-06 11:32:38 +0100 | [diff] [blame] | 237 | // Detect and flag echo saturation. |
Gustaf Ullberg | 68d6d44 | 2019-01-29 10:08:15 +0100 | [diff] [blame] | 238 | saturation_detector_.Update(aligned_render_block, SaturatedCapture(), |
| 239 | UsableLinearEstimate(), subtractor_output, |
Sam Zackrisson | 0169a3e | 2019-10-09 08:00:29 +0200 | [diff] [blame] | 240 | max_echo_path_gain); |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 241 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 242 | // Update the decision on whether to use the initial state parameter set. |
| 243 | initial_state_.Update(active_render, SaturatedCapture()); |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 244 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 245 | // Detect whether the transparent mode should be activated. |
Per Åhgren | 88d662a | 2019-10-16 15:32:39 +0200 | [diff] [blame] | 246 | transparent_state_.Update(delay_state_.MinDirectPathFilterDelay(), |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 247 | any_filter_consistent, any_filter_converged, |
| 248 | all_filters_diverged, active_render, |
| 249 | SaturatedCapture()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 250 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 251 | // Analyze the quality of the filter. |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 252 | filter_quality_state_.Update(active_render, TransparentMode(), |
| 253 | SaturatedCapture(), external_delay, |
| 254 | any_filter_converged); |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 255 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 256 | // Update the reverb estimate. |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 257 | const bool stationary_block = |
Jesús de Vicente Peña | 70a5963 | 2019-04-16 12:32:15 +0200 | [diff] [blame] | 258 | config_.echo_audibility.use_stationarity_properties && |
Per Åhgren | f4801a1 | 2018-09-27 13:14:02 +0200 | [diff] [blame] | 259 | echo_audibility_.IsBlockStationary(); |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 260 | |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 261 | reverb_model_estimator_.Update( |
| 262 | filter_analyzer_.GetAdjustedFilters(), |
| 263 | adaptive_filter_frequency_responses, |
| 264 | erle_estimator_.GetInstLinearQualityEstimates(), |
| 265 | delay_state_.DirectPathFilterDelays(), |
| 266 | filter_quality_state_.UsableLinearFilterOutputs(), stationary_block); |
Jesús de Vicente Peña | 075cb2b | 2018-06-13 15:13:55 +0200 | [diff] [blame] | 267 | |
Jesús de Vicente Peña | 496cedf | 2018-07-04 11:02:09 +0200 | [diff] [blame] | 268 | erle_estimator_.Dump(data_dumper_); |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 269 | reverb_model_estimator_.Dump(data_dumper_.get()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 270 | data_dumper_->DumpRaw("aec3_erl", Erl()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 271 | data_dumper_->DumpRaw("aec3_erl_time_domain", ErlTimeDomain()); |
Per Åhgren | b4161d3 | 2019-10-08 12:35:47 +0200 | [diff] [blame] | 272 | data_dumper_->DumpRaw("aec3_erle", Erle()[0]); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 273 | data_dumper_->DumpRaw("aec3_usable_linear_estimate", UsableLinearEstimate()); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 274 | data_dumper_->DumpRaw("aec3_transparent_mode", TransparentMode()); |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 275 | data_dumper_->DumpRaw("aec3_filter_delay", |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 276 | filter_analyzer_.MinFilterDelayBlocks()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 277 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 278 | data_dumper_->DumpRaw("aec3_any_filter_consistent", any_filter_consistent); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 279 | data_dumper_->DumpRaw("aec3_initial_state", |
| 280 | initial_state_.InitialStateActive()); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 281 | data_dumper_->DumpRaw("aec3_capture_saturation", SaturatedCapture()); |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 282 | data_dumper_->DumpRaw("aec3_echo_saturation", SaturatedEcho()); |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 283 | data_dumper_->DumpRaw("aec3_any_filter_converged", any_filter_converged); |
| 284 | data_dumper_->DumpRaw("aec3_all_filters_diverged", all_filters_diverged); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 285 | |
| 286 | data_dumper_->DumpRaw("aec3_external_delay_avaliable", |
| 287 | external_delay ? 1 : 0); |
Per Åhgren | ef5d5af | 2018-07-31 00:03:46 +0200 | [diff] [blame] | 288 | data_dumper_->DumpRaw("aec3_filter_tail_freq_resp_est", |
| 289 | GetReverbFrequencyResponse()); |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 290 | } |
| 291 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 292 | AecState::InitialState::InitialState(const EchoCanceller3Config& config) |
| 293 | : conservative_initial_phase_(config.filter.conservative_initial_phase), |
| 294 | initial_state_seconds_(config.filter.initial_state_seconds) { |
| 295 | Reset(); |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 296 | } |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 297 | void AecState::InitialState::InitialState::Reset() { |
| 298 | initial_state_ = true; |
| 299 | strong_not_saturated_render_blocks_ = 0; |
| 300 | } |
| 301 | void AecState::InitialState::InitialState::Update(bool active_render, |
| 302 | bool saturated_capture) { |
| 303 | strong_not_saturated_render_blocks_ += |
| 304 | active_render && !saturated_capture ? 1 : 0; |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 305 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 306 | // Flag whether the initial state is still active. |
| 307 | bool prev_initial_state = initial_state_; |
| 308 | if (conservative_initial_phase_) { |
| 309 | initial_state_ = |
| 310 | strong_not_saturated_render_blocks_ < 5 * kNumBlocksPerSecond; |
Per Åhgren | 31122d6 | 2018-04-10 16:33:55 +0200 | [diff] [blame] | 311 | } else { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 312 | initial_state_ = strong_not_saturated_render_blocks_ < |
| 313 | initial_state_seconds_ * kNumBlocksPerSecond; |
Per Åhgren | 31122d6 | 2018-04-10 16:33:55 +0200 | [diff] [blame] | 314 | } |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 315 | |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 316 | // Flag whether the transition from the initial state has started. |
| 317 | transition_triggered_ = !initial_state_ && prev_initial_state; |
| 318 | } |
| 319 | |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 320 | AecState::FilterDelay::FilterDelay(const EchoCanceller3Config& config, |
| 321 | size_t num_capture_channels) |
| 322 | : delay_headroom_samples_(config.delay.delay_headroom_samples), |
| 323 | filter_delays_blocks_(num_capture_channels, 0) {} |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 324 | |
| 325 | void AecState::FilterDelay::Update( |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 326 | rtc::ArrayView<const int> analyzer_filter_delay_estimates_blocks, |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 327 | const absl::optional<DelayEstimate>& external_delay, |
| 328 | size_t blocks_with_proper_filter_adaptation) { |
| 329 | // Update the delay based on the external delay. |
| 330 | if (external_delay && |
| 331 | (!external_delay_ || external_delay_->delay != external_delay->delay)) { |
| 332 | external_delay_ = external_delay; |
| 333 | external_delay_reported_ = true; |
| 334 | } |
| 335 | |
| 336 | // Override the estimated delay if it is not certain that the filter has had |
| 337 | // time to converge. |
| 338 | const bool delay_estimator_may_not_have_converged = |
| 339 | blocks_with_proper_filter_adaptation < 2 * kNumBlocksPerSecond; |
| 340 | if (delay_estimator_may_not_have_converged && external_delay_) { |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 341 | int delay_guess = delay_headroom_samples_ / kBlockSize; |
| 342 | std::fill(filter_delays_blocks_.begin(), filter_delays_blocks_.end(), |
| 343 | delay_guess); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 344 | } else { |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 345 | RTC_DCHECK_EQ(filter_delays_blocks_.size(), |
| 346 | analyzer_filter_delay_estimates_blocks.size()); |
| 347 | std::copy(analyzer_filter_delay_estimates_blocks.begin(), |
| 348 | analyzer_filter_delay_estimates_blocks.end(), |
| 349 | filter_delays_blocks_.begin()); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 350 | } |
Per Åhgren | 8718afb | 2019-10-15 10:31:35 +0200 | [diff] [blame] | 351 | |
| 352 | min_filter_delay_ = *std::min_element(filter_delays_blocks_.begin(), |
| 353 | filter_delays_blocks_.end()); |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 354 | } |
| 355 | |
| 356 | AecState::TransparentMode::TransparentMode(const EchoCanceller3Config& config) |
| 357 | : bounded_erl_(config.ep_strength.bounded_erl), |
| 358 | linear_and_stable_echo_path_( |
| 359 | config.echo_removal_control.linear_and_stable_echo_path), |
| 360 | active_blocks_since_sane_filter_(kBlocksSinceConsistentEstimateInit), |
| 361 | non_converged_sequence_size_(kBlocksSinceConvergencedFilterInit) {} |
| 362 | |
| 363 | void AecState::TransparentMode::Reset() { |
| 364 | non_converged_sequence_size_ = kBlocksSinceConvergencedFilterInit; |
| 365 | diverged_sequence_size_ = 0; |
| 366 | strong_not_saturated_render_blocks_ = 0; |
| 367 | if (linear_and_stable_echo_path_) { |
| 368 | recent_convergence_during_activity_ = false; |
| 369 | } |
| 370 | } |
| 371 | |
| 372 | void AecState::TransparentMode::Update(int filter_delay_blocks, |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 373 | bool any_filter_consistent, |
| 374 | bool any_filter_converged, |
| 375 | bool all_filters_diverged, |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 376 | bool active_render, |
| 377 | bool saturated_capture) { |
| 378 | ++capture_block_counter_; |
| 379 | strong_not_saturated_render_blocks_ += |
| 380 | active_render && !saturated_capture ? 1 : 0; |
| 381 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 382 | if (any_filter_consistent && filter_delay_blocks < 5) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 383 | sane_filter_observed_ = true; |
| 384 | active_blocks_since_sane_filter_ = 0; |
| 385 | } else if (active_render) { |
| 386 | ++active_blocks_since_sane_filter_; |
| 387 | } |
| 388 | |
| 389 | bool sane_filter_recently_seen; |
| 390 | if (!sane_filter_observed_) { |
| 391 | sane_filter_recently_seen = |
| 392 | capture_block_counter_ <= 5 * kNumBlocksPerSecond; |
| 393 | } else { |
| 394 | sane_filter_recently_seen = |
| 395 | active_blocks_since_sane_filter_ <= 30 * kNumBlocksPerSecond; |
| 396 | } |
| 397 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 398 | if (any_filter_converged) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 399 | recent_convergence_during_activity_ = true; |
| 400 | active_non_converged_sequence_size_ = 0; |
| 401 | non_converged_sequence_size_ = 0; |
| 402 | ++num_converged_blocks_; |
| 403 | } else { |
| 404 | if (++non_converged_sequence_size_ > 20 * kNumBlocksPerSecond) { |
| 405 | num_converged_blocks_ = 0; |
| 406 | } |
| 407 | |
| 408 | if (active_render && |
| 409 | ++active_non_converged_sequence_size_ > 60 * kNumBlocksPerSecond) { |
| 410 | recent_convergence_during_activity_ = false; |
| 411 | } |
| 412 | } |
| 413 | |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 414 | if (!all_filters_diverged) { |
Per Åhgren | c5a38ad | 2018-10-04 15:37:54 +0200 | [diff] [blame] | 415 | diverged_sequence_size_ = 0; |
| 416 | } else if (++diverged_sequence_size_ >= 60) { |
| 417 | // TODO(peah): Change these lines to ensure proper triggering of usable |
| 418 | // filter. |
| 419 | non_converged_sequence_size_ = kBlocksSinceConvergencedFilterInit; |
| 420 | } |
| 421 | |
| 422 | if (active_non_converged_sequence_size_ > 60 * kNumBlocksPerSecond) { |
| 423 | finite_erl_recently_detected_ = false; |
| 424 | } |
| 425 | if (num_converged_blocks_ > 50) { |
| 426 | finite_erl_recently_detected_ = true; |
| 427 | } |
| 428 | |
| 429 | if (bounded_erl_) { |
| 430 | transparency_activated_ = false; |
| 431 | } else if (finite_erl_recently_detected_) { |
| 432 | transparency_activated_ = false; |
| 433 | } else if (sane_filter_recently_seen && recent_convergence_during_activity_) { |
| 434 | transparency_activated_ = false; |
| 435 | } else { |
| 436 | const bool filter_should_have_converged = |
| 437 | strong_not_saturated_render_blocks_ > 6 * kNumBlocksPerSecond; |
| 438 | transparency_activated_ = filter_should_have_converged; |
| 439 | } |
| 440 | } |
| 441 | |
| 442 | AecState::FilteringQualityAnalyzer::FilteringQualityAnalyzer( |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 443 | const EchoCanceller3Config& config, |
| 444 | size_t num_capture_channels) |
| 445 | : use_linear_filter_(config.filter.use_linear_filter), |
| 446 | usable_linear_filter_estimates_(num_capture_channels, false) {} |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 447 | |
| 448 | void AecState::FilteringQualityAnalyzer::Reset() { |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 449 | std::fill(usable_linear_filter_estimates_.begin(), |
| 450 | usable_linear_filter_estimates_.end(), false); |
| 451 | overall_usable_linear_estimates_ = false; |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 452 | filter_update_blocks_since_reset_ = 0; |
| 453 | } |
| 454 | |
| 455 | void AecState::FilteringQualityAnalyzer::Update( |
| 456 | bool active_render, |
| 457 | bool transparent_mode, |
| 458 | bool saturated_capture, |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 459 | const absl::optional<DelayEstimate>& external_delay, |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 460 | bool any_filter_converged) { |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 461 | // Update blocks counter. |
| 462 | const bool filter_update = active_render && !saturated_capture; |
| 463 | filter_update_blocks_since_reset_ += filter_update ? 1 : 0; |
| 464 | filter_update_blocks_since_start_ += filter_update ? 1 : 0; |
| 465 | |
| 466 | // Store convergence flag when observed. |
Sam Zackrisson | 46b0140 | 2019-10-08 16:17:48 +0200 | [diff] [blame] | 467 | convergence_seen_ = convergence_seen_ || any_filter_converged; |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 468 | |
| 469 | // Verify requirements for achieving a decent filter. The requirements for |
| 470 | // filter adaptation at call startup are more restrictive than after an |
| 471 | // in-call reset. |
| 472 | const bool sufficient_data_to_converge_at_startup = |
| 473 | filter_update_blocks_since_start_ > kNumBlocksPerSecond * 0.4f; |
| 474 | const bool sufficient_data_to_converge_at_reset = |
| 475 | sufficient_data_to_converge_at_startup && |
| 476 | filter_update_blocks_since_reset_ > kNumBlocksPerSecond * 0.2f; |
| 477 | |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 478 | // The linear filter can only be used if it has had time to converge. |
| 479 | overall_usable_linear_estimates_ = sufficient_data_to_converge_at_startup && |
| 480 | sufficient_data_to_converge_at_reset; |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 481 | |
| 482 | // The linear filter can only be used if an external delay or convergence have |
| 483 | // been identified |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 484 | overall_usable_linear_estimates_ = |
| 485 | overall_usable_linear_estimates_ && (external_delay || convergence_seen_); |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 486 | |
| 487 | // If transparent mode is on, deactivate usign the linear filter. |
Per Åhgren | 8be669f | 2019-10-11 23:02:26 +0200 | [diff] [blame] | 488 | overall_usable_linear_estimates_ = |
| 489 | overall_usable_linear_estimates_ && !transparent_mode; |
| 490 | |
| 491 | if (use_linear_filter_) { |
| 492 | std::fill(usable_linear_filter_estimates_.begin(), |
| 493 | usable_linear_filter_estimates_.end(), |
| 494 | overall_usable_linear_estimates_); |
| 495 | } |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 496 | } |
| 497 | |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 498 | void AecState::SaturationDetector::Update( |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 499 | rtc::ArrayView<const std::vector<float>> x, |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 500 | bool saturated_capture, |
| 501 | bool usable_linear_estimate, |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 502 | rtc::ArrayView<const SubtractorOutput> subtractor_output, |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 503 | float echo_path_gain) { |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 504 | saturated_echo_ = false; |
| 505 | if (!saturated_capture) { |
| 506 | return; |
| 507 | } |
| 508 | |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 509 | if (usable_linear_estimate) { |
| 510 | constexpr float kSaturationThreshold = 20000.f; |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 511 | for (size_t ch = 0; ch < subtractor_output.size(); ++ch) { |
| 512 | saturated_echo_ = |
| 513 | saturated_echo_ || |
| 514 | (subtractor_output[ch].s_main_max_abs > kSaturationThreshold || |
| 515 | subtractor_output[ch].s_shadow_max_abs > kSaturationThreshold); |
| 516 | } |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 517 | } else { |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 518 | float max_sample = 0.f; |
| 519 | for (auto& channel : x) { |
| 520 | for (float sample : channel) { |
| 521 | max_sample = std::max(max_sample, fabsf(sample)); |
| 522 | } |
| 523 | } |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 524 | |
| 525 | const float kMargin = 10.f; |
| 526 | float peak_echo_amplitude = max_sample * echo_path_gain * kMargin; |
Sam Zackrisson | 8f736c0 | 2019-10-01 12:47:53 +0200 | [diff] [blame] | 527 | saturated_echo_ = saturated_echo_ || peak_echo_amplitude > 32000; |
Per Åhgren | 3e7b7b1 | 2018-10-16 14:38:10 +0200 | [diff] [blame] | 528 | } |
| 529 | } |
| 530 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 531 | } // namespace webrtc |