/*
 *  Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#ifndef MODULES_AUDIO_PROCESSING_AEC3_AEC_STATE_H_
#define MODULES_AUDIO_PROCESSING_AEC3_AEC_STATE_H_

#include <math.h>
#include <stddef.h>

#include <algorithm>
#include <array>
#include <memory>
#include <vector>

#include "api/array_view.h"
#include "api/audio/echo_canceller3_config.h"
#include "api/optional.h"
#include "modules/audio_processing/aec3/aec3_common.h"
#include "modules/audio_processing/aec3/delay_estimate.h"
#include "modules/audio_processing/aec3/echo_path_variability.h"
#include "modules/audio_processing/aec3/erl_estimator.h"
#include "modules/audio_processing/aec3/erle_estimator.h"
#include "modules/audio_processing/aec3/render_buffer.h"
#include "rtc_base/constructormagic.h"

| 31 | namespace webrtc { |
| 32 | |
| 33 | class ApmDataDumper; |
| 34 | |
| 35 | // Handles the state and the conditions for the echo removal functionality. |
| 36 | class AecState { |
| 37 | public: |
Gustaf Ullberg | bd83b91 | 2017-10-18 12:32:42 +0200 | [diff] [blame] | 38 | explicit AecState(const EchoCanceller3Config& config); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 39 | ~AecState(); |
| 40 | |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 41 | // Returns whether the echo subtractor can be used to determine the residual |
| 42 | // echo. |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 43 | bool UsableLinearEstimate() const { return usable_linear_estimate_; } |
| 44 | |
| 45 | // Returns whether there has been echo leakage detected. |
| 46 | bool EchoLeakageDetected() const { return echo_leakage_detected_; } |
| 47 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 48 | // Returns whether the render signal is currently active. |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 49 | bool ActiveRender() const { return blocks_with_active_render_ > 200; } |
peah | ebe7778 | 2017-02-27 07:29:21 -0800 | [diff] [blame] | 50 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 51 | // Returns the ERLE. |
| 52 | const std::array<float, kFftLengthBy2Plus1>& Erle() const { |
| 53 | return erle_estimator_.Erle(); |
| 54 | } |
| 55 | |
Gustaf Ullberg | 332150d | 2017-11-22 14:17:39 +0100 | [diff] [blame] | 56 | // Returns the time-domain ERLE. |
| 57 | float ErleTimeDomain() const { return erle_estimator_.ErleTimeDomain(); } |
| 58 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 59 | // Returns the ERL. |
| 60 | const std::array<float, kFftLengthBy2Plus1>& Erl() const { |
| 61 | return erl_estimator_.Erl(); |
| 62 | } |
| 63 | |
Gustaf Ullberg | 332150d | 2017-11-22 14:17:39 +0100 | [diff] [blame] | 64 | // Returns the time-domain ERL. |
| 65 | float ErlTimeDomain() const { return erl_estimator_.ErlTimeDomain(); } |
| 66 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 67 | // Returns the delay estimate based on the linear filter. |
Per Åhgren | 0e6d2f5 | 2017-12-20 22:19:56 +0100 | [diff] [blame] | 68 | int FilterDelay() const { return filter_delay_; } |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 69 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 70 | // Returns whether the capture signal is saturated. |
| 71 | bool SaturatedCapture() const { return capture_signal_saturation_; } |
| 72 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 73 | // Returns whether the echo signal is saturated. |
| 74 | bool SaturatedEcho() const { return echo_saturation_; } |
| 75 | |
Per Åhgren | 7ddd463 | 2017-10-25 02:59:45 +0200 | [diff] [blame] | 76 | // Returns whether the echo path can saturate. |
| 77 | bool SaturatingEchoPath() const { return saturating_echo_path_; } |
| 78 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 79 | // Updates the capture signal saturation. |
| 80 | void UpdateCaptureSaturation(bool capture_signal_saturation) { |
| 81 | capture_signal_saturation_ = capture_signal_saturation; |
| 82 | } |
| 83 | |
Per Åhgren | 1b4059e | 2017-10-15 20:19:21 +0200 | [diff] [blame] | 84 | // Returns whether the transparent mode is active |
| 85 | bool TransparentMode() const { return transparent_mode_; } |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 86 | |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 87 | // Takes appropriate action at an echo path change. |
| 88 | void HandleEchoPathChange(const EchoPathVariability& echo_path_variability); |
| 89 | |
peah | 8942045 | 2017-04-07 06:13:39 -0700 | [diff] [blame] | 90 | // Returns the decay factor for the echo reverberation. |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 91 | float ReverbDecay() const { return reverb_decay_; } |
peah | 8942045 | 2017-04-07 06:13:39 -0700 | [diff] [blame] | 92 | |
Per Åhgren | b6b00dc | 2018-02-20 22:18:27 +0100 | [diff] [blame] | 93 | // Returns the upper limit for the echo suppression gain. |
| 94 | float SuppressionGainLimit() const { return suppressor_gain_limit_; } |
peah | 6d822ad | 2017-04-10 13:52:14 -0700 | [diff] [blame] | 95 | |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 96 | // Returns whether the echo in the capture signal is audible. |
| 97 | bool InaudibleEcho() const { return echo_audibility_.InaudibleEcho(); } |
| 98 | |
| 99 | // Updates the aec state with the AEC output signal. |
| 100 | void UpdateWithOutput(rtc::ArrayView<const float> e) { |
| 101 | echo_audibility_.UpdateWithOutput(e); |
| 102 | } |
| 103 | |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 104 | // Returns whether the linear filter should have been able to properly adapt. |
| 105 | bool FilterHasHadTimeToConverge() const { |
| 106 | return filter_has_had_time_to_converge_; |
| 107 | } |
Per Åhgren | 1b4059e | 2017-10-15 20:19:21 +0200 | [diff] [blame] | 108 | |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 109 | // Returns whether the filter adaptation is still in the initial state. |
| 110 | bool InitialState() const { return initial_state_; } |
| 111 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 112 | // Updates the aec state. |
Per Åhgren | 3ab308f | 2018-02-21 08:46:03 +0100 | [diff] [blame] | 113 | void Update(const rtc::Optional<DelayEstimate>& delay_estimate, |
| 114 | const std::vector<std::array<float, kFftLengthBy2Plus1>>& |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 115 | adaptive_filter_frequency_response, |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 116 | const std::vector<float>& adaptive_filter_impulse_response, |
Per Åhgren | 1b4059e | 2017-10-15 20:19:21 +0200 | [diff] [blame] | 117 | bool converged_filter, |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 118 | const RenderBuffer& render_buffer, |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 119 | const std::array<float, kFftLengthBy2Plus1>& E2_main, |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 120 | const std::array<float, kFftLengthBy2Plus1>& Y2, |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 121 | const std::array<float, kBlockSize>& s_main, |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 122 | bool echo_leakage_detected); |
| 123 | |
| 124 | private: |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 125 | class EchoAudibility { |
| 126 | public: |
| 127 | void Update(rtc::ArrayView<const float> x, |
Per Åhgren | 1b4059e | 2017-10-15 20:19:21 +0200 | [diff] [blame] | 128 | const std::array<float, kBlockSize>& s, |
| 129 | bool converged_filter); |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 130 | void UpdateWithOutput(rtc::ArrayView<const float> e); |
| 131 | bool InaudibleEcho() const { return inaudible_echo_; } |
| 132 | |
| 133 | private: |
| 134 | float max_nearend_ = 0.f; |
| 135 | size_t max_nearend_counter_ = 0; |
| 136 | size_t low_farend_counter_ = 0; |
| 137 | bool inaudible_echo_ = false; |
| 138 | }; |
| 139 | |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 140 | void UpdateReverb(const std::vector<float>& impulse_response); |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 141 | bool DetectActiveRender(rtc::ArrayView<const float> x) const; |
Per Åhgren | b6b00dc | 2018-02-20 22:18:27 +0100 | [diff] [blame] | 142 | void UpdateSuppressorGainLimit(bool render_activity); |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 143 | bool DetectEchoSaturation(rtc::ArrayView<const float> x); |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 144 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 145 | static int instance_count_; |
| 146 | std::unique_ptr<ApmDataDumper> data_dumper_; |
| 147 | ErlEstimator erl_estimator_; |
| 148 | ErleEstimator erle_estimator_; |
Per Åhgren | 1b4059e | 2017-10-15 20:19:21 +0200 | [diff] [blame] | 149 | size_t capture_block_counter_ = 0; |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 150 | size_t blocks_with_proper_filter_adaptation_ = 0; |
| 151 | size_t blocks_with_active_render_ = 0; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 152 | bool usable_linear_estimate_ = false; |
| 153 | bool echo_leakage_detected_ = false; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 154 | bool capture_signal_saturation_ = false; |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 155 | bool echo_saturation_ = false; |
Per Åhgren | 1b4059e | 2017-10-15 20:19:21 +0200 | [diff] [blame] | 156 | bool transparent_mode_ = false; |
Per Åhgren | 63b494d | 2017-12-06 11:32:38 +0100 | [diff] [blame] | 157 | float previous_max_sample_ = 0.f; |
peah | e52a203 | 2017-04-19 09:03:40 -0700 | [diff] [blame] | 158 | bool render_received_ = false; |
Per Åhgren | b6b00dc | 2018-02-20 22:18:27 +0100 | [diff] [blame] | 159 | int realignment_counter_ = 0; |
| 160 | float suppressor_gain_limit_ = 1.f; |
| 161 | bool active_render_seen_ = false; |
Per Åhgren | 0e6d2f5 | 2017-12-20 22:19:56 +0100 | [diff] [blame] | 162 | int filter_delay_ = 0; |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 163 | size_t blocks_since_last_saturation_ = 1000; |
Christian Schuldt | f4e99db | 2018-03-01 11:32:50 +0100 | [diff] [blame^] | 164 | float tail_energy_ = 0.f; |
| 165 | float accumulated_nz_ = 0.f; |
| 166 | float accumulated_nn_ = 0.f; |
| 167 | float accumulated_count_ = 0.f; |
| 168 | size_t current_reverb_decay_section_ = 0; |
| 169 | size_t num_reverb_decay_sections_ = 0; |
| 170 | size_t num_reverb_decay_sections_next_ = 0; |
| 171 | bool found_end_of_reverb_decay_ = false; |
| 172 | bool main_filter_is_adapting_ = true; |
| 173 | std::array<float, kMaxAdaptiveFilterLength> block_energies_; |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 174 | EchoAudibility echo_audibility_; |
Gustaf Ullberg | bd83b91 | 2017-10-18 12:32:42 +0200 | [diff] [blame] | 175 | const EchoCanceller3Config config_; |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 176 | std::vector<float> max_render_; |
Christian Schuldt | f4e99db | 2018-03-01 11:32:50 +0100 | [diff] [blame^] | 177 | float reverb_decay_ = fabsf(config_.ep_strength.default_len); |
Per Åhgren | 7ddd463 | 2017-10-25 02:59:45 +0200 | [diff] [blame] | 178 | bool saturating_echo_path_ = false; |
Per Åhgren | 4b3bc0f | 2017-12-20 15:26:13 +0100 | [diff] [blame] | 179 | bool filter_has_had_time_to_converge_ = false; |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 180 | bool initial_state_ = true; |
Per Åhgren | b6b00dc | 2018-02-20 22:18:27 +0100 | [diff] [blame] | 181 | const float gain_rampup_increase_; |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 182 | |
peah | 8cee56f | 2017-08-24 22:36:53 -0700 | [diff] [blame] | 183 | RTC_DISALLOW_COPY_AND_ASSIGN(AecState); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 184 | }; |
| 185 | |
| 186 | } // namespace webrtc |

#endif  // MODULES_AUDIO_PROCESSING_AEC3_AEC_STATE_H_