peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #ifndef MODULES_AUDIO_PROCESSING_AEC3_SUBTRACTOR_H_ |
| 12 | #define MODULES_AUDIO_PROCESSING_AEC3_SUBTRACTOR_H_ |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 13 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 14 | #include <math.h> |
| 15 | #include <stddef.h> |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 16 | |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame] | 17 | #include <array> |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 18 | #include <vector> |
| 19 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 20 | #include "api/array_view.h" |
| 21 | #include "api/audio/echo_canceller3_config.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 22 | #include "modules/audio_processing/aec3/adaptive_fir_filter.h" |
| 23 | #include "modules/audio_processing/aec3/aec3_common.h" |
| 24 | #include "modules/audio_processing/aec3/aec3_fft.h" |
| 25 | #include "modules/audio_processing/aec3/aec_state.h" |
Per Åhgren | 9d66198 | 2020-03-20 11:26:48 +0100 | [diff] [blame] | 26 | #include "modules/audio_processing/aec3/coarse_filter_update_gain.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 27 | #include "modules/audio_processing/aec3/echo_path_variability.h" |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 28 | #include "modules/audio_processing/aec3/refined_filter_update_gain.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 29 | #include "modules/audio_processing/aec3/render_buffer.h" |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 30 | #include "modules/audio_processing/aec3/render_signal_analyzer.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 31 | #include "modules/audio_processing/aec3/subtractor_output.h" |
| 32 | #include "modules/audio_processing/logging/apm_data_dumper.h" |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 33 | #include "rtc_base/checks.h" |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 34 | |
| 35 | namespace webrtc { |
| 36 | |
| 37 | // Proves linear echo cancellation functionality |
| 38 | class Subtractor { |
| 39 | public: |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 40 | Subtractor(const EchoCanceller3Config& config, |
Per Åhgren | a33dc01 | 2019-09-03 23:59:52 +0200 | [diff] [blame] | 41 | size_t num_render_channels, |
| 42 | size_t num_capture_channels, |
Per Åhgren | 09a718a | 2017-12-11 22:28:45 +0100 | [diff] [blame] | 43 | ApmDataDumper* data_dumper, |
| 44 | Aec3Optimization optimization); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 45 | ~Subtractor(); |
Per Åhgren | d4e6904 | 2019-09-05 15:55:58 +0200 | [diff] [blame] | 46 | Subtractor(const Subtractor&) = delete; |
| 47 | Subtractor& operator=(const Subtractor&) = delete; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 48 | |
| 49 | // Performs the echo subtraction. |
peah | cf02cf1 | 2017-04-05 14:18:07 -0700 | [diff] [blame] | 50 | void Process(const RenderBuffer& render_buffer, |
Per Åhgren | 7bdf073 | 2019-09-25 14:53:30 +0200 | [diff] [blame] | 51 | const std::vector<std::vector<float>>& capture, |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 52 | const RenderSignalAnalyzer& render_signal_analyzer, |
peah | 86afe9d | 2017-04-06 15:45:32 -0700 | [diff] [blame] | 53 | const AecState& aec_state, |
Per Åhgren | 7bdf073 | 2019-09-25 14:53:30 +0200 | [diff] [blame] | 54 | rtc::ArrayView<SubtractorOutput> outputs); |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 55 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 56 | void HandleEchoPathChange(const EchoPathVariability& echo_path_variability); |
| 57 | |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 58 | // Exits the initial state. |
| 59 | void ExitInitialState(); |
| 60 | |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 61 | // Returns the block-wise frequency responses for the refined adaptive |
| 62 | // filters. |
Per Åhgren | b441acf | 2019-10-05 09:07:24 +0200 | [diff] [blame] | 63 | const std::vector<std::vector<std::array<float, kFftLengthBy2Plus1>>>& |
Per Åhgren | 119e219 | 2019-10-18 08:50:50 +0200 | [diff] [blame] | 64 | FilterFrequencyResponses() const { |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 65 | return refined_frequency_responses_; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 66 | } |
| 67 | |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 68 | // Returns the estimates of the impulse responses for the refined adaptive |
Per Åhgren | 7bdf073 | 2019-09-25 14:53:30 +0200 | [diff] [blame] | 69 | // filters. |
Per Åhgren | 119e219 | 2019-10-18 08:50:50 +0200 | [diff] [blame] | 70 | const std::vector<std::vector<float>>& FilterImpulseResponses() const { |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 71 | return refined_impulse_responses_; |
peah | 2910357 | 2017-07-11 02:54:02 -0700 | [diff] [blame] | 72 | } |
| 73 | |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 74 | void DumpFilters() { |
Per Åhgren | b441acf | 2019-10-05 09:07:24 +0200 | [diff] [blame] | 75 | data_dumper_->DumpRaw( |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 76 | "aec3_subtractor_h_refined", |
Per Åhgren | b441acf | 2019-10-05 09:07:24 +0200 | [diff] [blame] | 77 | rtc::ArrayView<const float>( |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 78 | refined_impulse_responses_[0].data(), |
Per Åhgren | b441acf | 2019-10-05 09:07:24 +0200 | [diff] [blame] | 79 | GetTimeDomainLength( |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 80 | refined_filters_[0]->max_filter_size_partitions()))); |
Per Åhgren | 91a892f | 2021-05-07 23:28:42 +0000 | [diff] [blame] | 81 | if (ApmDataDumper::IsAvailable()) { |
| 82 | RTC_DCHECK_GT(coarse_impulse_responses_.size(), 0); |
| 83 | data_dumper_->DumpRaw( |
| 84 | "aec3_subtractor_h_coarse", |
| 85 | rtc::ArrayView<const float>( |
| 86 | coarse_impulse_responses_[0].data(), |
| 87 | GetTimeDomainLength( |
| 88 | coarse_filter_[0]->max_filter_size_partitions()))); |
| 89 | } |
Per Åhgren | d4e6904 | 2019-09-05 15:55:58 +0200 | [diff] [blame] | 90 | |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 91 | refined_filters_[0]->DumpFilter("aec3_subtractor_H_refined"); |
Per Åhgren | 9d66198 | 2020-03-20 11:26:48 +0100 | [diff] [blame] | 92 | coarse_filter_[0]->DumpFilter("aec3_subtractor_H_coarse"); |
Per Åhgren | 5c532d3 | 2018-03-22 00:29:25 +0100 | [diff] [blame] | 93 | } |
| 94 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 95 | private: |
Jesús de Vicente Peña | 2e79d2b | 2018-06-29 16:35:08 +0200 | [diff] [blame] | 96 | class FilterMisadjustmentEstimator { |
| 97 | public: |
| 98 | FilterMisadjustmentEstimator() = default; |
| 99 | ~FilterMisadjustmentEstimator() = default; |
| 100 | // Update the misadjustment estimator. |
Per Åhgren | e4db6a1 | 2018-07-26 15:32:24 +0200 | [diff] [blame] | 101 | void Update(const SubtractorOutput& output); |
Jesús de Vicente Peña | 2e79d2b | 2018-06-29 16:35:08 +0200 | [diff] [blame] | 102 | // GetMisadjustment() Returns a recommended scale for the filter so the |
| 103 | // prediction error energy gets closer to the energy that is seen at the |
| 104 | // microphone input. |
| 105 | float GetMisadjustment() const { |
| 106 | RTC_DCHECK_GT(inv_misadjustment_, 0.0f); |
| 107 | // It is not aiming to adjust all the estimated mismatch. Instead, |
| 108 | // it adjusts half of that estimated mismatch. |
| 109 | return 2.f / sqrtf(inv_misadjustment_); |
| 110 | } |
| 111 | // Returns true if the prediciton error energy is significantly larger |
| 112 | // than the microphone signal energy and, therefore, an adjustment is |
| 113 | // recommended. |
| 114 | bool IsAdjustmentNeeded() const { return inv_misadjustment_ > 10.f; } |
| 115 | void Reset(); |
| 116 | void Dump(ApmDataDumper* data_dumper) const; |
| 117 | |
| 118 | private: |
| 119 | const int n_blocks_ = 4; |
| 120 | int n_blocks_acum_ = 0; |
| 121 | float e2_acum_ = 0.f; |
| 122 | float y2_acum_ = 0.f; |
| 123 | float inv_misadjustment_ = 0.f; |
| 124 | int overhang_ = 0.f; |
| 125 | }; |
| 126 | |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 127 | const Aec3Fft fft_; |
| 128 | ApmDataDumper* data_dumper_; |
| 129 | const Aec3Optimization optimization_; |
Per Åhgren | a98c807 | 2018-01-15 19:17:16 +0100 | [diff] [blame] | 130 | const EchoCanceller3Config config_; |
Per Åhgren | 7bdf073 | 2019-09-25 14:53:30 +0200 | [diff] [blame] | 131 | const size_t num_capture_channels_; |
Gustaf Ullberg | 992a96f | 2020-12-08 13:03:55 +0100 | [diff] [blame] | 132 | const bool use_coarse_filter_reset_hangover_; |
Per Åhgren | 2275439 | 2018-08-10 18:37:38 +0200 | [diff] [blame] | 133 | |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 134 | std::vector<std::unique_ptr<AdaptiveFirFilter>> refined_filters_; |
Per Åhgren | 9d66198 | 2020-03-20 11:26:48 +0100 | [diff] [blame] | 135 | std::vector<std::unique_ptr<AdaptiveFirFilter>> coarse_filter_; |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 136 | std::vector<std::unique_ptr<RefinedFilterUpdateGain>> refined_gains_; |
Per Åhgren | 9d66198 | 2020-03-20 11:26:48 +0100 | [diff] [blame] | 137 | std::vector<std::unique_ptr<CoarseFilterUpdateGain>> coarse_gains_; |
Per Åhgren | 119e219 | 2019-10-18 08:50:50 +0200 | [diff] [blame] | 138 | std::vector<FilterMisadjustmentEstimator> filter_misadjustment_estimators_; |
Per Åhgren | 9d66198 | 2020-03-20 11:26:48 +0100 | [diff] [blame] | 139 | std::vector<size_t> poor_coarse_filter_counters_; |
Gustaf Ullberg | 992a96f | 2020-12-08 13:03:55 +0100 | [diff] [blame] | 140 | std::vector<int> coarse_filter_reset_hangover_; |
Per Åhgren | 7bdf073 | 2019-09-25 14:53:30 +0200 | [diff] [blame] | 141 | std::vector<std::vector<std::array<float, kFftLengthBy2Plus1>>> |
Per Åhgren | ff04511 | 2020-03-20 11:20:39 +0100 | [diff] [blame] | 142 | refined_frequency_responses_; |
| 143 | std::vector<std::vector<float>> refined_impulse_responses_; |
Per Åhgren | 91a892f | 2021-05-07 23:28:42 +0000 | [diff] [blame] | 144 | std::vector<std::vector<float>> coarse_impulse_responses_; |
peah | 522d71b | 2017-02-23 05:16:26 -0800 | [diff] [blame] | 145 | }; |
| 146 | |
| 147 | } // namespace webrtc |
| 148 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 149 | #endif // MODULES_AUDIO_PROCESSING_AEC3_SUBTRACTOR_H_ |