niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 1 | /* |
bjornv@webrtc.org | 0c6f931 | 2012-01-30 09:39:08 +0000 | [diff] [blame] | 2 | * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #include "modules/audio_processing/noise_suppression_impl.h" |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 12 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 13 | #include "modules/audio_processing/audio_buffer.h" |
| 14 | #include "rtc_base/constructormagic.h" |
// Build-time selection of the noise-suppression backend. The NS_* macros and
// the NsState alias give the rest of this file one set of names for whichever
// implementation (float or fixed-point) was configured.
#if defined(WEBRTC_NS_FLOAT)
#include "modules/audio_processing/ns/noise_suppression.h"
using NsState = NsHandle;
#define NS_CREATE WebRtcNs_Create
#define NS_FREE WebRtcNs_Free
#define NS_INIT WebRtcNs_Init
#define NS_SET_POLICY WebRtcNs_set_policy
#elif defined(WEBRTC_NS_FIXED)
#include "modules/audio_processing/ns/noise_suppression_x.h"
using NsState = NsxHandle;
#define NS_CREATE WebRtcNsx_Create
#define NS_FREE WebRtcNsx_Free
#define NS_INIT WebRtcNsx_Init
#define NS_SET_POLICY WebRtcNsx_set_policy
#endif
| 30 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 31 | namespace webrtc { |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 32 | class NoiseSuppressionImpl::Suppressor { |
| 33 | public: |
| 34 | explicit Suppressor(int sample_rate_hz) { |
| 35 | state_ = NS_CREATE(); |
| 36 | RTC_CHECK(state_); |
| 37 | int error = NS_INIT(state_, sample_rate_hz); |
| 38 | RTC_DCHECK_EQ(0, error); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 39 | } |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame^] | 40 | ~Suppressor() { NS_FREE(state_); } |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 41 | NsState* state() { return state_; } |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame^] | 42 | |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 43 | private: |
| 44 | NsState* state_ = nullptr; |
| 45 | RTC_DISALLOW_IMPLICIT_CONSTRUCTORS(Suppressor); |
| 46 | }; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 47 | |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 48 | NoiseSuppressionImpl::NoiseSuppressionImpl(rtc::CriticalSection* crit) |
| 49 | : crit_(crit) { |
peah | df3efa8 | 2015-11-28 12:35:15 -0800 | [diff] [blame] | 50 | RTC_DCHECK(crit); |
| 51 | } |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 52 | |
| 53 | NoiseSuppressionImpl::~NoiseSuppressionImpl() {} |
| 54 | |
Peter Kasting | 6955870 | 2016-01-12 16:26:35 -0800 | [diff] [blame] | 55 | void NoiseSuppressionImpl::Initialize(size_t channels, int sample_rate_hz) { |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 56 | rtc::CritScope cs(crit_); |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 57 | channels_ = channels; |
| 58 | sample_rate_hz_ = sample_rate_hz; |
kwiberg | 88788ad | 2016-02-19 07:04:49 -0800 | [diff] [blame] | 59 | std::vector<std::unique_ptr<Suppressor>> new_suppressors; |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 60 | if (enabled_) { |
| 61 | new_suppressors.resize(channels); |
Peter Kasting | 6955870 | 2016-01-12 16:26:35 -0800 | [diff] [blame] | 62 | for (size_t i = 0; i < channels; i++) { |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 63 | new_suppressors[i].reset(new Suppressor(sample_rate_hz)); |
| 64 | } |
| 65 | } |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 66 | suppressors_.swap(new_suppressors); |
| 67 | set_level(level_); |
| 68 | } |
| 69 | |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 70 | void NoiseSuppressionImpl::AnalyzeCaptureAudio(AudioBuffer* audio) { |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 71 | RTC_DCHECK(audio); |
aluebs@webrtc.org | fda2c2e | 2014-09-18 09:54:06 +0000 | [diff] [blame] | 72 | #if defined(WEBRTC_NS_FLOAT) |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 73 | rtc::CritScope cs(crit_); |
| 74 | if (!enabled_) { |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 75 | return; |
aluebs@webrtc.org | fda2c2e | 2014-09-18 09:54:06 +0000 | [diff] [blame] | 76 | } |
aluebs@webrtc.org | fda2c2e | 2014-09-18 09:54:06 +0000 | [diff] [blame] | 77 | |
kwiberg | af476c7 | 2016-11-28 15:21:39 -0800 | [diff] [blame] | 78 | RTC_DCHECK_GE(160, audio->num_frames_per_band()); |
Peter Kasting | 6955870 | 2016-01-12 16:26:35 -0800 | [diff] [blame] | 79 | RTC_DCHECK_EQ(suppressors_.size(), audio->num_channels()); |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 80 | for (size_t i = 0; i < suppressors_.size(); i++) { |
| 81 | WebRtcNs_Analyze(suppressors_[i]->state(), |
| 82 | audio->split_bands_const_f(i)[kBand0To8kHz]); |
aluebs@webrtc.org | fda2c2e | 2014-09-18 09:54:06 +0000 | [diff] [blame] | 83 | } |
| 84 | #endif |
aluebs@webrtc.org | fda2c2e | 2014-09-18 09:54:06 +0000 | [diff] [blame] | 85 | } |
| 86 | |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 87 | void NoiseSuppressionImpl::ProcessCaptureAudio(AudioBuffer* audio) { |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 88 | RTC_DCHECK(audio); |
peah | df3efa8 | 2015-11-28 12:35:15 -0800 | [diff] [blame] | 89 | rtc::CritScope cs(crit_); |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 90 | if (!enabled_) { |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 91 | return; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 92 | } |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 93 | |
kwiberg | af476c7 | 2016-11-28 15:21:39 -0800 | [diff] [blame] | 94 | RTC_DCHECK_GE(160, audio->num_frames_per_band()); |
Peter Kasting | 6955870 | 2016-01-12 16:26:35 -0800 | [diff] [blame] | 95 | RTC_DCHECK_EQ(suppressors_.size(), audio->num_channels()); |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 96 | for (size_t i = 0; i < suppressors_.size(); i++) { |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 97 | #if defined(WEBRTC_NS_FLOAT) |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame^] | 98 | WebRtcNs_Process(suppressors_[i]->state(), audio->split_bands_const_f(i), |
| 99 | audio->num_bands(), audio->split_bands_f(i)); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 100 | #elif defined(WEBRTC_NS_FIXED) |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame^] | 101 | WebRtcNsx_Process(suppressors_[i]->state(), audio->split_bands_const(i), |
| 102 | audio->num_bands(), audio->split_bands(i)); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 103 | #endif |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 104 | } |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 105 | } |
| 106 | |
| 107 | int NoiseSuppressionImpl::Enable(bool enable) { |
peah | df3efa8 | 2015-11-28 12:35:15 -0800 | [diff] [blame] | 108 | rtc::CritScope cs(crit_); |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 109 | if (enabled_ != enable) { |
| 110 | enabled_ = enable; |
| 111 | Initialize(channels_, sample_rate_hz_); |
| 112 | } |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 113 | return AudioProcessing::kNoError; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 114 | } |
| 115 | |
| 116 | bool NoiseSuppressionImpl::is_enabled() const { |
peah | df3efa8 | 2015-11-28 12:35:15 -0800 | [diff] [blame] | 117 | rtc::CritScope cs(crit_); |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 118 | return enabled_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 119 | } |
| 120 | |
| 121 | int NoiseSuppressionImpl::set_level(Level level) { |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 122 | int policy = 1; |
| 123 | switch (level) { |
| 124 | case NoiseSuppression::kLow: |
| 125 | policy = 0; |
| 126 | break; |
| 127 | case NoiseSuppression::kModerate: |
| 128 | policy = 1; |
| 129 | break; |
| 130 | case NoiseSuppression::kHigh: |
| 131 | policy = 2; |
| 132 | break; |
| 133 | case NoiseSuppression::kVeryHigh: |
| 134 | policy = 3; |
| 135 | break; |
| 136 | default: |
| 137 | RTC_NOTREACHED(); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 138 | } |
solenberg | 29e2f93 | 2015-12-16 01:18:15 -0800 | [diff] [blame] | 139 | rtc::CritScope cs(crit_); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 140 | level_ = level; |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 141 | for (auto& suppressor : suppressors_) { |
| 142 | int error = NS_SET_POLICY(suppressor->state(), policy); |
| 143 | RTC_DCHECK_EQ(0, error); |
| 144 | } |
| 145 | return AudioProcessing::kNoError; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 146 | } |
| 147 | |
| 148 | NoiseSuppression::Level NoiseSuppressionImpl::level() const { |
peah | df3efa8 | 2015-11-28 12:35:15 -0800 | [diff] [blame] | 149 | rtc::CritScope cs(crit_); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 150 | return level_; |
| 151 | } |
| 152 | |
bjornv@webrtc.org | 08329f4 | 2012-07-12 21:00:43 +0000 | [diff] [blame] | 153 | float NoiseSuppressionImpl::speech_probability() const { |
peah | df3efa8 | 2015-11-28 12:35:15 -0800 | [diff] [blame] | 154 | rtc::CritScope cs(crit_); |
bjornv@webrtc.org | 08329f4 | 2012-07-12 21:00:43 +0000 | [diff] [blame] | 155 | #if defined(WEBRTC_NS_FLOAT) |
| 156 | float probability_average = 0.0f; |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 157 | for (auto& suppressor : suppressors_) { |
| 158 | probability_average += |
| 159 | WebRtcNs_prior_speech_probability(suppressor->state()); |
bjornv@webrtc.org | 08329f4 | 2012-07-12 21:00:43 +0000 | [diff] [blame] | 160 | } |
pkasting | 25702cb | 2016-01-08 13:50:27 -0800 | [diff] [blame] | 161 | if (!suppressors_.empty()) { |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 162 | probability_average /= suppressors_.size(); |
| 163 | } |
| 164 | return probability_average; |
bjornv@webrtc.org | 08329f4 | 2012-07-12 21:00:43 +0000 | [diff] [blame] | 165 | #elif defined(WEBRTC_NS_FIXED) |
solenberg | 5e465c3 | 2015-12-08 13:22:33 -0800 | [diff] [blame] | 166 | // TODO(peah): Returning error code as a float! Remove this. |
bjornv@webrtc.org | 08329f4 | 2012-07-12 21:00:43 +0000 | [diff] [blame] | 167 | // Currently not available for the fixed point implementation. |
peah | df3efa8 | 2015-11-28 12:35:15 -0800 | [diff] [blame] | 168 | return AudioProcessing::kUnsupportedFunctionError; |
bjornv@webrtc.org | 08329f4 | 2012-07-12 21:00:43 +0000 | [diff] [blame] | 169 | #endif |
| 170 | } |
Alejandro Luebs | fa639f0 | 2016-02-09 11:24:32 -0800 | [diff] [blame] | 171 | |
| 172 | std::vector<float> NoiseSuppressionImpl::NoiseEstimate() { |
| 173 | rtc::CritScope cs(crit_); |
| 174 | std::vector<float> noise_estimate; |
| 175 | #if defined(WEBRTC_NS_FLOAT) |
Alejandro Luebs | 3b14996 | 2016-04-01 13:54:36 -0700 | [diff] [blame] | 176 | const float kNumChannelsFraction = 1.f / suppressors_.size(); |
Alejandro Luebs | fa639f0 | 2016-02-09 11:24:32 -0800 | [diff] [blame] | 177 | noise_estimate.assign(WebRtcNs_num_freq(), 0.f); |
| 178 | for (auto& suppressor : suppressors_) { |
| 179 | const float* noise = WebRtcNs_noise_estimate(suppressor->state()); |
| 180 | for (size_t i = 0; i < noise_estimate.size(); ++i) { |
Alejandro Luebs | 3b14996 | 2016-04-01 13:54:36 -0700 | [diff] [blame] | 181 | noise_estimate[i] += kNumChannelsFraction * noise[i]; |
Alejandro Luebs | fa639f0 | 2016-02-09 11:24:32 -0800 | [diff] [blame] | 182 | } |
| 183 | } |
| 184 | #elif defined(WEBRTC_NS_FIXED) |
Alejandro Luebs | fa639f0 | 2016-02-09 11:24:32 -0800 | [diff] [blame] | 185 | noise_estimate.assign(WebRtcNsx_num_freq(), 0.f); |
| 186 | for (auto& suppressor : suppressors_) { |
Alejandro Luebs | 3b14996 | 2016-04-01 13:54:36 -0700 | [diff] [blame] | 187 | int q_noise; |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame^] | 188 | const uint32_t* noise = |
| 189 | WebRtcNsx_noise_estimate(suppressor->state(), &q_noise); |
Alejandro Luebs | 3b14996 | 2016-04-01 13:54:36 -0700 | [diff] [blame] | 190 | const float kNormalizationFactor = |
| 191 | 1.f / ((1 << q_noise) * suppressors_.size()); |
Alejandro Luebs | fa639f0 | 2016-02-09 11:24:32 -0800 | [diff] [blame] | 192 | for (size_t i = 0; i < noise_estimate.size(); ++i) { |
Alejandro Luebs | 3b14996 | 2016-04-01 13:54:36 -0700 | [diff] [blame] | 193 | noise_estimate[i] += kNormalizationFactor * noise[i]; |
Alejandro Luebs | fa639f0 | 2016-02-09 11:24:32 -0800 | [diff] [blame] | 194 | } |
| 195 | } |
| 196 | #endif |
| 197 | return noise_estimate; |
| 198 | } |
| 199 | |
Alex Luebs | 57ae829 | 2016-03-09 16:24:34 +0100 | [diff] [blame] | 200 | size_t NoiseSuppressionImpl::num_noise_bins() { |
| 201 | #if defined(WEBRTC_NS_FLOAT) |
| 202 | return WebRtcNs_num_freq(); |
| 203 | #elif defined(WEBRTC_NS_FIXED) |
| 204 | return WebRtcNsx_num_freq(); |
| 205 | #endif |
| 206 | } |
| 207 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 208 | } // namespace webrtc |