niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 1 | /* |
andrew@webrtc.org | 6f9f817 | 2012-03-06 19:03:39 +0000 | [diff] [blame] | 2 | * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 11 | #ifndef WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ |
| 12 | #define WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 13 | |
| 14 | #include <list> |
ajm@google.com | 808e0e0 | 2011-08-03 21:08:51 +0000 | [diff] [blame] | 15 | #include <string> |
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 16 | #include <vector> |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 17 | |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 18 | #include "webrtc/base/scoped_ptr.h" |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 19 | #include "webrtc/base/thread_annotations.h" |
Michael Graczyk | dfa3605 | 2015-03-25 16:37:27 -0700 | [diff] [blame] | 20 | #include "webrtc/modules/audio_processing/include/audio_processing.h" |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 21 | |
| 22 | namespace webrtc { |
andrew@webrtc.org | ddbb8a2 | 2014-04-22 21:00:04 +0000 | [diff] [blame] | 23 | |
// Forward declarations. Within this header each of these types is only named
// through a raw pointer, an rtc::scoped_ptr member, or (for Beamformer) a
// template-id behind a pointer, so the full definitions are not needed here.
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 24 | class AgcManagerDirect; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 25 | class AudioBuffer; |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 26 | class AudioConverter; |
Michael Graczyk | dfa3605 | 2015-03-25 16:37:27 -0700 | [diff] [blame] | 27 | |
| 28 | template<typename T> |
| 29 | class Beamformer; |
| 30 | |
ajm@google.com | 808e0e0 | 2011-08-03 21:08:51 +0000 | [diff] [blame] | 31 | class CriticalSectionWrapper; |
andrew@webrtc.org | 56e4a05 | 2014-02-27 22:23:17 +0000 | [diff] [blame] | 32 | class EchoCancellationImpl; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 33 | class EchoControlMobileImpl; |
ajm@google.com | 808e0e0 | 2011-08-03 21:08:51 +0000 | [diff] [blame] | 34 | class FileWrapper; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 35 | class GainControlImpl; |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 36 | class GainControlForNewAgc; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 37 | class HighPassFilterImpl; |
| 38 | class LevelEstimatorImpl; |
| 39 | class NoiseSuppressionImpl; |
| 40 | class ProcessingComponent; |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 41 | class TransientSuppressor; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 42 | class VoiceDetectionImpl; |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 43 | class IntelligibilityEnhancer; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 44 | |
// Forward declaration of the debug-dump message type. It is only declared when
// WEBRTC_AUDIOPROC_DEBUG_DUMP is defined, which is also the only configuration
// in which AudioProcessingImpl holds an rtc::scoped_ptr<audioproc::Event>.
andrew@webrtc.org | 7bf2646 | 2011-12-03 00:03:31 +0000 | [diff] [blame] | 45 | #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP |
| 46 | namespace audioproc { |
| 47 | |
| 48 | class Event; |
| 49 | |
| 50 | } // namespace audioproc |
| 51 | #endif |
| 52 | |
// Implementation class deriving publicly from AudioProcessing (presumably the
// interface declared in the included audio_processing.h). It declares
// overrides for the public API and holds the private state they operate on:
// pointers to the individual processing components, the render/capture audio
// buffers, stream format and delay bookkeeping, and the optional AGC manager,
// transient suppressor, beamformer and intelligibility enhancer.
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 53 | class AudioProcessingImpl : public AudioProcessing { |
| 54 | public: |
// Single-argument constructor is explicit, so a Config is never implicitly
// converted into an AudioProcessingImpl.
andrew@webrtc.org | e84978f | 2014-01-25 02:09:06 +0000 | [diff] [blame] | 55 | explicit AudioProcessingImpl(const Config& config); |
Michael Graczyk | dfa3605 | 2015-03-25 16:37:27 -0700 | [diff] [blame] | 56 | |
| 57 | // AudioProcessingImpl takes ownership of beamformer. |
| 58 | AudioProcessingImpl(const Config& config, Beamformer<float>* beamformer); |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 59 | virtual ~AudioProcessingImpl(); |
| 60 | |
// Everything from here to the end of the public section is marked override.
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 61 | // AudioProcessing methods. |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 62 | int Initialize() override; |
| 63 | int Initialize(int input_sample_rate_hz, |
| 64 | int output_sample_rate_hz, |
| 65 | int reverse_sample_rate_hz, |
| 66 | ChannelLayout input_layout, |
| 67 | ChannelLayout output_layout, |
| 68 | ChannelLayout reverse_layout) override; |
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 69 | int Initialize(const ProcessingConfig& processing_config) override; |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 70 | void SetExtraOptions(const Config& config) override; |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 71 | int proc_sample_rate_hz() const override; |
| 72 | int proc_split_sample_rate_hz() const override; |
| 73 | int num_input_channels() const override; |
| 74 | int num_output_channels() const override; |
| 75 | int num_reverse_channels() const override; |
| 76 | void set_output_will_be_muted(bool muted) override; |
// ProcessStream has three overloads: an AudioFrame, float channel pointers
// described by sample rate + ChannelLayout, and float channel pointers
// described by StreamConfig.
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 77 | int ProcessStream(AudioFrame* frame) override; |
| 78 | int ProcessStream(const float* const* src, |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 79 | size_t samples_per_channel, |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 80 | int input_sample_rate_hz, |
| 81 | ChannelLayout input_layout, |
| 82 | int output_sample_rate_hz, |
| 83 | ChannelLayout output_layout, |
| 84 | float* const* dest) override; |
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 85 | int ProcessStream(const float* const* src, |
| 86 | const StreamConfig& input_config, |
| 87 | const StreamConfig& output_config, |
| 88 | float* const* dest) override; |
// Reverse-stream entry points. The Analyze* overloads take no destination
// buffer; the float ProcessReverseStream overload takes a separate dest.
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 89 | int AnalyzeReverseStream(AudioFrame* frame) override; |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 90 | int ProcessReverseStream(AudioFrame* frame) override; |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 91 | int AnalyzeReverseStream(const float* const* data, |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 92 | size_t samples_per_channel, |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 93 | int sample_rate_hz, |
| 94 | ChannelLayout layout) override; |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 95 | int ProcessReverseStream(const float* const* src, |
| 96 | const StreamConfig& reverse_input_config, |
| 97 | const StreamConfig& reverse_output_config, |
| 98 | float* const* dest) override; |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 99 | int set_stream_delay_ms(int delay) override; |
| 100 | int stream_delay_ms() const override; |
| 101 | bool was_stream_delay_set() const override; |
| 102 | void set_delay_offset_ms(int offset) override; |
| 103 | int delay_offset_ms() const override; |
| 104 | void set_stream_key_pressed(bool key_pressed) override; |
// Debug recording can be started from a filename, a FILE*, or an
// rtc::PlatformFile handle.
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 105 | int StartDebugRecording(const char filename[kMaxFilenameSize]) override; |
| 106 | int StartDebugRecording(FILE* handle) override; |
| 107 | int StartDebugRecordingForPlatformFile(rtc::PlatformFile handle) override; |
| 108 | int StopDebugRecording() override; |
Bjorn Volcker | 4e7aa43 | 2015-07-07 11:50:05 +0200 | [diff] [blame] | 109 | void UpdateHistogramsOnCallEnd() override; |
// Component accessors: const member functions returning non-const pointers to
// the component interface types.
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 110 | EchoCancellation* echo_cancellation() const override; |
| 111 | EchoControlMobile* echo_control_mobile() const override; |
| 112 | GainControl* gain_control() const override; |
| 113 | HighPassFilter* high_pass_filter() const override; |
| 114 | LevelEstimator* level_estimator() const override; |
| 115 | NoiseSuppression* noise_suppression() const override; |
| 116 | VoiceDetection* voice_detection() const override; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 117 | |
andrew@webrtc.org | 60730cf | 2014-01-07 17:45:09 +0000 | [diff] [blame] | 118 | protected: |
// Virtual and protected so a subclass can replace it. Annotated as requiring
// the caller to already hold crit_.
andrew@webrtc.org | a8b9737 | 2014-03-10 22:26:12 +0000 | [diff] [blame] | 119 | // Overridden in a mock. |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 120 | virtual int InitializeLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
andrew@webrtc.org | 60730cf | 2014-01-07 17:45:09 +0000 | [diff] [blame] | 121 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 122 | private: |
// Non-virtual helpers taking a ProcessingConfig; both are annotated as
// requiring crit_ to be held by the caller.
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 123 | int InitializeLocked(const ProcessingConfig& config) |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 124 | EXCLUSIVE_LOCKS_REQUIRED(crit_); |
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 125 | int MaybeInitializeLocked(const ProcessingConfig& config) |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 126 | EXCLUSIVE_LOCKS_REQUIRED(crit_); |
// Private, non-override overload of AnalyzeReverseStream taking StreamConfigs.
// It carries no lock annotation.
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 127 | // TODO(ekm): Remove once all clients updated to new interface. |
| 128 | int AnalyzeReverseStream(const float* const* src, |
| 129 | const StreamConfig& input_config, |
| 130 | const StreamConfig& output_config); |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 131 | int ProcessStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 132 | int ProcessReverseStreamLocked() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
andrew@webrtc.org | 17e4064 | 2014-03-04 20:58:13 +0000 | [diff] [blame] | 133 | |
// Const boolean queries with no lock annotation. Three of them take the result
// of is_data_processed() as a parameter instead of recomputing it.
// NOTE(review): presumably these select which processing stages run; the
// exact conditions live in the .cc and should be confirmed there.
andrew@webrtc.org | 369166a | 2012-04-24 18:38:03 +0000 | [diff] [blame] | 134 | bool is_data_processed() const; |
andrew@webrtc.org | 17e4064 | 2014-03-04 20:58:13 +0000 | [diff] [blame] | 135 | bool output_copy_needed(bool is_data_processed) const; |
andrew@webrtc.org | 369166a | 2012-04-24 18:38:03 +0000 | [diff] [blame] | 136 | bool synthesis_needed(bool is_data_processed) const; |
| 137 | bool analysis_needed(bool is_data_processed) const; |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 138 | bool is_rev_processed() const; |
| 139 | bool rev_conversion_needed() const; |
// Per-feature initialization and histogram helpers, all annotated as requiring
// crit_ to be held by the caller.
Bjorn Volcker | adc46c4 | 2015-04-15 11:42:40 +0200 | [diff] [blame] | 140 | void InitializeExperimentalAgc() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
| 141 | void InitializeTransient() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
aluebs@webrtc.org | ae643ce | 2014-12-19 19:57:34 +0000 | [diff] [blame] | 142 | void InitializeBeamformer() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 143 | void InitializeIntelligibility() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
Bjorn Volcker | 1ca324f | 2015-06-29 14:57:29 +0200 | [diff] [blame] | 144 | void MaybeUpdateHistograms() EXCLUSIVE_LOCKS_REQUIRED(crit_); |
ajm@google.com | 808e0e0 | 2011-08-03 21:08:51 +0000 | [diff] [blame] | 145 | |
// Raw pointers to the concrete processing components.
// NOTE(review): ownership is not expressed in this header; presumably these
// are created in the constructor and released in the destructor (possibly via
// component_list_) - confirm in the .cc.
andrew@webrtc.org | 56e4a05 | 2014-02-27 22:23:17 +0000 | [diff] [blame] | 146 | EchoCancellationImpl* echo_cancellation_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 147 | EchoControlMobileImpl* echo_control_mobile_; |
| 148 | GainControlImpl* gain_control_; |
| 149 | HighPassFilterImpl* high_pass_filter_; |
| 150 | LevelEstimatorImpl* level_estimator_; |
| 151 | NoiseSuppressionImpl* noise_suppression_; |
| 152 | VoiceDetectionImpl* voice_detection_; |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 153 | rtc::scoped_ptr<GainControlForNewAgc> gain_control_for_new_agc_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 154 | |
| 155 | std::list<ProcessingComponent*> component_list_; |
// The lock named by every EXCLUSIVE_LOCKS_REQUIRED / GUARDED_BY annotation in
// this class. Held as a raw pointer; its lifetime management is not visible
// from this header - TODO confirm.
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 156 | CriticalSectionWrapper* crit_; |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 157 | rtc::scoped_ptr<AudioBuffer> render_audio_; |
| 158 | rtc::scoped_ptr<AudioBuffer> capture_audio_; |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 159 | rtc::scoped_ptr<AudioConverter> render_converter_; |
// The members below exist only in builds that define
// WEBRTC_AUDIOPROC_DEBUG_DUMP, so the class layout differs between the two
// configurations.
andrew@webrtc.org | 7bf2646 | 2011-12-03 00:03:31 +0000 | [diff] [blame] | 160 | #ifdef WEBRTC_AUDIOPROC_DEBUG_DUMP |
| 161 | // TODO(andrew): make this more graceful. Ideally we would split this stuff |
| 162 | // out into a separate class with an "enabled" and "disabled" implementation. |
| 163 | int WriteMessageToDebugFile(); |
| 164 | int WriteInitMessage(); |
Minyue | 13b96ba | 2015-10-03 00:39:14 +0200 | [diff] [blame] | 165 | |
| 166 | // Writes Config message. If not |forced|, only writes the current config if |
| 167 | // it is different from the last saved one; if |forced|, writes the config |
| 168 | // regardless of the last saved. |
| 169 | int WriteConfigMessage(bool forced); |
| 170 | |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 171 | rtc::scoped_ptr<FileWrapper> debug_file_; |
| 172 | rtc::scoped_ptr<audioproc::Event> event_msg_; // Protobuf message. |
andrew@webrtc.org | 60730cf | 2014-01-07 17:45:09 +0000 | [diff] [blame] | 173 | std::string event_str_; // Memory for protobuf serialization. |
Minyue | 13b96ba | 2015-10-03 00:39:14 +0200 | [diff] [blame] | 174 | |
| 175 | // Serialized string of last saved APM configuration. |
| 176 | std::string last_serialized_config_; |
andrew@webrtc.org | 7bf2646 | 2011-12-03 00:03:31 +0000 | [diff] [blame] | 177 | #endif |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 178 | |
// NOTE(review): the comment below refers to separate render and capture locks,
// but the only lock member declared in this class is crit_ - confirm which
// locking scheme is actually in effect.
// The default constructor fills api_format_ with four identical entries of
// {kSampleRate16kHz, 1, false}; presumably {sample rate, channel count,
// keyboard-channel flag} for each stream - TODO confirm against StreamConfig.
peah | 192164e | 2015-11-17 02:16:45 -0800 | [diff] [blame^] | 179 | // State that is written to while holding both the render and capture locks |
| 180 | // but can be read while holding only one of the locks. |
| 181 | struct SharedState { |
| 182 | SharedState() |
| 183 | : // Format of processing streams at input/output call sites. |
| 184 | api_format_({{{kSampleRate16kHz, 1, false}, |
| 185 | {kSampleRate16kHz, 1, false}, |
| 186 | {kSampleRate16kHz, 1, false}, |
| 187 | {kSampleRate16kHz, 1, false}}}) {} |
| 188 | ProcessingConfig api_format_; |
| 189 | } shared_state_; |
Michael Graczyk | 86c6d33 | 2015-07-23 11:41:39 -0700 | [diff] [blame] | 190 | |
| 191 | // Only the rate and samples fields of fwd_proc_format_ are used because the |
| 192 | // forward processing number of channels is mutable and is tracked by the |
| 193 | // capture_audio_. |
| 194 | StreamConfig fwd_proc_format_; |
| 195 | StreamConfig rev_proc_format_; |
andrew@webrtc.org | ddbb8a2 | 2014-04-22 21:00:04 +0000 | [diff] [blame] | 196 | int split_rate_; |
| 197 | |
// Stream delay bookkeeping. None of these members carries a GUARDED_BY
// annotation, unlike output_will_be_muted_ further down.
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 198 | int stream_delay_ms_; |
andrew@webrtc.org | 6f9f817 | 2012-03-06 19:03:39 +0000 | [diff] [blame] | 199 | int delay_offset_ms_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 200 | bool was_stream_delay_set_; |
Bjorn Volcker | 1ca324f | 2015-06-29 14:57:29 +0200 | [diff] [blame] | 201 | int last_stream_delay_ms_; |
| 202 | int last_aec_system_delay_ms_; |
Bjorn Volcker | 4e7aa43 | 2015-07-07 11:50:05 +0200 | [diff] [blame] | 203 | int stream_delay_jumps_; |
| 204 | int aec_system_delay_jumps_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 205 | |
Bjorn Volcker | 424694c | 2015-03-27 11:30:43 +0100 | [diff] [blame] | 206 | bool output_will_be_muted_ GUARDED_BY(crit_); |
andrew@webrtc.org | 75dd288 | 2014-02-11 20:52:30 +0000 | [diff] [blame] | 207 | |
| 208 | bool key_pressed_; |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 209 | |
| 210 | // Only set through the constructor's Config parameter. |
| 211 | const bool use_new_agc_; |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 212 | rtc::scoped_ptr<AgcManagerDirect> agc_manager_ GUARDED_BY(crit_); |
Bjorn Volcker | adc46c4 | 2015-04-15 11:42:40 +0200 | [diff] [blame] | 213 | int agc_startup_min_volume_; |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 214 | |
// transient_suppressor_enabled_ and intelligibility_enabled_ are mutable
// flags, whereas beamformer_enabled_, array_geometry_ and target_direction_
// are const and therefore fixed once the constructor has run.
| 215 | bool transient_suppressor_enabled_; |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 216 | rtc::scoped_ptr<TransientSuppressor> transient_suppressor_; |
aluebs@webrtc.org | ae643ce | 2014-12-19 19:57:34 +0000 | [diff] [blame] | 217 | const bool beamformer_enabled_; |
Michael Graczyk | dfa3605 | 2015-03-25 16:37:27 -0700 | [diff] [blame] | 218 | rtc::scoped_ptr<Beamformer<float>> beamformer_; |
aluebs@webrtc.org | fb7a039 | 2015-01-05 21:58:58 +0000 | [diff] [blame] | 219 | const std::vector<Point> array_geometry_; |
Alejandro Luebs | cb3f9bd | 2015-10-29 18:21:34 -0700 | [diff] [blame] | 220 | const SphericalPointf target_direction_; |
ekmeyerson | 60d9b33 | 2015-08-14 10:35:55 -0700 | [diff] [blame] | 221 | |
| 222 | bool intelligibility_enabled_; |
| 223 | rtc::scoped_ptr<IntelligibilityEnhancer> intelligibility_enhancer_; |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 224 | }; |
andrew@webrtc.org | ddbb8a2 | 2014-04-22 21:00:04 +0000 | [diff] [blame] | 225 | |
niklase@google.com | 470e71d | 2011-07-07 08:21:25 +0000 | [diff] [blame] | 226 | } // namespace webrtc |
| 227 | |
pbos@webrtc.org | 788acd1 | 2014-12-15 09:41:24 +0000 | [diff] [blame] | 228 | #endif // WEBRTC_MODULES_AUDIO_PROCESSING_AUDIO_PROCESSING_IMPL_H_ |