henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #ifndef MODULES_AUDIO_CODING_NETEQ_EXPAND_H_ |
| 12 | #define MODULES_AUDIO_CODING_NETEQ_EXPAND_H_ |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 13 | |
| 14 | #include <assert.h> |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame^] | 15 | |
kwiberg | 2d0c332 | 2016-02-14 09:28:33 -0800 | [diff] [blame] | 16 | #include <memory> |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 17 | |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 18 | #include "modules/audio_coding/neteq/audio_vector.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 19 | #include "rtc_base/constructor_magic.h" |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 20 | |
| 21 | namespace webrtc { |
| 22 | |
| 23 | // Forward declarations. |
Yves Gerey | 988cc08 | 2018-10-23 12:03:01 +0200 | [diff] [blame] | 24 | class AudioMultiVector; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 25 | class BackgroundNoise; |
| 26 | class RandomVector; |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 27 | class StatisticsCalculator; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 28 | class SyncBuffer; |
| 29 | |
| 30 | // This class handles extrapolation of audio data from the sync_buffer to |
| 31 | // produce packet-loss concealment. |
| 32 | // TODO(hlundin): Refactor this class to divide the long methods into shorter |
| 33 | // ones. |
| 34 | class Expand { |
| 35 | public: |
| 36 | Expand(BackgroundNoise* background_noise, |
| 37 | SyncBuffer* sync_buffer, |
| 38 | RandomVector* random_vector, |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 39 | StatisticsCalculator* statistics, |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 40 | int fs, |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 41 | size_t num_channels); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 42 | |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 43 | virtual ~Expand(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 44 | |
| 45 | // Resets the object. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 46 | virtual void Reset(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 47 | |
| 48 | // The main method to produce concealment data. The data is appended to the |
| 49 | // end of |output|. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 50 | virtual int Process(AudioMultiVector* output); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 51 | |
| 52 | // Prepare the object to do extra expansion during normal operation following |
| 53 | // a period of expands. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 54 | virtual void SetParametersForNormalAfterExpand(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 55 | |
| 56 | // Prepare the object to do extra expansion during merge operation following |
| 57 | // a period of expands. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 58 | virtual void SetParametersForMergeAfterExpand(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 59 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 60 | // Returns the mute factor for |channel|. |
Ivo Creusen | c7f09ad | 2018-05-22 13:21:01 +0200 | [diff] [blame] | 61 | int16_t MuteFactor(size_t channel) const { |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 62 | assert(channel < num_channels_); |
| 63 | return channel_parameters_[channel].mute_factor; |
| 64 | } |
| 65 | |
henrik.lundin | f3995f7 | 2016-05-10 05:54:35 -0700 | [diff] [blame] | 66 | // Returns true if expansion has been faded down to zero amplitude (for all |
| 67 | // channels); false otherwise. |
| 68 | bool Muted() const; |
| 69 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 70 | // Accessors and mutators. |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 71 | virtual size_t overlap_length() const; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 72 | size_t max_lag() const { return max_lag_; } |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 73 | |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 74 | protected: |
| 75 | static const int kMaxConsecutiveExpands = 200; |
Peter Kasting | b7e5054 | 2015-06-11 12:55:50 -0700 | [diff] [blame] | 76 | void GenerateRandomVector(int16_t seed_increment, |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 77 | size_t length, |
| 78 | int16_t* random_vector); |
| 79 | |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 80 | // Initializes member variables at the beginning of an expand period. |
| 81 | void InitializeForAnExpandPeriod(); |
| 82 | |
| 83 | bool TooManyExpands(); |
| 84 | |
| 85 | // Analyzes the signal history in |sync_buffer_|, and set up all parameters |
| 86 | // necessary to produce concealment data. |
| 87 | void AnalyzeSignal(int16_t* random_vector); |
| 88 | |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 89 | RandomVector* const random_vector_; |
| 90 | SyncBuffer* const sync_buffer_; |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 91 | bool first_expand_; |
| 92 | const int fs_hz_; |
| 93 | const size_t num_channels_; |
| 94 | int consecutive_expands_; |
| 95 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 96 | private: |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 97 | static const size_t kUnvoicedLpcOrder = 6; |
| 98 | static const size_t kNumCorrelationCandidates = 3; |
| 99 | static const size_t kDistortionLength = 20; |
| 100 | static const size_t kLpcAnalysisLength = 160; |
| 101 | static const size_t kMaxSampleRate = 48000; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 102 | static const int kNumLags = 3; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 103 | |
| 104 | struct ChannelParameters { |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 105 | ChannelParameters(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 106 | int16_t mute_factor; |
| 107 | int16_t ar_filter[kUnvoicedLpcOrder + 1]; |
| 108 | int16_t ar_filter_state[kUnvoicedLpcOrder]; |
| 109 | int16_t ar_gain; |
| 110 | int16_t ar_gain_scale; |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame] | 111 | int16_t voice_mix_factor; /* Q14 */ |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 112 | int16_t current_voice_mix_factor; /* Q14 */ |
henrik.lundin@webrtc.org | 1871dd2 | 2013-10-14 20:33:25 +0000 | [diff] [blame] | 113 | AudioVector expand_vector0; |
| 114 | AudioVector expand_vector1; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 115 | bool onset; |
Peter Kasting | 36b7cc3 | 2015-06-11 19:57:18 -0700 | [diff] [blame] | 116 | int mute_slope; /* Q20 */ |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 117 | }; |
| 118 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 119 | // Calculate the auto-correlation of |input|, with length |input_length| |
| 120 | // samples. The correlation is calculated from a downsampled version of |
minyue | 53ff70f | 2016-05-02 01:50:30 -0700 | [diff] [blame] | 121 | // |input|, and is written to |output|. |
Peter Kasting | 728d903 | 2015-06-11 14:31:38 -0700 | [diff] [blame] | 122 | void Correlation(const int16_t* input, |
| 123 | size_t input_length, |
minyue | 53ff70f | 2016-05-02 01:50:30 -0700 | [diff] [blame] | 124 | int16_t* output) const; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 125 | |
| 126 | void UpdateLagIndex(); |
| 127 | |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 128 | BackgroundNoise* const background_noise_; |
| 129 | StatisticsCalculator* const statistics_; |
henrik.lundin@webrtc.org | 340746a | 2014-02-17 11:37:16 +0000 | [diff] [blame] | 130 | const size_t overlap_length_; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 131 | size_t max_lag_; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 132 | size_t expand_lags_[kNumLags]; |
| 133 | int lag_index_direction_; |
| 134 | int current_lag_index_; |
| 135 | bool stop_muting_; |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 136 | size_t expand_duration_samples_; |
kwiberg | 2d0c332 | 2016-02-14 09:28:33 -0800 | [diff] [blame] | 137 | std::unique_ptr<ChannelParameters[]> channel_parameters_; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 138 | |
henrikg | 3c089d7 | 2015-09-16 05:37:44 -0700 | [diff] [blame] | 139 | RTC_DISALLOW_COPY_AND_ASSIGN(Expand); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 140 | }; |
| 141 | |
henrik.lundin@webrtc.org | d9faa46 | 2014-01-14 10:18:45 +0000 | [diff] [blame] | 142 | struct ExpandFactory { |
| 143 | ExpandFactory() {} |
| 144 | virtual ~ExpandFactory() {} |
| 145 | |
| 146 | virtual Expand* Create(BackgroundNoise* background_noise, |
| 147 | SyncBuffer* sync_buffer, |
| 148 | RandomVector* random_vector, |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 149 | StatisticsCalculator* statistics, |
henrik.lundin@webrtc.org | d9faa46 | 2014-01-14 10:18:45 +0000 | [diff] [blame] | 150 | int fs, |
| 151 | size_t num_channels) const; |
| 152 | }; |
| 153 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 154 | } // namespace webrtc |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 155 | #endif // MODULES_AUDIO_CODING_NETEQ_EXPAND_H_ |