/*
 *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
| 10 | |
henrik.lundin@webrtc.org | 9c55f0f | 2014-06-09 08:10:28 +0000 | [diff] [blame] | 11 | #ifndef WEBRTC_MODULES_AUDIO_CODING_NETEQ_EXPAND_H_ |
| 12 | #define WEBRTC_MODULES_AUDIO_CODING_NETEQ_EXPAND_H_ |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 13 | |
| 14 | #include <assert.h> |
| 15 | |
henrike@webrtc.org | 88fbb2d | 2014-05-21 21:18:46 +0000 | [diff] [blame] | 16 | #include "webrtc/base/constructormagic.h" |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 17 | #include "webrtc/base/scoped_ptr.h" |
henrik.lundin@webrtc.org | 9c55f0f | 2014-06-09 08:10:28 +0000 | [diff] [blame] | 18 | #include "webrtc/modules/audio_coding/neteq/audio_multi_vector.h" |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 19 | #include "webrtc/typedefs.h" |
| 20 | |
| 21 | namespace webrtc { |
| 22 | |
// Forward declarations. Only pointers to these types appear in this header,
// so their full definitions are not needed here.
class BackgroundNoise;
class RandomVector;
class StatisticsCalculator;
class SyncBuffer;
| 28 | |
| 29 | // This class handles extrapolation of audio data from the sync_buffer to |
| 30 | // produce packet-loss concealment. |
| 31 | // TODO(hlundin): Refactor this class to divide the long methods into shorter |
| 32 | // ones. |
| 33 | class Expand { |
| 34 | public: |
| 35 | Expand(BackgroundNoise* background_noise, |
| 36 | SyncBuffer* sync_buffer, |
| 37 | RandomVector* random_vector, |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 38 | StatisticsCalculator* statistics, |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 39 | int fs, |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 40 | size_t num_channels); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 41 | |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 42 | virtual ~Expand(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 43 | |
| 44 | // Resets the object. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 45 | virtual void Reset(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 46 | |
| 47 | // The main method to produce concealment data. The data is appended to the |
| 48 | // end of |output|. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 49 | virtual int Process(AudioMultiVector* output); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 50 | |
| 51 | // Prepare the object to do extra expansion during normal operation following |
| 52 | // a period of expands. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 53 | virtual void SetParametersForNormalAfterExpand(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 54 | |
| 55 | // Prepare the object to do extra expansion during merge operation following |
| 56 | // a period of expands. |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 57 | virtual void SetParametersForMergeAfterExpand(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 58 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 59 | // Returns the mute factor for |channel|. |
| 60 | int16_t MuteFactor(size_t channel) { |
| 61 | assert(channel < num_channels_); |
| 62 | return channel_parameters_[channel].mute_factor; |
| 63 | } |
| 64 | |
| 65 | // Accessors and mutators. |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 66 | virtual size_t overlap_length() const; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame^] | 67 | size_t max_lag() const { return max_lag_; } |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 68 | |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 69 | protected: |
| 70 | static const int kMaxConsecutiveExpands = 200; |
Peter Kasting | b7e5054 | 2015-06-11 12:55:50 -0700 | [diff] [blame] | 71 | void GenerateRandomVector(int16_t seed_increment, |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 72 | size_t length, |
| 73 | int16_t* random_vector); |
| 74 | |
| 75 | void GenerateBackgroundNoise(int16_t* random_vector, |
| 76 | size_t channel, |
Peter Kasting | 36b7cc3 | 2015-06-11 19:57:18 -0700 | [diff] [blame] | 77 | int mute_slope, |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 78 | bool too_many_expands, |
| 79 | size_t num_noise_samples, |
| 80 | int16_t* buffer); |
| 81 | |
| 82 | // Initializes member variables at the beginning of an expand period. |
| 83 | void InitializeForAnExpandPeriod(); |
| 84 | |
| 85 | bool TooManyExpands(); |
| 86 | |
| 87 | // Analyzes the signal history in |sync_buffer_|, and set up all parameters |
| 88 | // necessary to produce concealment data. |
| 89 | void AnalyzeSignal(int16_t* random_vector); |
| 90 | |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 91 | RandomVector* const random_vector_; |
| 92 | SyncBuffer* const sync_buffer_; |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 93 | bool first_expand_; |
| 94 | const int fs_hz_; |
| 95 | const size_t num_channels_; |
| 96 | int consecutive_expands_; |
| 97 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 98 | private: |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame^] | 99 | static const size_t kUnvoicedLpcOrder = 6; |
| 100 | static const size_t kNumCorrelationCandidates = 3; |
| 101 | static const size_t kDistortionLength = 20; |
| 102 | static const size_t kLpcAnalysisLength = 160; |
| 103 | static const size_t kMaxSampleRate = 48000; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 104 | static const int kNumLags = 3; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 105 | |
| 106 | struct ChannelParameters { |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 107 | ChannelParameters(); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 108 | int16_t mute_factor; |
| 109 | int16_t ar_filter[kUnvoicedLpcOrder + 1]; |
| 110 | int16_t ar_filter_state[kUnvoicedLpcOrder]; |
| 111 | int16_t ar_gain; |
| 112 | int16_t ar_gain_scale; |
| 113 | int16_t voice_mix_factor; /* Q14 */ |
| 114 | int16_t current_voice_mix_factor; /* Q14 */ |
henrik.lundin@webrtc.org | 1871dd2 | 2013-10-14 20:33:25 +0000 | [diff] [blame] | 115 | AudioVector expand_vector0; |
| 116 | AudioVector expand_vector1; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 117 | bool onset; |
Peter Kasting | 36b7cc3 | 2015-06-11 19:57:18 -0700 | [diff] [blame] | 118 | int mute_slope; /* Q20 */ |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 119 | }; |
| 120 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 121 | // Calculate the auto-correlation of |input|, with length |input_length| |
| 122 | // samples. The correlation is calculated from a downsampled version of |
| 123 | // |input|, and is written to |output|. The scale factor is written to |
Peter Kasting | 728d903 | 2015-06-11 14:31:38 -0700 | [diff] [blame] | 124 | // |output_scale|. |
| 125 | void Correlation(const int16_t* input, |
| 126 | size_t input_length, |
| 127 | int16_t* output, |
Peter Kasting | 36b7cc3 | 2015-06-11 19:57:18 -0700 | [diff] [blame] | 128 | int* output_scale) const; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 129 | |
| 130 | void UpdateLagIndex(); |
| 131 | |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 132 | BackgroundNoise* const background_noise_; |
| 133 | StatisticsCalculator* const statistics_; |
henrik.lundin@webrtc.org | 340746a | 2014-02-17 11:37:16 +0000 | [diff] [blame] | 134 | const size_t overlap_length_; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame^] | 135 | size_t max_lag_; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 136 | size_t expand_lags_[kNumLags]; |
| 137 | int lag_index_direction_; |
| 138 | int current_lag_index_; |
| 139 | bool stop_muting_; |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 140 | size_t expand_duration_samples_; |
kwiberg@webrtc.org | 00b8f6b | 2015-02-26 14:34:55 +0000 | [diff] [blame] | 141 | rtc::scoped_ptr<ChannelParameters[]> channel_parameters_; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 142 | |
| 143 | DISALLOW_COPY_AND_ASSIGN(Expand); |
| 144 | }; |
| 145 | |
henrik.lundin@webrtc.org | d9faa46 | 2014-01-14 10:18:45 +0000 | [diff] [blame] | 146 | struct ExpandFactory { |
| 147 | ExpandFactory() {} |
| 148 | virtual ~ExpandFactory() {} |
| 149 | |
| 150 | virtual Expand* Create(BackgroundNoise* background_noise, |
| 151 | SyncBuffer* sync_buffer, |
| 152 | RandomVector* random_vector, |
Henrik Lundin | bef77e2 | 2015-08-18 14:58:09 +0200 | [diff] [blame] | 153 | StatisticsCalculator* statistics, |
henrik.lundin@webrtc.org | d9faa46 | 2014-01-14 10:18:45 +0000 | [diff] [blame] | 154 | int fs, |
| 155 | size_t num_channels) const; |
| 156 | }; |
| 157 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 158 | } // namespace webrtc |
henrik.lundin@webrtc.org | 9c55f0f | 2014-06-09 08:10:28 +0000 | [diff] [blame] | 159 | #endif // WEBRTC_MODULES_AUDIO_CODING_NETEQ_EXPAND_H_ |