/*
 *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #ifndef MODULES_AUDIO_CODING_NETEQ_MERGE_H_ |
| 12 | #define MODULES_AUDIO_CODING_NETEQ_MERGE_H_ |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 13 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 14 | #include "modules/audio_coding/neteq/audio_multi_vector.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame^] | 15 | #include "rtc_base/constructor_magic.h" |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 16 | |
| 17 | namespace webrtc { |
| 18 | |
// These types are only referred to through pointers in this header, so
// forward declarations are enough here.
class Expand;
class SyncBuffer;
| 22 | |
// This class handles the transition from expansion to normal operation.
// When a packet is not available for decoding when needed, the expand operation
// is called to generate extrapolation data. If the missing packet arrives,
// i.e., it was just delayed, it can be decoded and appended directly to the
// end of the expanded data (thanks to how the Expand class operates). However,
// if a later packet arrives instead, the loss is a fact, and the new data must
// be stitched together with the end of the expanded data. This stitching is
// what the Merge class does.
| 31 | class Merge { |
| 32 | public: |
Karl Wiberg | 7f6c4d4 | 2015-04-09 15:44:22 +0200 | [diff] [blame] | 33 | Merge(int fs_hz, |
| 34 | size_t num_channels, |
| 35 | Expand* expand, |
| 36 | SyncBuffer* sync_buffer); |
minyue | 5bd3397 | 2016-05-02 04:46:11 -0700 | [diff] [blame] | 37 | virtual ~Merge(); |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 38 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 39 | // The main method to produce the audio data. The decoded data is supplied in |
| 40 | // |input|, having |input_length| samples in total for all channels |
| 41 | // (interleaved). The result is written to |output|. The number of channels |
| 42 | // allocated in |output| defines the number of channels that will be used when |
Henrik Lundin | 6dc82e8 | 2018-05-22 10:40:23 +0200 | [diff] [blame] | 43 | // de-interleaving |input|. |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame] | 44 | virtual size_t Process(int16_t* input, |
| 45 | size_t input_length, |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 46 | AudioMultiVector* output); |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 47 | |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 48 | virtual size_t RequiredFutureSamples(); |
turaj@webrtc.org | 8d1cdaa | 2014-04-11 18:47:55 +0000 | [diff] [blame] | 49 | |
| 50 | protected: |
| 51 | const int fs_hz_; |
| 52 | const size_t num_channels_; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 53 | |
| 54 | private: |
| 55 | static const int kMaxSampleRate = 48000; |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 56 | static const size_t kExpandDownsampLength = 100; |
| 57 | static const size_t kInputDownsampLength = 40; |
| 58 | static const size_t kMaxCorrelationLength = 60; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 59 | |
| 60 | // Calls |expand_| to get more expansion data to merge with. The data is |
| 61 | // written to |expanded_signal_|. Returns the length of the expanded data, |
| 62 | // while |expand_period| will be the number of samples in one expansion period |
| 63 | // (typically one pitch period). The value of |old_length| will be the number |
| 64 | // of samples that were taken from the |sync_buffer_|. |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 65 | size_t GetExpandedSignal(size_t* old_length, size_t* expand_period); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 66 | |
minyue | 53ff70f | 2016-05-02 01:50:30 -0700 | [diff] [blame] | 67 | // Analyzes |input| and |expanded_signal| and returns muting factor (Q14) to |
| 68 | // be used on the new data. |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame] | 69 | int16_t SignalScaling(const int16_t* input, |
| 70 | size_t input_length, |
minyue | 53ff70f | 2016-05-02 01:50:30 -0700 | [diff] [blame] | 71 | const int16_t* expanded_signal) const; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 72 | |
| 73 | // Downsamples |input| (|input_length| samples) and |expanded_signal| to |
| 74 | // 4 kHz sample rate. The downsampled signals are written to |
| 75 | // |input_downsampled_| and |expanded_downsampled_|, respectively. |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame] | 76 | void Downsample(const int16_t* input, |
| 77 | size_t input_length, |
| 78 | const int16_t* expanded_signal, |
| 79 | size_t expanded_length); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 80 | |
| 81 | // Calculates cross-correlation between |input_downsampled_| and |
| 82 | // |expanded_downsampled_|, and finds the correlation maximum. The maximizing |
| 83 | // lag is returned. |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame] | 84 | size_t CorrelateAndPeakSearch(size_t start_position, |
| 85 | size_t input_length, |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 86 | size_t expand_period) const; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 87 | |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 88 | const int fs_mult_; // fs_hz_ / 8000. |
Peter Kasting | dce40cf | 2015-08-24 14:52:23 -0700 | [diff] [blame] | 89 | const size_t timestamps_per_call_; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 90 | Expand* expand_; |
| 91 | SyncBuffer* sync_buffer_; |
| 92 | int16_t expanded_downsampled_[kExpandDownsampLength]; |
| 93 | int16_t input_downsampled_[kInputDownsampLength]; |
henrik.lundin@webrtc.org | fd11bbf | 2013-09-30 20:38:44 +0000 | [diff] [blame] | 94 | AudioMultiVector expanded_; |
minyue | 5bd3397 | 2016-05-02 04:46:11 -0700 | [diff] [blame] | 95 | std::vector<int16_t> temp_data_; |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 96 | |
henrikg | 3c089d7 | 2015-09-16 05:37:44 -0700 | [diff] [blame] | 97 | RTC_DISALLOW_COPY_AND_ASSIGN(Merge); |
henrik.lundin@webrtc.org | d94659d | 2013-01-29 12:09:21 +0000 | [diff] [blame] | 98 | }; |
| 99 | |
| 100 | } // namespace webrtc |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 101 | #endif // MODULES_AUDIO_CODING_NETEQ_MERGE_H_ |