blob: 5f1a41401902f934a1d85686904b413b9ea12a7d [file] [log] [blame]
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +00001/*
2 * Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_
12#define MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000013
Ivo Creusen3ce44a32019-10-31 14:38:11 +010014#include "api/neteq/neteq.h"
15#include "api/neteq/neteq_controller.h"
16#include "api/neteq/tick_timer.h"
Ivo Creusen53a31f72019-10-24 15:20:39 +020017#include "modules/audio_coding/neteq/buffer_level_filter.h"
Ivo Creusen53a31f72019-10-24 15:20:39 +020018#include "modules/audio_coding/neteq/delay_manager.h"
Steve Anton10542f22019-01-11 09:11:00 -080019#include "rtc_base/constructor_magic.h"
Jakob Ivarsson46dda832019-07-03 16:00:30 +020020#include "rtc_base/experiments/field_trial_parser.h"
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000021
22namespace webrtc {
23
Henrik Lundin7687ad52018-07-02 10:14:46 +020024// This is the class for the decision tree implementation.
Ivo Creusen53a31f72019-10-24 15:20:39 +020025class DecisionLogic : public NetEqController {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000026 public:
Henrik Lundin7687ad52018-07-02 10:14:46 +020027 static const int kReinitAfterExpands = 100;
28 static const int kMaxWaitForPacket = 10;
29
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000030 // Constructor.
Ivo Creusen53a31f72019-10-24 15:20:39 +020031 DecisionLogic(NetEqController::Config config);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000032
Ivo Creusen53a31f72019-10-24 15:20:39 +020033 ~DecisionLogic() override;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000034
35 // Resets object to a clean state.
Ivo Creusen53a31f72019-10-24 15:20:39 +020036 void Reset() override;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000037
38 // Resets parts of the state. Typically done when switching codecs.
Ivo Creusen53a31f72019-10-24 15:20:39 +020039 void SoftReset() override;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000040
41 // Sets the sample rate and the output block size.
Ivo Creusen53a31f72019-10-24 15:20:39 +020042 void SetSampleRate(int fs_hz, size_t output_size_samples) override;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000043
Ivo Creusen53a31f72019-10-24 15:20:39 +020044 // Given info about the latest received packet, and current jitter buffer
45 // status, returns the operation. |target_timestamp| and |expand_mutefactor|
46 // are provided for reference. |last_packet_samples| is the number of samples
ossu7a377612016-10-18 04:06:13 -070047 // obtained from the last decoded frame. If there is a packet available, it
Ivo Creusen53a31f72019-10-24 15:20:39 +020048 // should be supplied in |packet|; otherwise it should be NULL. The mode
ossu7a377612016-10-18 04:06:13 -070049 // resulting from the last call to NetEqImpl::GetAudio is supplied in
Ivo Creusen53a31f72019-10-24 15:20:39 +020050 // |last_mode|. If there is a DTMF event to play, |play_dtmf| should be set to
ossu7a377612016-10-18 04:06:13 -070051 // true. The output variable |reset_decoder| will be set to true if a reset is
52 // required; otherwise it is left unchanged (i.e., it can remain true if it
Ivo Creusen53a31f72019-10-24 15:20:39 +020053 // was true before the call).
Ivo Creusen3ce44a32019-10-31 14:38:11 +010054 NetEq::Operation GetDecision(const NetEqController::NetEqStatus& status,
55 bool* reset_decoder) override;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000056
57 // These methods test the |cng_state_| for different conditions.
Ivo Creusen53a31f72019-10-24 15:20:39 +020058 bool CngRfc3389On() const override { return cng_state_ == kCngRfc3389On; }
59 bool CngOff() const override { return cng_state_ == kCngOff; }
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000060
61 // Resets the |cng_state_| to kCngOff.
Ivo Creusen53a31f72019-10-24 15:20:39 +020062 void SetCngOff() override { cng_state_ = kCngOff; }
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000063
64 // Reports back to DecisionLogic whether the decision to do expand remains or
65 // not. Note that this is necessary, since an expand decision can be changed
66 // to kNormal in NetEqImpl::GetDecision if there is still enough data in the
67 // sync buffer.
Ivo Creusen3ce44a32019-10-31 14:38:11 +010068 void ExpandDecision(NetEq::Operation operation) override;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000069
70 // Adds |value| to |sample_memory_|.
Ivo Creusen53a31f72019-10-24 15:20:39 +020071 void AddSampleMemory(int32_t value) override { sample_memory_ += value; }
72
73 int TargetLevelMs() override {
74 return ((delay_manager_->TargetLevel() * packet_length_samples_) >> 8) /
75 rtc::CheckedDivExact(sample_rate_, 1000);
76 }
77
78 absl::optional<int> PacketArrived(bool last_cng_or_dtmf,
79 size_t packet_length_samples,
80 bool should_update_stats,
81 uint16_t main_sequence_number,
82 uint32_t main_timestamp,
83 int fs_hz) override;
84
85 void RegisterEmptyPacket() override { delay_manager_->RegisterEmptyPacket(); }
86
87 bool SetMaximumDelay(int delay_ms) override {
88 return delay_manager_->SetMaximumDelay(delay_ms);
89 }
90 bool SetMinimumDelay(int delay_ms) override {
91 return delay_manager_->SetMinimumDelay(delay_ms);
92 }
93 bool SetBaseMinimumDelay(int delay_ms) override {
94 return delay_manager_->SetBaseMinimumDelay(delay_ms);
95 }
96 int GetBaseMinimumDelay() const override {
97 return delay_manager_->GetBaseMinimumDelay();
98 }
Jakob Ivarssonbd5874a2020-01-07 17:07:40 +010099 bool PeakFound() const override { return false; }
Ivo Creusen53a31f72019-10-24 15:20:39 +0200100
Ivo Creusenca585bb2019-11-04 16:40:04 +0100101 int GetFilteredBufferLevel() const override {
Ivo Creusen53a31f72019-10-24 15:20:39 +0200102 return buffer_level_filter_.filtered_current_level();
103 }
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000104
105 // Accessors and mutators.
Ivo Creusen53a31f72019-10-24 15:20:39 +0200106 void set_sample_memory(int32_t value) override { sample_memory_ = value; }
107 size_t noise_fast_forward() const override { return noise_fast_forward_; }
108 size_t packet_length_samples() const override {
109 return packet_length_samples_;
110 }
111 void set_packet_length_samples(size_t value) override {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000112 packet_length_samples_ = value;
113 }
Ivo Creusen53a31f72019-10-24 15:20:39 +0200114 void set_prev_time_scale(bool value) override { prev_time_scale_ = value; }
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000115
Henrik Lundin7687ad52018-07-02 10:14:46 +0200116 private:
Henrik Lundin47b17dc2016-05-10 10:20:59 +0200117 // The value 5 sets maximum time-stretch rate to about 100 ms/s.
118 static const int kMinTimescaleInterval = 5;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000119
Yves Gerey665174f2018-06-19 15:03:05 +0200120 enum CngState { kCngOff, kCngRfc3389On, kCngInternalOn };
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000121
Henrik Lundin7687ad52018-07-02 10:14:46 +0200122 // Updates the |buffer_level_filter_| with the current buffer level
123 // |buffer_size_packets|.
Minyue Li7d204d52019-04-16 11:44:49 +0200124 void FilterBufferLevel(size_t buffer_size_packets);
Henrik Lundin7687ad52018-07-02 10:14:46 +0200125
Henrik Lundin7687ad52018-07-02 10:14:46 +0200126 // Returns the operation given that the next available packet is a comfort
127 // noise payload (RFC 3389 only, not codec-internal).
Ivo Creusenca585bb2019-11-04 16:40:04 +0100128 virtual NetEq::Operation CngOperation(NetEq::Mode prev_mode,
129 uint32_t target_timestamp,
130 uint32_t available_timestamp,
131 size_t generated_noise_samples);
Henrik Lundin7687ad52018-07-02 10:14:46 +0200132
133 // Returns the operation given that no packets are available (except maybe
134 // a DTMF event, flagged by setting |play_dtmf| true).
Ivo Creusenca585bb2019-11-04 16:40:04 +0100135 virtual NetEq::Operation NoPacket(bool play_dtmf);
Henrik Lundin7687ad52018-07-02 10:14:46 +0200136
137 // Returns the operation to do given that the expected packet is available.
Ivo Creusenca585bb2019-11-04 16:40:04 +0100138 virtual NetEq::Operation ExpectedPacketAvailable(NetEq::Mode prev_mode,
139 bool play_dtmf);
Henrik Lundin7687ad52018-07-02 10:14:46 +0200140
141 // Returns the operation to do given that the expected packet is not
142 // available, but a packet further into the future is at hand.
Ivo Creusenca585bb2019-11-04 16:40:04 +0100143 virtual NetEq::Operation FuturePacketAvailable(
144 size_t decoder_frame_length,
145 NetEq::Mode prev_mode,
146 uint32_t target_timestamp,
147 uint32_t available_timestamp,
148 bool play_dtmf,
149 size_t generated_noise_samples,
150 size_t span_samples_in_packet_buffer,
151 size_t num_packets_in_packet_buffer);
Henrik Lundin7687ad52018-07-02 10:14:46 +0200152
153 // Checks if enough time has elapsed since the last successful timescale
154 // operation was done (i.e., accelerate or preemptive expand).
155 bool TimescaleAllowed() const {
156 return !timescale_countdown_ || timescale_countdown_->Finished();
157 }
158
159 // Checks if the current (filtered) buffer level is under the target level.
160 bool UnderTargetLevel() const;
161
162 // Checks if |timestamp_leap| is so long into the future that a reset due
163 // to exceeding kReinitAfterExpands will be done.
164 bool ReinitAfterExpands(uint32_t timestamp_leap) const;
165
166 // Checks if we still have not done enough expands to cover the distance from
167 // the last decoded packet to the next available packet, the distance beeing
168 // conveyed in |timestamp_leap|.
169 bool PacketTooEarly(uint32_t timestamp_leap) const;
170
171 // Checks if num_consecutive_expands_ >= kMaxWaitForPacket.
172 bool MaxWaitForPacket() const;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000173
Ivo Creusen53a31f72019-10-24 15:20:39 +0200174 std::unique_ptr<DelayManager> delay_manager_;
175 BufferLevelFilter buffer_level_filter_;
Henrik Lundin47b17dc2016-05-10 10:20:59 +0200176 const TickTimer* tick_timer_;
Jakob Ivarsson46dda832019-07-03 16:00:30 +0200177 int sample_rate_;
Peter Kastingdce40cf2015-08-24 14:52:23 -0700178 size_t output_size_samples_;
Ivo Creusen53a31f72019-10-24 15:20:39 +0200179 CngState cng_state_ = kCngOff; // Remember if comfort noise is interrupted by
180 // other event (e.g., DTMF).
henrik.lundinb1fb72b2016-05-03 08:18:47 -0700181 size_t noise_fast_forward_ = 0;
Ivo Creusen53a31f72019-10-24 15:20:39 +0200182 size_t packet_length_samples_ = 0;
183 int sample_memory_ = 0;
184 bool prev_time_scale_ = false;
Henrik Lundin7687ad52018-07-02 10:14:46 +0200185 bool disallow_time_stretching_;
Henrik Lundin47b17dc2016-05-10 10:20:59 +0200186 std::unique_ptr<TickTimer::Countdown> timescale_countdown_;
Ivo Creusen53a31f72019-10-24 15:20:39 +0200187 int num_consecutive_expands_ = 0;
188 int time_stretched_cn_samples_ = 0;
Jakob Ivarsson46dda832019-07-03 16:00:30 +0200189 FieldTrialParameter<bool> estimate_dtx_delay_;
190 FieldTrialParameter<bool> time_stretch_cn_;
191 FieldTrialConstrained<int> target_level_window_ms_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000192
henrikg3c089d72015-09-16 05:37:44 -0700193 RTC_DISALLOW_COPY_AND_ASSIGN(DecisionLogic);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000194};
195
196} // namespace webrtc
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200197#endif // MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_