blob: 01819eac659a32635bd088c294d1262fef9de023 [file] [log] [blame]
/*
 *  Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_
12#define MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_
philipel02447bc2016-05-13 06:01:03 -070013
14#include <array>
Yves Gerey665174f2018-06-19 15:03:05 +020015#include <deque>
philipel02447bc2016-05-13 06:01:03 -070016#include <map>
kwibergfd8be342016-05-14 19:44:11 -070017#include <memory>
philipel02447bc2016-05-13 06:01:03 -070018#include <set>
19#include <utility>
20
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020021#include "modules/include/module_common_types.h"
philipel2837edc2018-10-02 13:55:47 +020022#include "modules/rtp_rtcp/source/rtp_generic_frame_descriptor.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020023#include "rtc_base/criticalsection.h"
Bjorn Tereliusa194e582017-10-25 13:07:09 +020024#include "rtc_base/numerics/sequence_number_util.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "rtc_base/thread_annotations.h"
philipel02447bc2016-05-13 06:01:03 -070026
27namespace webrtc {
28namespace video_coding {
29
// Forward declarations; only pointers/smart pointers to these types are used
// in this header.
class EncodedFrame;
class RtpFrameObject;

// Interface for receiving complete frames.
//
// A complete frame is a frame which has received all its packets and all its
// references are known.
class OnCompleteFrameCallback {
 public:
  virtual ~OnCompleteFrameCallback() = default;

  // Called with a complete frame. Ownership of |frame| is transferred to the
  // callee.
  virtual void OnCompleteFrame(std::unique_ptr<EncodedFrame> frame) = 0;
};
philipel02447bc2016-05-13 06:01:03 -070040
41class RtpFrameReferenceFinder {
42 public:
43 explicit RtpFrameReferenceFinder(OnCompleteFrameCallback* frame_callback);
Mirko Bonadei8fdcac32018-08-28 16:30:18 +020044 ~RtpFrameReferenceFinder();
philipel463d3012016-09-09 03:32:44 -070045
46 // Manage this frame until:
47 // - We have all information needed to determine its references, after
48 // which |frame_callback_| is called with the completed frame, or
philipelafcf7f52017-04-26 08:17:35 -070049 // - We have too many stashed frames (determined by |kMaxStashedFrames|)
philipel463d3012016-09-09 03:32:44 -070050 // so we drop this frame, or
51 // - It gets cleared by ClearTo, which also means we drop it.
philipel02447bc2016-05-13 06:01:03 -070052 void ManageFrame(std::unique_ptr<RtpFrameObject> frame);
philipel463d3012016-09-09 03:32:44 -070053
54 // Notifies that padding has been received, which the reference finder
55 // might need to calculate the references of a frame.
philipel9b2ce6b2016-07-05 05:04:46 -070056 void PaddingReceived(uint16_t seq_num);
philipel02447bc2016-05-13 06:01:03 -070057
philipel463d3012016-09-09 03:32:44 -070058 // Clear all stashed frames that include packets older than |seq_num|.
59 void ClearTo(uint16_t seq_num);
60
philipel02447bc2016-05-13 06:01:03 -070061 private:
philipelfd5a20f2016-11-15 00:57:57 -080062 static const uint16_t kPicIdLength = 1 << 15;
philipel02447bc2016-05-13 06:01:03 -070063 static const uint8_t kMaxTemporalLayers = 5;
philipelfd5a20f2016-11-15 00:57:57 -080064 static const int kMaxLayerInfo = 50;
Sergey Silkin52233a32018-07-31 14:30:54 +020065 static const int kMaxStashedFrames = 100;
philipelfd5a20f2016-11-15 00:57:57 -080066 static const int kMaxNotYetReceivedFrames = 100;
67 static const int kMaxGofSaved = 50;
philipel9b2ce6b2016-07-05 05:04:46 -070068 static const int kMaxPaddingAge = 100;
philipel02447bc2016-05-13 06:01:03 -070069
philipelafcf7f52017-04-26 08:17:35 -070070 enum FrameDecision { kStash, kHandOff, kDrop };
philipelc9b27d52016-07-15 06:50:27 -070071
72 struct GofInfo {
73 GofInfo(GofInfoVP9* gof, uint16_t last_picture_id)
74 : gof(gof), last_picture_id(last_picture_id) {}
75 GofInfoVP9* gof;
76 uint16_t last_picture_id;
77 };
78
philipel02447bc2016-05-13 06:01:03 -070079 rtc::CriticalSection crit_;
80
philipel9b2ce6b2016-07-05 05:04:46 -070081 // Find the relevant group of pictures and update its "last-picture-id-with
82 // padding" sequence number.
83 void UpdateLastPictureIdWithPadding(uint16_t seq_num)
danilchap56359be2017-09-07 07:53:45 -070084 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel9b2ce6b2016-07-05 05:04:46 -070085
philipelafcf7f52017-04-26 08:17:35 -070086 // Retry stashed frames until no more complete frames are found.
danilchap56359be2017-09-07 07:53:45 -070087 void RetryStashedFrames() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -070088
philipelafcf7f52017-04-26 08:17:35 -070089 FrameDecision ManageFrameInternal(RtpFrameObject* frame)
danilchap56359be2017-09-07 07:53:45 -070090 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipelafcf7f52017-04-26 08:17:35 -070091
philipel2837edc2018-10-02 13:55:47 +020092 FrameDecision ManageFrameGeneric(RtpFrameObject* frame,
93 const RtpGenericFrameDescriptor& descriptor)
philipeldabfcae2018-09-25 12:54:37 +020094 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
95
96 // Find references for frames with no or very limited information in the
97 // descriptor. If |picture_id| is unspecified then packet sequence numbers
98 // will be used to determine the references of the frames.
99 FrameDecision ManageFramePidOrSeqNum(RtpFrameObject* frame, int picture_id)
danilchap56359be2017-09-07 07:53:45 -0700100 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700101
philipelafcf7f52017-04-26 08:17:35 -0700102 // Find references for Vp8 frames
103 FrameDecision ManageFrameVp8(RtpFrameObject* frame)
danilchap56359be2017-09-07 07:53:45 -0700104 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipelafcf7f52017-04-26 08:17:35 -0700105
106 // Updates necessary layer info state used to determine frame references for
107 // Vp8.
philipel1610f942017-12-12 13:58:31 +0100108 void UpdateLayerInfoVp8(RtpFrameObject* frame,
philipel57ec6852018-07-03 18:09:32 +0200109 int64_t unwrapped_tl0,
110 uint8_t temporal_idx)
danilchap56359be2017-09-07 07:53:45 -0700111 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700112
113 // Find references for Vp9 frames
philipelafcf7f52017-04-26 08:17:35 -0700114 FrameDecision ManageFrameVp9(RtpFrameObject* frame)
danilchap56359be2017-09-07 07:53:45 -0700115 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700116
117 // Check if we are missing a frame necessary to determine the references
118 // for this frame.
philipelc9b27d52016-07-15 06:50:27 -0700119 bool MissingRequiredFrameVp9(uint16_t picture_id, const GofInfo& info)
danilchap56359be2017-09-07 07:53:45 -0700120 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700121
122 // Updates which frames that have been received. If there is a gap,
123 // missing frames will be added to |missing_frames_for_layer_| or
124 // if this is an already missing frame then it will be removed.
philipelc9b27d52016-07-15 06:50:27 -0700125 void FrameReceivedVp9(uint16_t picture_id, GofInfo* info)
danilchap56359be2017-09-07 07:53:45 -0700126 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700127
128 // Check if there is a frame with the up-switch flag set in the interval
129 // (|pid_ref|, |picture_id|) with temporal layer smaller than |temporal_idx|.
130 bool UpSwitchInIntervalVp9(uint16_t picture_id,
131 uint8_t temporal_idx,
danilchap56359be2017-09-07 07:53:45 -0700132 uint16_t pid_ref)
133 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700134
philipelafcf7f52017-04-26 08:17:35 -0700135 // Unwrap |frame|s picture id and its references to 16 bits.
danilchap56359be2017-09-07 07:53:45 -0700136 void UnwrapPictureIds(RtpFrameObject* frame)
137 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700138
philipel9b2ce6b2016-07-05 05:04:46 -0700139 // For every group of pictures, hold two sequence numbers. The first being
140 // the sequence number of the last packet of the last completed frame, and
141 // the second being the sequence number of the last packet of the last
142 // completed frame advanced by any potential continuous packets of padding.
143 std::map<uint16_t,
144 std::pair<uint16_t, uint16_t>,
145 DescendingSeqNumComp<uint16_t>>
danilchap56359be2017-09-07 07:53:45 -0700146 last_seq_num_gop_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700147
148 // Save the last picture id in order to detect when there is a gap in frames
149 // that have not yet been fully received.
danilchap56359be2017-09-07 07:53:45 -0700150 int last_picture_id_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700151
philipel9b2ce6b2016-07-05 05:04:46 -0700152 // Padding packets that have been received but that are not yet continuous
153 // with any group of pictures.
154 std::set<uint16_t, DescendingSeqNumComp<uint16_t>> stashed_padding_
danilchap56359be2017-09-07 07:53:45 -0700155 RTC_GUARDED_BY(crit_);
philipel9b2ce6b2016-07-05 05:04:46 -0700156
philipel02447bc2016-05-13 06:01:03 -0700157 // Frames earlier than the last received frame that have not yet been
158 // fully received.
159 std::set<uint16_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>
danilchap56359be2017-09-07 07:53:45 -0700160 not_yet_received_frames_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700161
162 // Frames that have been fully received but didn't have all the information
163 // needed to determine their references.
danilchap56359be2017-09-07 07:53:45 -0700164 std::deque<std::unique_ptr<RtpFrameObject>> stashed_frames_
165 RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700166
167 // Holds the information about the last completed frame for a given temporal
philipel57ec6852018-07-03 18:09:32 +0200168 // layer given an unwrapped Tl0 picture index.
169 std::map<int64_t, std::array<int16_t, kMaxTemporalLayers>> layer_info_
170 RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700171
172 // Where the current scalability structure is in the
173 // |scalability_structures_| array.
174 uint8_t current_ss_idx_;
175
176 // Holds received scalability structures.
177 std::array<GofInfoVP9, kMaxGofSaved> scalability_structures_
danilchap56359be2017-09-07 07:53:45 -0700178 RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700179
philipel57ec6852018-07-03 18:09:32 +0200180 // Holds the the Gof information for a given unwrapped TL0 picture index.
181 std::map<int64_t, GofInfo> gof_info_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700182
183 // Keep track of which picture id and which temporal layer that had the
184 // up switch flag set.
philipelc9b27d52016-07-15 06:50:27 -0700185 std::map<uint16_t, uint8_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>
danilchap56359be2017-09-07 07:53:45 -0700186 up_switch_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700187
188 // For every temporal layer, keep a set of which frames that are missing.
189 std::array<std::set<uint16_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>,
190 kMaxTemporalLayers>
danilchap56359be2017-09-07 07:53:45 -0700191 missing_frames_for_layer_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700192
philipel463d3012016-09-09 03:32:44 -0700193 // How far frames have been cleared by sequence number. A frame will be
194 // cleared if it contains a packet with a sequence number older than
195 // |cleared_to_seq_num_|.
danilchap56359be2017-09-07 07:53:45 -0700196 int cleared_to_seq_num_ RTC_GUARDED_BY(crit_);
philipel463d3012016-09-09 03:32:44 -0700197
philipel02447bc2016-05-13 06:01:03 -0700198 OnCompleteFrameCallback* frame_callback_;
philipeld4fac692017-09-04 07:03:46 -0700199
philipeldabfcae2018-09-25 12:54:37 +0200200 SeqNumUnwrapper<uint16_t> generic_frame_id_unwrapper_ RTC_GUARDED_BY(crit_);
201
philipeld4fac692017-09-04 07:03:46 -0700202 // Unwrapper used to unwrap generic RTP streams. In a generic stream we derive
203 // a picture id from the packet sequence number.
philipeldabfcae2018-09-25 12:54:37 +0200204 SeqNumUnwrapper<uint16_t> rtp_seq_num_unwrapper_ RTC_GUARDED_BY(crit_);
philipeld4fac692017-09-04 07:03:46 -0700205
206 // Unwrapper used to unwrap VP8/VP9 streams which have their picture id
207 // specified.
danilchap56359be2017-09-07 07:53:45 -0700208 SeqNumUnwrapper<uint16_t, kPicIdLength> unwrapper_ RTC_GUARDED_BY(crit_);
philipel57ec6852018-07-03 18:09:32 +0200209
210 SeqNumUnwrapper<uint8_t> tl0_unwrapper_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700211};
212
213} // namespace video_coding
214} // namespace webrtc
215
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200216#endif // MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_