blob: e6f7aa8559948946bbce2741a73e1a93c031430e [file] [log] [blame]
/*
 *  Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS. All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#ifndef MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_
12#define MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_
philipel02447bc2016-05-13 06:01:03 -070013
14#include <array>
Yves Gerey665174f2018-06-19 15:03:05 +020015#include <deque>
philipel02447bc2016-05-13 06:01:03 -070016#include <map>
kwibergfd8be342016-05-14 19:44:11 -070017#include <memory>
philipel02447bc2016-05-13 06:01:03 -070018#include <set>
19#include <utility>
20
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020021#include "modules/include/module_common_types.h"
philipel2837edc2018-10-02 13:55:47 +020022#include "modules/rtp_rtcp/source/rtp_generic_frame_descriptor.h"
Steve Anton10542f22019-01-11 09:11:00 -080023#include "rtc_base/critical_section.h"
Bjorn Tereliusa194e582017-10-25 13:07:09 +020024#include "rtc_base/numerics/sequence_number_util.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "rtc_base/thread_annotations.h"
philipel02447bc2016-05-13 06:01:03 -070026
27namespace webrtc {
28namespace video_coding {
29
// Forward declarations; only pointers/smart pointers to these types are used
// in this header, so the full definitions are not needed here.
class EncodedFrame;
class RtpFrameObject;

// Callback interface used to deliver complete frames.
//
// A complete frame is a frame which has received all its packets and all its
// references are known.
class OnCompleteFrameCallback {
 public:
  // Virtual so that implementations can be destroyed through a pointer to
  // this interface.
  virtual ~OnCompleteFrameCallback() = default;

  // Called with a complete frame. |frame| is passed as a std::unique_ptr by
  // value, so ownership of the frame is transferred to the implementation.
  virtual void OnCompleteFrame(std::unique_ptr<EncodedFrame> frame) = 0;
};
philipel02447bc2016-05-13 06:01:03 -070040
41class RtpFrameReferenceFinder {
42 public:
43 explicit RtpFrameReferenceFinder(OnCompleteFrameCallback* frame_callback);
Mirko Bonadei8fdcac32018-08-28 16:30:18 +020044 ~RtpFrameReferenceFinder();
philipel463d3012016-09-09 03:32:44 -070045
46 // Manage this frame until:
47 // - We have all information needed to determine its references, after
48 // which |frame_callback_| is called with the completed frame, or
philipelafcf7f52017-04-26 08:17:35 -070049 // - We have too many stashed frames (determined by |kMaxStashedFrames|)
philipel463d3012016-09-09 03:32:44 -070050 // so we drop this frame, or
51 // - It gets cleared by ClearTo, which also means we drop it.
philipel02447bc2016-05-13 06:01:03 -070052 void ManageFrame(std::unique_ptr<RtpFrameObject> frame);
philipel463d3012016-09-09 03:32:44 -070053
54 // Notifies that padding has been received, which the reference finder
55 // might need to calculate the references of a frame.
philipel9b2ce6b2016-07-05 05:04:46 -070056 void PaddingReceived(uint16_t seq_num);
philipel02447bc2016-05-13 06:01:03 -070057
philipel463d3012016-09-09 03:32:44 -070058 // Clear all stashed frames that include packets older than |seq_num|.
59 void ClearTo(uint16_t seq_num);
60
philipel02447bc2016-05-13 06:01:03 -070061 private:
philipelfd5a20f2016-11-15 00:57:57 -080062 static const uint16_t kPicIdLength = 1 << 15;
philipel02447bc2016-05-13 06:01:03 -070063 static const uint8_t kMaxTemporalLayers = 5;
philipelfd5a20f2016-11-15 00:57:57 -080064 static const int kMaxLayerInfo = 50;
Sergey Silkin52233a32018-07-31 14:30:54 +020065 static const int kMaxStashedFrames = 100;
philipelfd5a20f2016-11-15 00:57:57 -080066 static const int kMaxNotYetReceivedFrames = 100;
67 static const int kMaxGofSaved = 50;
philipel9b2ce6b2016-07-05 05:04:46 -070068 static const int kMaxPaddingAge = 100;
philipel02447bc2016-05-13 06:01:03 -070069
philipelafcf7f52017-04-26 08:17:35 -070070 enum FrameDecision { kStash, kHandOff, kDrop };
philipelc9b27d52016-07-15 06:50:27 -070071
72 struct GofInfo {
73 GofInfo(GofInfoVP9* gof, uint16_t last_picture_id)
74 : gof(gof), last_picture_id(last_picture_id) {}
75 GofInfoVP9* gof;
76 uint16_t last_picture_id;
77 };
78
philipel02447bc2016-05-13 06:01:03 -070079 rtc::CriticalSection crit_;
80
philipel9b2ce6b2016-07-05 05:04:46 -070081 // Find the relevant group of pictures and update its "last-picture-id-with
82 // padding" sequence number.
83 void UpdateLastPictureIdWithPadding(uint16_t seq_num)
danilchap56359be2017-09-07 07:53:45 -070084 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel9b2ce6b2016-07-05 05:04:46 -070085
philipelafcf7f52017-04-26 08:17:35 -070086 // Retry stashed frames until no more complete frames are found.
danilchap56359be2017-09-07 07:53:45 -070087 void RetryStashedFrames() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -070088
philipelafcf7f52017-04-26 08:17:35 -070089 FrameDecision ManageFrameInternal(RtpFrameObject* frame)
danilchap56359be2017-09-07 07:53:45 -070090 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipelafcf7f52017-04-26 08:17:35 -070091
philipel2837edc2018-10-02 13:55:47 +020092 FrameDecision ManageFrameGeneric(RtpFrameObject* frame,
93 const RtpGenericFrameDescriptor& descriptor)
philipeldabfcae2018-09-25 12:54:37 +020094 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
95
96 // Find references for frames with no or very limited information in the
97 // descriptor. If |picture_id| is unspecified then packet sequence numbers
98 // will be used to determine the references of the frames.
99 FrameDecision ManageFramePidOrSeqNum(RtpFrameObject* frame, int picture_id)
danilchap56359be2017-09-07 07:53:45 -0700100 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700101
philipelafcf7f52017-04-26 08:17:35 -0700102 // Find references for Vp8 frames
103 FrameDecision ManageFrameVp8(RtpFrameObject* frame)
danilchap56359be2017-09-07 07:53:45 -0700104 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipelafcf7f52017-04-26 08:17:35 -0700105
106 // Updates necessary layer info state used to determine frame references for
107 // Vp8.
philipel1610f942017-12-12 13:58:31 +0100108 void UpdateLayerInfoVp8(RtpFrameObject* frame,
philipel57ec6852018-07-03 18:09:32 +0200109 int64_t unwrapped_tl0,
110 uint8_t temporal_idx)
danilchap56359be2017-09-07 07:53:45 -0700111 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700112
113 // Find references for Vp9 frames
philipelafcf7f52017-04-26 08:17:35 -0700114 FrameDecision ManageFrameVp9(RtpFrameObject* frame)
danilchap56359be2017-09-07 07:53:45 -0700115 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700116
117 // Check if we are missing a frame necessary to determine the references
118 // for this frame.
philipelc9b27d52016-07-15 06:50:27 -0700119 bool MissingRequiredFrameVp9(uint16_t picture_id, const GofInfo& info)
danilchap56359be2017-09-07 07:53:45 -0700120 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700121
122 // Updates which frames that have been received. If there is a gap,
123 // missing frames will be added to |missing_frames_for_layer_| or
124 // if this is an already missing frame then it will be removed.
philipelc9b27d52016-07-15 06:50:27 -0700125 void FrameReceivedVp9(uint16_t picture_id, GofInfo* info)
danilchap56359be2017-09-07 07:53:45 -0700126 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700127
128 // Check if there is a frame with the up-switch flag set in the interval
129 // (|pid_ref|, |picture_id|) with temporal layer smaller than |temporal_idx|.
130 bool UpSwitchInIntervalVp9(uint16_t picture_id,
131 uint8_t temporal_idx,
danilchap56359be2017-09-07 07:53:45 -0700132 uint16_t pid_ref)
133 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700134
philipelafcf7f52017-04-26 08:17:35 -0700135 // Unwrap |frame|s picture id and its references to 16 bits.
danilchap56359be2017-09-07 07:53:45 -0700136 void UnwrapPictureIds(RtpFrameObject* frame)
137 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
philipel02447bc2016-05-13 06:01:03 -0700138
Johnny Leebc7f41b2019-05-01 14:41:32 -0400139 // Find references for H264 frames
140 FrameDecision ManageFrameH264(RtpFrameObject* frame)
141 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
142
143 // Update "last-picture-id-with-padding" sequence number for H264.
Jonas Olssona4d87372019-07-05 19:08:33 +0200144 void UpdateLastPictureIdWithPaddingH264() RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
Johnny Leebc7f41b2019-05-01 14:41:32 -0400145
146 // Update H264 layer info state used to determine frame references.
147 void UpdateLayerInfoH264(RtpFrameObject* frame,
148 int64_t unwrapped_tl0,
149 uint8_t temporal_idx)
150 RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
151
152 // Update H264 state for decodeable frames.
153 void UpdateDataH264(RtpFrameObject* frame,
154 int64_t unwrapped_tl0,
Jonas Olssona4d87372019-07-05 19:08:33 +0200155 uint8_t temporal_idx) RTC_EXCLUSIVE_LOCKS_REQUIRED(crit_);
Johnny Leebc7f41b2019-05-01 14:41:32 -0400156
philipel9b2ce6b2016-07-05 05:04:46 -0700157 // For every group of pictures, hold two sequence numbers. The first being
158 // the sequence number of the last packet of the last completed frame, and
159 // the second being the sequence number of the last packet of the last
160 // completed frame advanced by any potential continuous packets of padding.
161 std::map<uint16_t,
162 std::pair<uint16_t, uint16_t>,
163 DescendingSeqNumComp<uint16_t>>
danilchap56359be2017-09-07 07:53:45 -0700164 last_seq_num_gop_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700165
166 // Save the last picture id in order to detect when there is a gap in frames
167 // that have not yet been fully received.
danilchap56359be2017-09-07 07:53:45 -0700168 int last_picture_id_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700169
philipel9b2ce6b2016-07-05 05:04:46 -0700170 // Padding packets that have been received but that are not yet continuous
171 // with any group of pictures.
172 std::set<uint16_t, DescendingSeqNumComp<uint16_t>> stashed_padding_
danilchap56359be2017-09-07 07:53:45 -0700173 RTC_GUARDED_BY(crit_);
philipel9b2ce6b2016-07-05 05:04:46 -0700174
philipel02447bc2016-05-13 06:01:03 -0700175 // Frames earlier than the last received frame that have not yet been
176 // fully received.
177 std::set<uint16_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>
danilchap56359be2017-09-07 07:53:45 -0700178 not_yet_received_frames_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700179
Johnny Leebc7f41b2019-05-01 14:41:32 -0400180 // Sequence numbers of frames earlier than the last received frame that
181 // have not yet been fully received.
Jonas Olssona4d87372019-07-05 19:08:33 +0200182 std::set<uint16_t, DescendingSeqNumComp<uint16_t>> not_yet_received_seq_num_
183 RTC_GUARDED_BY(crit_);
Johnny Leebc7f41b2019-05-01 14:41:32 -0400184
philipel02447bc2016-05-13 06:01:03 -0700185 // Frames that have been fully received but didn't have all the information
186 // needed to determine their references.
danilchap56359be2017-09-07 07:53:45 -0700187 std::deque<std::unique_ptr<RtpFrameObject>> stashed_frames_
188 RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700189
190 // Holds the information about the last completed frame for a given temporal
philipel57ec6852018-07-03 18:09:32 +0200191 // layer given an unwrapped Tl0 picture index.
Johnny Leebc7f41b2019-05-01 14:41:32 -0400192 std::map<int64_t, std::array<int64_t, kMaxTemporalLayers>> layer_info_
philipel57ec6852018-07-03 18:09:32 +0200193 RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700194
195 // Where the current scalability structure is in the
196 // |scalability_structures_| array.
197 uint8_t current_ss_idx_;
198
199 // Holds received scalability structures.
200 std::array<GofInfoVP9, kMaxGofSaved> scalability_structures_
danilchap56359be2017-09-07 07:53:45 -0700201 RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700202
philipel57ec6852018-07-03 18:09:32 +0200203 // Holds the the Gof information for a given unwrapped TL0 picture index.
204 std::map<int64_t, GofInfo> gof_info_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700205
206 // Keep track of which picture id and which temporal layer that had the
207 // up switch flag set.
philipelc9b27d52016-07-15 06:50:27 -0700208 std::map<uint16_t, uint8_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>
danilchap56359be2017-09-07 07:53:45 -0700209 up_switch_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700210
211 // For every temporal layer, keep a set of which frames that are missing.
212 std::array<std::set<uint16_t, DescendingSeqNumComp<uint16_t, kPicIdLength>>,
213 kMaxTemporalLayers>
danilchap56359be2017-09-07 07:53:45 -0700214 missing_frames_for_layer_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700215
philipel463d3012016-09-09 03:32:44 -0700216 // How far frames have been cleared by sequence number. A frame will be
217 // cleared if it contains a packet with a sequence number older than
218 // |cleared_to_seq_num_|.
danilchap56359be2017-09-07 07:53:45 -0700219 int cleared_to_seq_num_ RTC_GUARDED_BY(crit_);
philipel463d3012016-09-09 03:32:44 -0700220
philipel02447bc2016-05-13 06:01:03 -0700221 OnCompleteFrameCallback* frame_callback_;
philipeld4fac692017-09-04 07:03:46 -0700222
philipeldabfcae2018-09-25 12:54:37 +0200223 SeqNumUnwrapper<uint16_t> generic_frame_id_unwrapper_ RTC_GUARDED_BY(crit_);
224
philipeld4fac692017-09-04 07:03:46 -0700225 // Unwrapper used to unwrap generic RTP streams. In a generic stream we derive
226 // a picture id from the packet sequence number.
philipeldabfcae2018-09-25 12:54:37 +0200227 SeqNumUnwrapper<uint16_t> rtp_seq_num_unwrapper_ RTC_GUARDED_BY(crit_);
philipeld4fac692017-09-04 07:03:46 -0700228
229 // Unwrapper used to unwrap VP8/VP9 streams which have their picture id
230 // specified.
danilchap56359be2017-09-07 07:53:45 -0700231 SeqNumUnwrapper<uint16_t, kPicIdLength> unwrapper_ RTC_GUARDED_BY(crit_);
philipel57ec6852018-07-03 18:09:32 +0200232
233 SeqNumUnwrapper<uint8_t> tl0_unwrapper_ RTC_GUARDED_BY(crit_);
philipel02447bc2016-05-13 06:01:03 -0700234};
235
236} // namespace video_coding
237} // namespace webrtc
238
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200239#endif // MODULES_VIDEO_CODING_RTP_FRAME_REFERENCE_FINDER_H_