/*
 * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */

Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/video_coding/decoding_state.h"
stefan@webrtc.org39670f62011-12-23 09:08:51 +000012
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020013#include "common_video/h264/h264_common.h"
Danil Chapovalov7c067772019-10-07 12:56:24 +020014#include "modules/include/module_common_types_public.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020015#include "modules/video_coding/frame_buffer.h"
16#include "modules/video_coding/jitter_buffer_common.h"
17#include "modules/video_coding/packet.h"
18#include "rtc_base/logging.h"
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000019
20namespace webrtc {
21
22VCMDecodingState::VCMDecodingState()
23 : sequence_num_(0),
24 time_stamp_(0),
25 picture_id_(kNoPictureId),
26 temporal_id_(kNoTemporalIdx),
27 tl0_pic_id_(kNoTl0PicIdx),
28 full_sync_(true),
philipelcfc319b2015-11-10 07:17:23 -080029 in_initial_state_(true) {
30 memset(frame_decoded_, 0, sizeof(frame_decoded_));
31}
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000032
33VCMDecodingState::~VCMDecodingState() {}
34
35void VCMDecodingState::Reset() {
36 // TODO(mikhal): Verify - not always would want to reset the sync
37 sequence_num_ = 0;
38 time_stamp_ = 0;
39 picture_id_ = kNoPictureId;
40 temporal_id_ = kNoTemporalIdx;
41 tl0_pic_id_ = kNoTl0PicIdx;
42 full_sync_ = true;
stefan@webrtc.orga64300a2013-03-04 15:24:40 +000043 in_initial_state_ = true;
philipelcfc319b2015-11-10 07:17:23 -080044 memset(frame_decoded_, 0, sizeof(frame_decoded_));
stefana669a3a2016-10-06 05:04:52 -070045 received_sps_.clear();
46 received_pps_.clear();
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000047}
48
49uint32_t VCMDecodingState::time_stamp() const {
50 return time_stamp_;
51}
52
53uint16_t VCMDecodingState::sequence_num() const {
54 return sequence_num_;
55}
56
57bool VCMDecodingState::IsOldFrame(const VCMFrameBuffer* frame) const {
58 assert(frame != NULL);
stefan@webrtc.orga64300a2013-03-04 15:24:40 +000059 if (in_initial_state_)
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000060 return false;
Niels Möller23775882018-08-16 10:24:12 +020061 return !IsNewerTimestamp(frame->Timestamp(), time_stamp_);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000062}
63
64bool VCMDecodingState::IsOldPacket(const VCMPacket* packet) const {
65 assert(packet != NULL);
stefan@webrtc.orga64300a2013-03-04 15:24:40 +000066 if (in_initial_state_)
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000067 return false;
stefan@webrtc.org7bc465b2013-04-11 17:48:02 +000068 return !IsNewerTimestamp(packet->timestamp, time_stamp_);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000069}
70
71void VCMDecodingState::SetState(const VCMFrameBuffer* frame) {
72 assert(frame != NULL && frame->GetHighSeqNum() >= 0);
philipelcfc319b2015-11-10 07:17:23 -080073 if (!UsingFlexibleMode(frame))
74 UpdateSyncState(frame);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000075 sequence_num_ = static_cast<uint16_t>(frame->GetHighSeqNum());
Niels Möller23775882018-08-16 10:24:12 +020076 time_stamp_ = frame->Timestamp();
mikhal@webrtc.org832caca2011-12-13 21:15:05 +000077 picture_id_ = frame->PictureId();
78 temporal_id_ = frame->TemporalId();
79 tl0_pic_id_ = frame->Tl0PicId();
philipelcfc319b2015-11-10 07:17:23 -080080
stefana669a3a2016-10-06 05:04:52 -070081 for (const NaluInfo& nalu : frame->GetNaluInfos()) {
82 if (nalu.type == H264::NaluType::kPps) {
83 if (nalu.pps_id < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +010084 RTC_LOG(LS_WARNING) << "Received pps without pps id.";
stefana669a3a2016-10-06 05:04:52 -070085 } else if (nalu.sps_id < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +010086 RTC_LOG(LS_WARNING) << "Received pps without sps id.";
stefana669a3a2016-10-06 05:04:52 -070087 } else {
88 received_pps_[nalu.pps_id] = nalu.sps_id;
89 }
90 } else if (nalu.type == H264::NaluType::kSps) {
91 if (nalu.sps_id < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +010092 RTC_LOG(LS_WARNING) << "Received sps without sps id.";
stefana669a3a2016-10-06 05:04:52 -070093 } else {
94 received_sps_.insert(nalu.sps_id);
95 }
96 }
97 }
98
philipelcfc319b2015-11-10 07:17:23 -080099 if (UsingFlexibleMode(frame)) {
100 uint16_t frame_index = picture_id_ % kFrameDecodedLength;
101 if (in_initial_state_) {
102 frame_decoded_cleared_to_ = frame_index;
Niels Möller8f7ce222019-03-21 15:43:58 +0100103 } else if (frame->FrameType() == VideoFrameType::kVideoFrameKey) {
philipelcfc319b2015-11-10 07:17:23 -0800104 memset(frame_decoded_, 0, sizeof(frame_decoded_));
105 frame_decoded_cleared_to_ = frame_index;
106 } else {
107 if (AheadOfFramesDecodedClearedTo(frame_index)) {
108 while (frame_decoded_cleared_to_ != frame_index) {
109 frame_decoded_cleared_to_ =
110 (frame_decoded_cleared_to_ + 1) % kFrameDecodedLength;
111 frame_decoded_[frame_decoded_cleared_to_] = false;
112 }
113 }
114 }
115 frame_decoded_[frame_index] = true;
116 }
117
stefan@webrtc.orga64300a2013-03-04 15:24:40 +0000118 in_initial_state_ = false;
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000119}
120
mikhal@webrtc.org381da4b2013-04-25 21:45:29 +0000121void VCMDecodingState::CopyFrom(const VCMDecodingState& state) {
122 sequence_num_ = state.sequence_num_;
123 time_stamp_ = state.time_stamp_;
124 picture_id_ = state.picture_id_;
125 temporal_id_ = state.temporal_id_;
126 tl0_pic_id_ = state.tl0_pic_id_;
127 full_sync_ = state.full_sync_;
128 in_initial_state_ = state.in_initial_state_;
philipelcfc319b2015-11-10 07:17:23 -0800129 frame_decoded_cleared_to_ = state.frame_decoded_cleared_to_;
130 memcpy(frame_decoded_, state.frame_decoded_, sizeof(frame_decoded_));
stefana669a3a2016-10-06 05:04:52 -0700131 received_sps_ = state.received_sps_;
132 received_pps_ = state.received_pps_;
mikhal@webrtc.org381da4b2013-04-25 21:45:29 +0000133}
134
stefan@webrtc.orgc8b29a22013-06-17 07:13:16 +0000135bool VCMDecodingState::UpdateEmptyFrame(const VCMFrameBuffer* frame) {
136 bool empty_packet = frame->GetHighSeqNum() == frame->GetLowSeqNum();
137 if (in_initial_state_ && empty_packet) {
138 // Drop empty packets as long as we are in the initial state.
139 return true;
stefan@webrtc.org7f3f8bc2013-05-27 07:02:45 +0000140 }
stefan@webrtc.orgc8b29a22013-06-17 07:13:16 +0000141 if ((empty_packet && ContinuousSeqNum(frame->GetHighSeqNum())) ||
142 ContinuousFrame(frame)) {
143 // Continuous empty packets or continuous frames can be dropped if we
144 // advance the sequence number.
145 sequence_num_ = frame->GetHighSeqNum();
Niels Möller23775882018-08-16 10:24:12 +0200146 time_stamp_ = frame->Timestamp();
stefan@webrtc.orgc8b29a22013-06-17 07:13:16 +0000147 return true;
148 }
149 return false;
stefan@webrtc.orgbd941d32012-11-29 14:37:18 +0000150}
151
mikhal@webrtc.org77c425b2012-01-03 20:35:25 +0000152void VCMDecodingState::UpdateOldPacket(const VCMPacket* packet) {
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000153 assert(packet != NULL);
mikhal@webrtc.org77c425b2012-01-03 20:35:25 +0000154 if (packet->timestamp == time_stamp_) {
155 // Late packet belonging to the last decoded frame - make sure we update the
156 // last decoded sequence number.
stefan@webrtc.org7bc465b2013-04-11 17:48:02 +0000157 sequence_num_ = LatestSequenceNumber(packet->seqNum, sequence_num_);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000158 }
159}
160
161void VCMDecodingState::SetSeqNum(uint16_t new_seq_num) {
162 sequence_num_ = new_seq_num;
163}
164
stefan@webrtc.orga64300a2013-03-04 15:24:40 +0000165bool VCMDecodingState::in_initial_state() const {
166 return in_initial_state_;
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000167}
168
169bool VCMDecodingState::full_sync() const {
170 return full_sync_;
171}
172
173void VCMDecodingState::UpdateSyncState(const VCMFrameBuffer* frame) {
stefan@webrtc.orga64300a2013-03-04 15:24:40 +0000174 if (in_initial_state_)
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000175 return;
176 if (frame->TemporalId() == kNoTemporalIdx ||
177 frame->Tl0PicId() == kNoTl0PicIdx) {
178 full_sync_ = true;
Niels Möller8f7ce222019-03-21 15:43:58 +0100179 } else if (frame->FrameType() == VideoFrameType::kVideoFrameKey ||
180 frame->LayerSync()) {
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000181 full_sync_ = true;
182 } else if (full_sync_) {
183 // Verify that we are still in sync.
184 // Sync will be broken if continuity is true for layers but not for the
185 // other methods (PictureId and SeqNum).
stefan@webrtc.orge72e9ee2012-09-19 11:08:05 +0000186 if (UsingPictureId(frame)) {
mikhal@webrtc.org0aeb22e2013-10-28 22:26:14 +0000187 // First check for a valid tl0PicId.
188 if (frame->Tl0PicId() - tl0_pic_id_ > 1) {
189 full_sync_ = false;
190 } else {
191 full_sync_ = ContinuousPictureId(frame->PictureId());
192 }
stefan@webrtc.orge72e9ee2012-09-19 11:08:05 +0000193 } else {
philipel9d3ab612015-12-21 04:12:39 -0800194 full_sync_ =
195 ContinuousSeqNum(static_cast<uint16_t>(frame->GetLowSeqNum()));
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000196 }
197 }
198}
199
200bool VCMDecodingState::ContinuousFrame(const VCMFrameBuffer* frame) const {
201 // Check continuity based on the following hierarchy:
202 // - Temporal layers (stop here if out of sync).
203 // - Picture Id when available.
204 // - Sequence numbers.
205 // Return true when in initial state.
206 // Note that when a method is not applicable it will return false.
207 assert(frame != NULL);
stefan@webrtc.orgc8b29a22013-06-17 07:13:16 +0000208 // A key frame is always considered continuous as it doesn't refer to any
209 // frames and therefore won't introduce any errors even if prior frames are
210 // missing.
Niels Möller8f7ce222019-03-21 15:43:58 +0100211 if (frame->FrameType() == VideoFrameType::kVideoFrameKey &&
stefana669a3a2016-10-06 05:04:52 -0700212 HaveSpsAndPps(frame->GetNaluInfos())) {
stefan@webrtc.orgc8b29a22013-06-17 07:13:16 +0000213 return true;
stefana669a3a2016-10-06 05:04:52 -0700214 }
stefan@webrtc.orgc8b29a22013-06-17 07:13:16 +0000215 // When in the initial state we always require a key frame to start decoding.
216 if (in_initial_state_)
mikhal@webrtc.org8392cd92013-04-25 21:30:50 +0000217 return false;
mikhal@webrtc.org0aeb22e2013-10-28 22:26:14 +0000218 if (ContinuousLayer(frame->TemporalId(), frame->Tl0PicId()))
219 return true;
220 // tl0picId is either not used, or should remain unchanged.
221 if (frame->Tl0PicId() != tl0_pic_id_)
222 return false;
223 // Base layers are not continuous or temporal layers are inactive.
224 // In the presence of temporal layers, check for Picture ID/sequence number
225 // continuity if sync can be restored by this frame.
226 if (!full_sync_ && !frame->LayerSync())
227 return false;
228 if (UsingPictureId(frame)) {
philipelcfc319b2015-11-10 07:17:23 -0800229 if (UsingFlexibleMode(frame)) {
230 return ContinuousFrameRefs(frame);
231 } else {
232 return ContinuousPictureId(frame->PictureId());
233 }
mikhal@webrtc.org0aeb22e2013-10-28 22:26:14 +0000234 } else {
stefana669a3a2016-10-06 05:04:52 -0700235 return ContinuousSeqNum(static_cast<uint16_t>(frame->GetLowSeqNum())) &&
236 HaveSpsAndPps(frame->GetNaluInfos());
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000237 }
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000238}
239
240bool VCMDecodingState::ContinuousPictureId(int picture_id) const {
stefan@webrtc.org39670f62011-12-23 09:08:51 +0000241 int next_picture_id = picture_id_ + 1;
242 if (picture_id < picture_id_) {
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000243 // Wrap
stefan@webrtc.org39670f62011-12-23 09:08:51 +0000244 if (picture_id_ >= 0x80) {
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000245 // 15 bits used for picture id
stefan@webrtc.org39670f62011-12-23 09:08:51 +0000246 return ((next_picture_id & 0x7FFF) == picture_id);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000247 } else {
248 // 7 bits used for picture id
stefan@webrtc.org39670f62011-12-23 09:08:51 +0000249 return ((next_picture_id & 0x7F) == picture_id);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000250 }
251 }
252 // No wrap
stefan@webrtc.org39670f62011-12-23 09:08:51 +0000253 return (next_picture_id == picture_id);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000254}
255
256bool VCMDecodingState::ContinuousSeqNum(uint16_t seq_num) const {
pbos@webrtc.org4f16c872014-11-24 09:06:48 +0000257 return seq_num == static_cast<uint16_t>(sequence_num_ + 1);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000258}
259
philipel9d3ab612015-12-21 04:12:39 -0800260bool VCMDecodingState::ContinuousLayer(int temporal_id, int tl0_pic_id) const {
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000261 // First, check if applicable.
262 if (temporal_id == kNoTemporalIdx || tl0_pic_id == kNoTl0PicIdx)
263 return false;
264 // If this is the first frame to use temporal layers, make sure we start
265 // from base.
266 else if (tl0_pic_id_ == kNoTl0PicIdx && temporal_id_ == kNoTemporalIdx &&
267 temporal_id == 0)
268 return true;
269
mikhal@webrtc.org884d8e72011-12-19 18:53:05 +0000270 // Current implementation: Look for base layer continuity.
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000271 if (temporal_id != 0)
272 return false;
stefan@webrtc.org39670f62011-12-23 09:08:51 +0000273 return (static_cast<uint8_t>(tl0_pic_id_ + 1) == tl0_pic_id);
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000274}
275
philipelcfc319b2015-11-10 07:17:23 -0800276bool VCMDecodingState::ContinuousFrameRefs(const VCMFrameBuffer* frame) const {
277 uint8_t num_refs = frame->CodecSpecific()->codecSpecific.VP9.num_ref_pics;
278 for (uint8_t r = 0; r < num_refs; ++r) {
279 uint16_t frame_ref = frame->PictureId() -
280 frame->CodecSpecific()->codecSpecific.VP9.p_diff[r];
281 uint16_t frame_index = frame_ref % kFrameDecodedLength;
282 if (AheadOfFramesDecodedClearedTo(frame_index) ||
283 !frame_decoded_[frame_index]) {
284 return false;
285 }
286 }
287 return true;
288}
289
stefan@webrtc.orge72e9ee2012-09-19 11:08:05 +0000290bool VCMDecodingState::UsingPictureId(const VCMFrameBuffer* frame) const {
291 return (frame->PictureId() != kNoPictureId && picture_id_ != kNoPictureId);
292}
293
philipelcfc319b2015-11-10 07:17:23 -0800294bool VCMDecodingState::UsingFlexibleMode(const VCMFrameBuffer* frame) const {
philipelee414d92016-11-29 07:01:23 -0800295 bool is_flexible_mode =
296 frame->CodecSpecific()->codecType == kVideoCodecVP9 &&
297 frame->CodecSpecific()->codecSpecific.VP9.flexible_mode;
298 if (is_flexible_mode && frame->PictureId() == kNoPictureId) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100299 RTC_LOG(LS_WARNING) << "Frame is marked as using flexible mode but no"
300 << "picture id is set.";
philipelee414d92016-11-29 07:01:23 -0800301 return false;
302 }
303 return is_flexible_mode;
philipelcfc319b2015-11-10 07:17:23 -0800304}
305
306// TODO(philipel): change how check work, this check practially
307// limits the max p_diff to 64.
308bool VCMDecodingState::AheadOfFramesDecodedClearedTo(uint16_t index) const {
309 // No way of knowing for sure if we are actually ahead of
310 // frame_decoded_cleared_to_. We just make the assumption
311 // that we are not trying to reference back to a very old
312 // index, but instead are referencing a newer index.
313 uint16_t diff =
314 index > frame_decoded_cleared_to_
315 ? kFrameDecodedLength - (index - frame_decoded_cleared_to_)
316 : frame_decoded_cleared_to_ - index;
317 return diff > kFrameDecodedLength / 2;
318}
319
stefana669a3a2016-10-06 05:04:52 -0700320bool VCMDecodingState::HaveSpsAndPps(const std::vector<NaluInfo>& nalus) const {
321 std::set<int> new_sps;
322 std::map<int, int> new_pps;
323 for (const NaluInfo& nalu : nalus) {
324 // Check if this nalu actually contains sps/pps information or dependencies.
325 if (nalu.sps_id == -1 && nalu.pps_id == -1)
326 continue;
327 switch (nalu.type) {
328 case H264::NaluType::kPps:
329 if (nalu.pps_id < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100330 RTC_LOG(LS_WARNING) << "Received pps without pps id.";
stefana669a3a2016-10-06 05:04:52 -0700331 } else if (nalu.sps_id < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100332 RTC_LOG(LS_WARNING) << "Received pps without sps id.";
stefana669a3a2016-10-06 05:04:52 -0700333 } else {
334 new_pps[nalu.pps_id] = nalu.sps_id;
335 }
336 break;
337 case H264::NaluType::kSps:
338 if (nalu.sps_id < 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100339 RTC_LOG(LS_WARNING) << "Received sps without sps id.";
stefana669a3a2016-10-06 05:04:52 -0700340 } else {
341 new_sps.insert(nalu.sps_id);
342 }
343 break;
344 default: {
345 int needed_sps = -1;
346 auto pps_it = new_pps.find(nalu.pps_id);
347 if (pps_it != new_pps.end()) {
348 needed_sps = pps_it->second;
349 } else {
350 auto pps_it2 = received_pps_.find(nalu.pps_id);
351 if (pps_it2 == received_pps_.end()) {
352 return false;
353 }
354 needed_sps = pps_it2->second;
355 }
356 if (new_sps.find(needed_sps) == new_sps.end() &&
357 received_sps_.find(needed_sps) == received_sps_.end()) {
358 return false;
359 }
360 break;
361 }
362 }
363 }
364 return true;
365}
366
mikhal@webrtc.org832caca2011-12-13 21:15:05 +0000367} // namespace webrtc