blob: da0ec5b2648ff1122b70d2bb750bbf3a6a9a0203 [file] [log] [blame]
/*
 *  Copyright (c) 2014 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 *
 */
11
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020012#include "modules/video_coding/codecs/vp9/vp9_impl.h"
marpan@webrtc.org5b883172014-11-01 06:10:48 +000013
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +020014#include <algorithm>
Sergey Silkind45b3452018-05-31 16:00:24 +020015#include <limits>
marpan@webrtc.org5b883172014-11-01 06:10:48 +000016#include <vector>
17
marpan@webrtc.org5b883172014-11-01 06:10:48 +000018#include "vpx/vp8cx.h"
19#include "vpx/vp8dx.h"
Yves Gerey665174f2018-06-19 15:03:05 +020020#include "vpx/vpx_decoder.h"
21#include "vpx/vpx_encoder.h"
marpan@webrtc.org5b883172014-11-01 06:10:48 +000022
Karl Wiberg918f50c2018-07-05 11:40:33 +020023#include "absl/memory/memory.h"
Emircan Uysaler800787f2018-07-16 10:01:49 -070024#include "api/video/color_space.h"
Emircan Uysaler0823eec2018-07-13 17:10:00 -070025#include "api/video/i010_buffer.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020026#include "common_video/include/video_frame_buffer.h"
27#include "common_video/libyuv/include/webrtc_libyuv.h"
Sergey Silkind902d582018-05-18 17:31:19 +020028#include "modules/rtp_rtcp/include/rtp_rtcp_defines.h"
Sergey Silkin86684962018-03-28 19:32:37 +020029#include "modules/video_coding/codecs/vp9/svc_rate_allocator.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020030#include "rtc_base/checks.h"
31#include "rtc_base/keep_ref_until_done.h"
32#include "rtc_base/logging.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020033#include "rtc_base/timeutils.h"
34#include "rtc_base/trace_event.h"
marpan@webrtc.org5b883172014-11-01 06:10:48 +000035
36namespace webrtc {
37
namespace {
// Target frame rate, in frames per second, that InitEncode() installs when the
// codec is configured for screen sharing.
constexpr float kMaxScreenSharingFramerateFps = 5.0f;
}  // namespace
41
// Returns the libvpx "cpu used" speed setting for the given frame size.
// Only positive speeds, range for real-time coding currently is: 5 - 8.
// Lower means slower/better quality, higher means fastest/lower quality.
int GetCpuSpeed(int width, int height) {
// WEBRTC_ANDROID is accepted alongside ANDROID so that this guard matches the
// platform check used by VP9EncoderImpl::NumberOfThreads().
#if defined(WEBRTC_ARCH_ARM) || defined(WEBRTC_ARCH_ARM64) || \
    defined(ANDROID) || defined(WEBRTC_ANDROID)
  return 8;
#else
  // For smaller resolutions, use lower speed setting (get some coding gain at
  // the cost of increased encoding complexity).
  const bool is_small_resolution = (width * height <= 352 * 288);
  return is_small_resolution ? 5 : 7;
#endif
}
56
Emircan Uysaler98badbc2018-06-28 10:59:02 -070057std::vector<SdpVideoFormat> SupportedVP9Codecs() {
Emircan Uysaler0823eec2018-07-13 17:10:00 -070058 // TODO(emircan): Add Profile 2 support after fixing browser_tests.
59 std::vector<SdpVideoFormat> supported_formats{SdpVideoFormat(
60 cricket::kVp9CodecName,
61 {{kVP9FmtpProfileId, VP9ProfileToString(VP9Profile::kProfile0)}})};
62 return supported_formats;
Peter Boström12996152016-05-14 02:03:18 +020063}
64
Magnus Jedvert46a27652017-11-13 14:10:02 +010065std::unique_ptr<VP9Encoder> VP9Encoder::Create() {
Karl Wiberg918f50c2018-07-05 11:40:33 +020066 return absl::make_unique<VP9EncoderImpl>(cricket::VideoCodec());
Emircan Uysaler98badbc2018-06-28 10:59:02 -070067}
68
69std::unique_ptr<VP9Encoder> VP9Encoder::Create(
70 const cricket::VideoCodec& codec) {
Karl Wiberg918f50c2018-07-05 11:40:33 +020071 return absl::make_unique<VP9EncoderImpl>(codec);
marpan@webrtc.org5b883172014-11-01 06:10:48 +000072}
73
asaperssona9455ab2015-07-31 06:10:09 -070074void VP9EncoderImpl::EncoderOutputCodedPacketCallback(vpx_codec_cx_pkt* pkt,
75 void* user_data) {
philipelcce46fc2015-12-21 03:04:49 -080076 VP9EncoderImpl* enc = static_cast<VP9EncoderImpl*>(user_data);
asaperssona9455ab2015-07-31 06:10:09 -070077 enc->GetEncodedLayerFrame(pkt);
78}
79
Emircan Uysaler98badbc2018-06-28 10:59:02 -070080VP9EncoderImpl::VP9EncoderImpl(const cricket::VideoCodec& codec)
marpan@webrtc.org5b883172014-11-01 06:10:48 +000081 : encoded_image_(),
sprang3958ed82017-08-17 08:12:10 -070082 encoded_complete_callback_(nullptr),
Emircan Uysaler98badbc2018-06-28 10:59:02 -070083 profile_(
84 ParseSdpForVP9Profile(codec.params).value_or(VP9Profile::kProfile0)),
marpan@webrtc.org5b883172014-11-01 06:10:48 +000085 inited_(false),
86 timestamp_(0),
marpan@webrtc.org5b883172014-11-01 06:10:48 +000087 cpu_speed_(3),
88 rc_max_intra_target_(0),
sprang3958ed82017-08-17 08:12:10 -070089 encoder_(nullptr),
90 config_(nullptr),
91 raw_(nullptr),
92 input_image_(nullptr),
Sergey Silkinbd0954e2018-05-03 14:14:09 +020093 force_key_frame_(true),
Sergey Silkin6a8f30e2018-04-26 11:03:49 +020094 pics_since_key_(0),
asaperssona9455ab2015-07-31 06:10:09 -070095 num_temporal_layers_(0),
philipelcfc319b2015-11-10 07:17:23 -080096 num_spatial_layers_(0),
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +020097 is_svc_(false),
Sergey Silkin6a8f30e2018-04-26 11:03:49 +020098 inter_layer_pred_(InterLayerPredMode::kOn),
Sergey Silkind902d582018-05-18 17:31:19 +020099 output_framerate_(1000.0, 1000.0),
100 last_encoded_frame_rtp_timestamp_(0),
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200101 is_flexible_mode_(false) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000102 memset(&codec_, 0, sizeof(codec_));
johannkoenig8225c402017-01-26 13:23:44 -0800103 memset(&svc_params_, 0, sizeof(vpx_svc_extra_cfg_t));
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000104}
105
106VP9EncoderImpl::~VP9EncoderImpl() {
107 Release();
108}
109
110int VP9EncoderImpl::Release() {
Sergey Silkin3e871ea2018-03-02 13:11:04 +0100111 int ret_val = WEBRTC_VIDEO_CODEC_OK;
112
sprang3958ed82017-08-17 08:12:10 -0700113 if (encoded_image_._buffer != nullptr) {
philipelcce46fc2015-12-21 03:04:49 -0800114 delete[] encoded_image_._buffer;
sprang3958ed82017-08-17 08:12:10 -0700115 encoded_image_._buffer = nullptr;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000116 }
sprang3958ed82017-08-17 08:12:10 -0700117 if (encoder_ != nullptr) {
Sergey Silkin90399692018-03-02 14:44:10 +0100118 if (inited_) {
119 if (vpx_codec_destroy(encoder_)) {
120 ret_val = WEBRTC_VIDEO_CODEC_MEMORY;
121 }
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000122 }
123 delete encoder_;
sprang3958ed82017-08-17 08:12:10 -0700124 encoder_ = nullptr;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000125 }
sprang3958ed82017-08-17 08:12:10 -0700126 if (config_ != nullptr) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000127 delete config_;
sprang3958ed82017-08-17 08:12:10 -0700128 config_ = nullptr;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000129 }
sprang3958ed82017-08-17 08:12:10 -0700130 if (raw_ != nullptr) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000131 vpx_img_free(raw_);
sprang3958ed82017-08-17 08:12:10 -0700132 raw_ = nullptr;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000133 }
134 inited_ = false;
Sergey Silkin3e871ea2018-03-02 13:11:04 +0100135 return ret_val;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000136}
137
sprangce4aef12015-11-02 07:23:20 -0800138bool VP9EncoderImpl::ExplicitlyConfiguredSpatialLayers() const {
139 // We check target_bitrate_bps of the 0th layer to see if the spatial layers
140 // (i.e. bitrates) were explicitly configured.
Sergey Silkin13e74342018-03-02 12:28:00 +0100141 return num_spatial_layers_ > 1 && codec_.spatialLayers[0].targetBitrate > 0;
sprangce4aef12015-11-02 07:23:20 -0800142}
143
Erik Språng566124a2018-04-23 12:32:22 +0200144bool VP9EncoderImpl::SetSvcRates(
145 const VideoBitrateAllocation& bitrate_allocation) {
asaperssona9455ab2015-07-31 06:10:09 -0700146 uint8_t i = 0;
147
Sergey Silkin86684962018-03-28 19:32:37 +0200148 config_->rc_target_bitrate = bitrate_allocation.get_sum_kbps();
Sergey Silkin86684962018-03-28 19:32:37 +0200149
“Michael23c5a992018-06-21 11:07:21 -0500150 num_active_spatial_layers_ = 0;
151 for (i = 0; i < num_spatial_layers_; ++i)
152 num_active_spatial_layers_ += bitrate_allocation.IsSpatialLayerUsed(i);
153 RTC_DCHECK_GT(num_active_spatial_layers_, 0);
154 RTC_DCHECK_LE(num_active_spatial_layers_, num_spatial_layers_);
155
sprangce4aef12015-11-02 07:23:20 -0800156 if (ExplicitlyConfiguredSpatialLayers()) {
Sergey Silkin86684962018-03-28 19:32:37 +0200157 for (size_t sl_idx = 0; sl_idx < num_spatial_layers_; ++sl_idx) {
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200158 const bool was_layer_enabled = (config_->ss_target_bitrate[sl_idx] > 0);
Sergey Silkin86684962018-03-28 19:32:37 +0200159 config_->ss_target_bitrate[sl_idx] =
160 bitrate_allocation.GetSpatialLayerSum(sl_idx) / 1000;
161
162 for (size_t tl_idx = 0; tl_idx < num_temporal_layers_; ++tl_idx) {
163 config_->layer_target_bitrate[sl_idx * num_temporal_layers_ + tl_idx] =
164 bitrate_allocation.GetTemporalLayerSum(sl_idx, tl_idx) / 1000;
165 }
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200166
167 const bool is_layer_enabled = (config_->ss_target_bitrate[sl_idx] > 0);
168 if (is_layer_enabled && !was_layer_enabled) {
169 if (inter_layer_pred_ == InterLayerPredMode::kOff ||
170 inter_layer_pred_ == InterLayerPredMode::kOnKeyPic) {
171 // TODO(wemb:1526): remove key frame request when issue is fixed.
172 force_key_frame_ = true;
173 }
174 }
sprangce4aef12015-11-02 07:23:20 -0800175 }
176 } else {
177 float rate_ratio[VPX_MAX_LAYERS] = {0};
178 float total = 0;
“Michael67c8bcf2018-06-27 04:24:13 -0500179 for (i = 0; i < num_spatial_layers_; ++i) {
johannkoenig8225c402017-01-26 13:23:44 -0800180 if (svc_params_.scaling_factor_num[i] <= 0 ||
181 svc_params_.scaling_factor_den[i] <= 0) {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100182 RTC_LOG(LS_ERROR) << "Scaling factors not specified!";
sprangce4aef12015-11-02 07:23:20 -0800183 return false;
184 }
Yves Gerey665174f2018-06-19 15:03:05 +0200185 rate_ratio[i] = static_cast<float>(svc_params_.scaling_factor_num[i]) /
186 svc_params_.scaling_factor_den[i];
sprangce4aef12015-11-02 07:23:20 -0800187 total += rate_ratio[i];
188 }
189
“Michael67c8bcf2018-06-27 04:24:13 -0500190 for (i = 0; i < num_spatial_layers_; ++i) {
Rasmus Brandt58cd3852018-06-26 13:41:16 +0200191 RTC_CHECK_GT(total, 0);
sprangce4aef12015-11-02 07:23:20 -0800192 config_->ss_target_bitrate[i] = static_cast<unsigned int>(
193 config_->rc_target_bitrate * rate_ratio[i] / total);
194 if (num_temporal_layers_ == 1) {
195 config_->layer_target_bitrate[i] = config_->ss_target_bitrate[i];
196 } else if (num_temporal_layers_ == 2) {
197 config_->layer_target_bitrate[i * num_temporal_layers_] =
198 config_->ss_target_bitrate[i] * 2 / 3;
199 config_->layer_target_bitrate[i * num_temporal_layers_ + 1] =
200 config_->ss_target_bitrate[i];
201 } else if (num_temporal_layers_ == 3) {
202 config_->layer_target_bitrate[i * num_temporal_layers_] =
203 config_->ss_target_bitrate[i] / 2;
204 config_->layer_target_bitrate[i * num_temporal_layers_ + 1] =
205 config_->layer_target_bitrate[i * num_temporal_layers_] +
206 (config_->ss_target_bitrate[i] / 4);
207 config_->layer_target_bitrate[i * num_temporal_layers_ + 2] =
208 config_->ss_target_bitrate[i];
209 } else {
Mirko Bonadei675513b2017-11-09 11:09:25 +0100210 RTC_LOG(LS_ERROR) << "Unsupported number of temporal layers: "
211 << num_temporal_layers_;
sprangce4aef12015-11-02 07:23:20 -0800212 return false;
213 }
asaperssona9455ab2015-07-31 06:10:09 -0700214 }
215 }
asaperssona9455ab2015-07-31 06:10:09 -0700216 return true;
217}
218
Erik Språng08127a92016-11-16 16:41:30 +0100219int VP9EncoderImpl::SetRateAllocation(
Erik Språng566124a2018-04-23 12:32:22 +0200220 const VideoBitrateAllocation& bitrate_allocation,
Erik Språng08127a92016-11-16 16:41:30 +0100221 uint32_t frame_rate) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000222 if (!inited_) {
223 return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
224 }
225 if (encoder_->err) {
226 return WEBRTC_VIDEO_CODEC_ERROR;
227 }
Erik Språng08127a92016-11-16 16:41:30 +0100228 if (frame_rate < 1) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000229 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
230 }
231 // Update bit rate
Erik Språng08127a92016-11-16 16:41:30 +0100232 if (codec_.maxBitrate > 0 &&
233 bitrate_allocation.get_sum_kbps() > codec_.maxBitrate) {
234 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000235 }
Erik Språng08127a92016-11-16 16:41:30 +0100236
Erik Språng08127a92016-11-16 16:41:30 +0100237 codec_.maxFramerate = frame_rate;
asaperssona9455ab2015-07-31 06:10:09 -0700238
Sergey Silkin86684962018-03-28 19:32:37 +0200239 if (!SetSvcRates(bitrate_allocation)) {
asaperssona9455ab2015-07-31 06:10:09 -0700240 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
241 }
242
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000243 // Update encoder context
244 if (vpx_codec_enc_config_set(encoder_, config_)) {
245 return WEBRTC_VIDEO_CODEC_ERROR;
246 }
247 return WEBRTC_VIDEO_CODEC_OK;
248}
249
250int VP9EncoderImpl::InitEncode(const VideoCodec* inst,
251 int number_of_cores,
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000252 size_t /*max_payload_size*/) {
sprang3958ed82017-08-17 08:12:10 -0700253 if (inst == nullptr) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000254 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
255 }
256 if (inst->maxFramerate < 1) {
257 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
258 }
259 // Allow zero to represent an unspecified maxBitRate
260 if (inst->maxBitrate > 0 && inst->startBitrate > inst->maxBitrate) {
261 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
262 }
263 if (inst->width < 1 || inst->height < 1) {
264 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
265 }
266 if (number_of_cores < 1) {
267 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
268 }
hta257dc392016-10-25 09:05:06 -0700269 if (inst->VP9().numberOfTemporalLayers > 3) {
asaperssona9455ab2015-07-31 06:10:09 -0700270 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
271 }
ilnik2a8c2f52017-02-15 02:23:28 -0800272 // libvpx probably does not support more than 3 spatial layers.
273 if (inst->VP9().numberOfSpatialLayers > 3) {
asaperssona9455ab2015-07-31 06:10:09 -0700274 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
275 }
philipelcfc319b2015-11-10 07:17:23 -0800276
asapersson86956de2016-01-26 01:05:20 -0800277 int ret_val = Release();
278 if (ret_val < 0) {
279 return ret_val;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000280 }
sprang3958ed82017-08-17 08:12:10 -0700281 if (encoder_ == nullptr) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000282 encoder_ = new vpx_codec_ctx_t;
283 }
sprang3958ed82017-08-17 08:12:10 -0700284 if (config_ == nullptr) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000285 config_ = new vpx_codec_enc_cfg_t;
286 }
287 timestamp_ = 0;
288 if (&codec_ != inst) {
289 codec_ = *inst;
290 }
asaperssona9455ab2015-07-31 06:10:09 -0700291
hta257dc392016-10-25 09:05:06 -0700292 num_spatial_layers_ = inst->VP9().numberOfSpatialLayers;
Niels Möller65fb4042018-04-25 14:46:06 +0200293 RTC_DCHECK_GT(num_spatial_layers_, 0);
hta257dc392016-10-25 09:05:06 -0700294 num_temporal_layers_ = inst->VP9().numberOfTemporalLayers;
asaperssona9455ab2015-07-31 06:10:09 -0700295 if (num_temporal_layers_ == 0)
296 num_temporal_layers_ = 1;
297
Sergey Silkind902d582018-05-18 17:31:19 +0200298 // Init framerate controller.
299 output_framerate_.Reset();
Niels Möllere3cf3d02018-06-13 11:52:16 +0200300 if (codec_.mode == VideoCodecMode::kScreensharing) {
Sergey Silkind902d582018-05-18 17:31:19 +0200301 target_framerate_fps_ = kMaxScreenSharingFramerateFps;
302 } else {
303 target_framerate_fps_.reset();
304 }
305
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +0200306 is_svc_ = (num_spatial_layers_ > 1 || num_temporal_layers_ > 1);
307 // Flexible mode requires SVC to be enabled since libvpx API only allows
308 // to get reference list in SVC mode.
309 RTC_DCHECK(!inst->VP9().flexibleMode || is_svc_);
310
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000311 // Allocate memory for encoded image
sprang3958ed82017-08-17 08:12:10 -0700312 if (encoded_image_._buffer != nullptr) {
philipelcce46fc2015-12-21 03:04:49 -0800313 delete[] encoded_image_._buffer;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000314 }
nisseeb44b392017-04-28 07:18:05 -0700315 encoded_image_._size =
316 CalcBufferSize(VideoType::kI420, codec_.width, codec_.height);
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000317 encoded_image_._buffer = new uint8_t[encoded_image_._size];
318 encoded_image_._completeFrame = true;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000319 // Populate encoder configuration with default values.
320 if (vpx_codec_enc_config_default(vpx_codec_vp9_cx(), config_, 0)) {
321 return WEBRTC_VIDEO_CODEC_ERROR;
322 }
Emircan Uysaler0823eec2018-07-13 17:10:00 -0700323
324 vpx_img_fmt img_fmt = VPX_IMG_FMT_NONE;
325 unsigned int bits_for_storage = 8;
326 switch (profile_) {
327 case VP9Profile::kProfile0:
328 img_fmt = VPX_IMG_FMT_I420;
329 bits_for_storage = 8;
330 config_->g_bit_depth = VPX_BITS_8;
331 config_->g_profile = 0;
332 config_->g_input_bit_depth = 8;
333 break;
334 case VP9Profile::kProfile2:
335 img_fmt = VPX_IMG_FMT_I42016;
336 bits_for_storage = 16;
337 config_->g_bit_depth = VPX_BITS_10;
338 config_->g_profile = 2;
339 config_->g_input_bit_depth = 10;
340 break;
341 }
342
343 // Creating a wrapper to the image - setting image data to nullptr. Actual
344 // pointer will be set in encode. Setting align to 1, as it is meaningless
345 // (actual memory is not allocated).
346 raw_ =
347 vpx_img_wrap(nullptr, img_fmt, codec_.width, codec_.height, 1, nullptr);
348 raw_->bit_depth = bits_for_storage;
349
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000350 config_->g_w = codec_.width;
351 config_->g_h = codec_.height;
352 config_->rc_target_bitrate = inst->startBitrate; // in kbit/s
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +0200353 config_->g_error_resilient = is_svc_ ? VPX_ERROR_RESILIENT_DEFAULT : 0;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000354 // Setting the time base of the codec.
355 config_->g_timebase.num = 1;
356 config_->g_timebase.den = 90000;
357 config_->g_lag_in_frames = 0; // 0- no frame lagging
358 config_->g_threads = 1;
359 // Rate control settings.
hta257dc392016-10-25 09:05:06 -0700360 config_->rc_dropframe_thresh = inst->VP9().frameDroppingOn ? 30 : 0;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000361 config_->rc_end_usage = VPX_CBR;
362 config_->g_pass = VPX_RC_ONE_PASS;
363 config_->rc_min_quantizer = 2;
marpan@webrtc.orgdc8a9da2015-01-27 23:08:24 +0000364 config_->rc_max_quantizer = 52;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000365 config_->rc_undershoot_pct = 50;
366 config_->rc_overshoot_pct = 50;
367 config_->rc_buf_initial_sz = 500;
368 config_->rc_buf_optimal_sz = 600;
369 config_->rc_buf_sz = 1000;
370 // Set the maximum target size of any key-frame.
371 rc_max_intra_target_ = MaxIntraTarget(config_->rc_buf_optimal_sz);
hta257dc392016-10-25 09:05:06 -0700372 if (inst->VP9().keyFrameInterval > 0) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000373 config_->kf_mode = VPX_KF_AUTO;
hta257dc392016-10-25 09:05:06 -0700374 config_->kf_max_dist = inst->VP9().keyFrameInterval;
Åsa Perssonff24c042015-12-04 10:58:08 +0100375 // Needs to be set (in svc mode) to get correct periodic key frame interval
376 // (will have no effect in non-svc).
377 config_->kf_min_dist = config_->kf_max_dist;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000378 } else {
379 config_->kf_mode = VPX_KF_DISABLED;
380 }
hta257dc392016-10-25 09:05:06 -0700381 config_->rc_resize_allowed = inst->VP9().automaticResizeOn ? 1 : 0;
marpan@webrtc.org38d11b82015-01-26 15:21:36 +0000382 // Determine number of threads based on the image size and #cores.
philipelcce46fc2015-12-21 03:04:49 -0800383 config_->g_threads =
384 NumberOfThreads(config_->g_w, config_->g_h, number_of_cores);
asaperssona9455ab2015-07-31 06:10:09 -0700385
Marco6e89b252015-07-07 14:40:38 -0700386 cpu_speed_ = GetCpuSpeed(config_->g_w, config_->g_h);
asaperssona9455ab2015-07-31 06:10:09 -0700387
388 // TODO(asapersson): Check configuration of temporal switch up and increase
389 // pattern length.
hta257dc392016-10-25 09:05:06 -0700390 is_flexible_mode_ = inst->VP9().flexibleMode;
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200391
392 // TODO(ssilkin): Only non-flexible mode is supported for now.
393 RTC_DCHECK(!is_flexible_mode_);
394
395 if (num_temporal_layers_ == 1) {
asaperssona9455ab2015-07-31 06:10:09 -0700396 gof_.SetGofInfoVP9(kTemporalStructureMode1);
397 config_->temporal_layering_mode = VP9E_TEMPORAL_LAYERING_MODE_NOLAYERING;
398 config_->ts_number_layers = 1;
399 config_->ts_rate_decimator[0] = 1;
400 config_->ts_periodicity = 1;
401 config_->ts_layer_id[0] = 0;
402 } else if (num_temporal_layers_ == 2) {
403 gof_.SetGofInfoVP9(kTemporalStructureMode2);
404 config_->temporal_layering_mode = VP9E_TEMPORAL_LAYERING_MODE_0101;
405 config_->ts_number_layers = 2;
406 config_->ts_rate_decimator[0] = 2;
407 config_->ts_rate_decimator[1] = 1;
408 config_->ts_periodicity = 2;
409 config_->ts_layer_id[0] = 0;
410 config_->ts_layer_id[1] = 1;
411 } else if (num_temporal_layers_ == 3) {
412 gof_.SetGofInfoVP9(kTemporalStructureMode3);
413 config_->temporal_layering_mode = VP9E_TEMPORAL_LAYERING_MODE_0212;
414 config_->ts_number_layers = 3;
415 config_->ts_rate_decimator[0] = 4;
416 config_->ts_rate_decimator[1] = 2;
417 config_->ts_rate_decimator[2] = 1;
418 config_->ts_periodicity = 4;
419 config_->ts_layer_id[0] = 0;
420 config_->ts_layer_id[1] = 2;
421 config_->ts_layer_id[2] = 1;
422 config_->ts_layer_id[3] = 2;
423 } else {
424 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
425 }
426
Sergey Silkin6a8f30e2018-04-26 11:03:49 +0200427 inter_layer_pred_ = inst->VP9().interLayerPred;
428
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +0200429 ref_buf_.clear();
430
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000431 return InitAndSetControlSettings(inst);
432}
433
marpan@webrtc.org38d11b82015-01-26 15:21:36 +0000434int VP9EncoderImpl::NumberOfThreads(int width,
435 int height,
436 int number_of_cores) {
437 // Keep the number of encoder threads equal to the possible number of column
438 // tiles, which is (1, 2, 4, 8). See comments below for VP9E_SET_TILE_COLUMNS.
439 if (width * height >= 1280 * 720 && number_of_cores > 4) {
440 return 4;
jianj23173a32017-07-12 16:11:09 -0700441 } else if (width * height >= 640 * 360 && number_of_cores > 2) {
marpan@webrtc.org38d11b82015-01-26 15:21:36 +0000442 return 2;
443 } else {
Yves Gerey665174f2018-06-19 15:03:05 +0200444// Use 2 threads for low res on ARM.
Jerome Jiang831af372017-12-05 10:44:35 -0800445#if defined(WEBRTC_ARCH_ARM) || defined(WEBRTC_ARCH_ARM64) || \
446 defined(WEBRTC_ANDROID)
447 if (width * height >= 320 * 180 && number_of_cores > 2) {
448 return 2;
449 }
450#endif
marpan@webrtc.org38d11b82015-01-26 15:21:36 +0000451 // 1 thread less than VGA.
452 return 1;
453 }
454}
455
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000456int VP9EncoderImpl::InitAndSetControlSettings(const VideoCodec* inst) {
Åsa Perssonff24c042015-12-04 10:58:08 +0100457 // Set QP-min/max per spatial and temporal layer.
458 int tot_num_layers = num_spatial_layers_ * num_temporal_layers_;
459 for (int i = 0; i < tot_num_layers; ++i) {
johannkoenig8225c402017-01-26 13:23:44 -0800460 svc_params_.max_quantizers[i] = config_->rc_max_quantizer;
461 svc_params_.min_quantizers[i] = config_->rc_min_quantizer;
Åsa Perssonff24c042015-12-04 10:58:08 +0100462 }
asaperssona9455ab2015-07-31 06:10:09 -0700463 config_->ss_number_layers = num_spatial_layers_;
sprangce4aef12015-11-02 07:23:20 -0800464 if (ExplicitlyConfiguredSpatialLayers()) {
465 for (int i = 0; i < num_spatial_layers_; ++i) {
466 const auto& layer = codec_.spatialLayers[i];
Rasmus Brandt58cd3852018-06-26 13:41:16 +0200467 RTC_CHECK_GT(layer.width, 0);
Sergey Silkin13e74342018-03-02 12:28:00 +0100468 const int scale_factor = codec_.width / layer.width;
469 RTC_DCHECK_GT(scale_factor, 0);
470
471 // Ensure scaler factor is integer.
472 if (scale_factor * layer.width != codec_.width) {
473 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
474 }
475
476 // Ensure scale factor is the same in both dimensions.
477 if (scale_factor * layer.height != codec_.height) {
478 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
479 }
480
481 // Ensure scale factor is power of two.
482 const bool is_pow_of_two = (scale_factor & (scale_factor - 1)) == 0;
483 if (!is_pow_of_two) {
484 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
485 }
486
487 svc_params_.scaling_factor_num[i] = 1;
488 svc_params_.scaling_factor_den[i] = scale_factor;
sprangce4aef12015-11-02 07:23:20 -0800489 }
490 } else {
491 int scaling_factor_num = 256;
492 for (int i = num_spatial_layers_ - 1; i >= 0; --i) {
sprangce4aef12015-11-02 07:23:20 -0800493 // 1:2 scaling in each dimension.
johannkoenig8225c402017-01-26 13:23:44 -0800494 svc_params_.scaling_factor_num[i] = scaling_factor_num;
495 svc_params_.scaling_factor_den[i] = 256;
sprangce4aef12015-11-02 07:23:20 -0800496 }
asaperssona9455ab2015-07-31 06:10:09 -0700497 }
498
Sergey Silkin86684962018-03-28 19:32:37 +0200499 SvcRateAllocator init_allocator(codec_);
Erik Språng566124a2018-04-23 12:32:22 +0200500 VideoBitrateAllocation allocation = init_allocator.GetAllocation(
Sergey Silkin86684962018-03-28 19:32:37 +0200501 inst->startBitrate * 1000, inst->maxFramerate);
502 if (!SetSvcRates(allocation)) {
asaperssona9455ab2015-07-31 06:10:09 -0700503 return WEBRTC_VIDEO_CODEC_ERR_PARAMETER;
504 }
505
Emircan Uysaler0823eec2018-07-13 17:10:00 -0700506 const vpx_codec_err_t rv = vpx_codec_enc_init(
507 encoder_, vpx_codec_vp9_cx(), config_,
508 config_->g_bit_depth == VPX_BITS_8 ? 0 : VPX_CODEC_USE_HIGHBITDEPTH);
509 if (rv != VPX_CODEC_OK) {
510 RTC_LOG(LS_ERROR) << "Init error: " << vpx_codec_err_to_string(rv);
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000511 return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
512 }
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000513 vpx_codec_control(encoder_, VP8E_SET_CPUUSED, cpu_speed_);
514 vpx_codec_control(encoder_, VP8E_SET_MAX_INTRA_BITRATE_PCT,
515 rc_max_intra_target_);
516 vpx_codec_control(encoder_, VP9E_SET_AQ_MODE,
hta257dc392016-10-25 09:05:06 -0700517 inst->VP9().adaptiveQpMode ? 3 : 0);
asaperssona9455ab2015-07-31 06:10:09 -0700518
jianj822e5932017-07-12 16:09:58 -0700519 vpx_codec_control(encoder_, VP9E_SET_FRAME_PARALLEL_DECODING, 0);
Sergey Silkin6a8f30e2018-04-26 11:03:49 +0200520
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +0200521 if (is_svc_) {
522 vpx_codec_control(encoder_, VP9E_SET_SVC, 1);
523 vpx_codec_control(encoder_, VP9E_SET_SVC_PARAMETERS, &svc_params_);
asaperssona9455ab2015-07-31 06:10:09 -0700524 }
Sergey Silkin6a8f30e2018-04-26 11:03:49 +0200525
526 if (num_spatial_layers_ > 1) {
527 switch (inter_layer_pred_) {
528 case InterLayerPredMode::kOn:
529 vpx_codec_control(encoder_, VP9E_SET_SVC_INTER_LAYER_PRED, 0);
530 break;
531 case InterLayerPredMode::kOff:
532 vpx_codec_control(encoder_, VP9E_SET_SVC_INTER_LAYER_PRED, 1);
533 break;
534 case InterLayerPredMode::kOnKeyPic:
535 vpx_codec_control(encoder_, VP9E_SET_SVC_INTER_LAYER_PRED, 2);
536 break;
537 default:
538 RTC_NOTREACHED();
539 }
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200540
Sergey Silkinee203362018-05-30 11:34:08 +0200541 // Configure encoder to drop entire superframe whenever it needs to drop
542 // a layer. This mode is prefered over per-layer dropping which causes
543 // quality flickering and is not compatible with RTP non-flexible mode.
544 vpx_svc_frame_drop_t svc_drop_frame;
545 memset(&svc_drop_frame, 0, sizeof(svc_drop_frame));
546 svc_drop_frame.framedrop_mode = FULL_SUPERFRAME_DROP;
Sergey Silkind45b3452018-05-31 16:00:24 +0200547 svc_drop_frame.max_consec_drop = std::numeric_limits<int>::max();
Sergey Silkinee203362018-05-30 11:34:08 +0200548 for (size_t i = 0; i < num_spatial_layers_; ++i) {
549 svc_drop_frame.framedrop_thresh[i] = config_->rc_dropframe_thresh;
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200550 }
Sergey Silkinee203362018-05-30 11:34:08 +0200551 vpx_codec_control(encoder_, VP9E_SET_SVC_FRAME_DROP_LAYER, &svc_drop_frame);
Sergey Silkin6a8f30e2018-04-26 11:03:49 +0200552 }
553
asaperssona9455ab2015-07-31 06:10:09 -0700554 // Register callback for getting each spatial layer.
555 vpx_codec_priv_output_cx_pkt_cb_pair_t cbp = {
philipelcce46fc2015-12-21 03:04:49 -0800556 VP9EncoderImpl::EncoderOutputCodedPacketCallback,
557 reinterpret_cast<void*>(this)};
558 vpx_codec_control(encoder_, VP9E_REGISTER_CX_CALLBACK,
559 reinterpret_cast<void*>(&cbp));
asaperssona9455ab2015-07-31 06:10:09 -0700560
marpan@webrtc.org38d11b82015-01-26 15:21:36 +0000561 // Control function to set the number of column tiles in encoding a frame, in
562 // log2 unit: e.g., 0 = 1 tile column, 1 = 2 tile columns, 2 = 4 tile columns.
563 // The number tile columns will be capped by the encoder based on image size
564 // (minimum width of tile column is 256 pixels, maximum is 4096).
565 vpx_codec_control(encoder_, VP9E_SET_TILE_COLUMNS, (config_->g_threads >> 1));
jianjcb5d1152017-03-28 23:56:08 -0700566
567 // Turn on row-based multithreading.
568 vpx_codec_control(encoder_, VP9E_SET_ROW_MT, 1);
jianj6bf57e32017-06-05 13:43:49 -0700569
Alex Glaznevfecb7c32016-03-31 14:23:27 -0700570#if !defined(WEBRTC_ARCH_ARM) && !defined(WEBRTC_ARCH_ARM64) && \
Yves Gerey665174f2018-06-19 15:03:05 +0200571 !defined(ANDROID)
jianj6bf57e32017-06-05 13:43:49 -0700572 // Do not enable the denoiser on ARM since optimization is pending.
573 // Denoiser is on by default on other platforms.
marpan@webrtc.org16a87b92015-03-05 22:19:00 +0000574 vpx_codec_control(encoder_, VP9E_SET_NOISE_SENSITIVITY,
hta257dc392016-10-25 09:05:06 -0700575 inst->VP9().denoisingOn ? 1 : 0);
marpan@webrtc.org16a87b92015-03-05 22:19:00 +0000576#endif
jianj6bf57e32017-06-05 13:43:49 -0700577
Niels Möllere3cf3d02018-06-13 11:52:16 +0200578 if (codec_.mode == VideoCodecMode::kScreensharing) {
ivica242d6382015-09-04 06:13:23 -0700579 // Adjust internal parameters to screen content.
580 vpx_codec_control(encoder_, VP9E_SET_TUNE_CONTENT, 1);
ivica242d6382015-09-04 06:13:23 -0700581 }
Marco2520e722015-09-16 14:05:00 -0700582 // Enable encoder skip of static/low content blocks.
583 vpx_codec_control(encoder_, VP8E_SET_STATIC_THRESHOLD, 1);
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000584 inited_ = true;
585 return WEBRTC_VIDEO_CODEC_OK;
586}
587
588uint32_t VP9EncoderImpl::MaxIntraTarget(uint32_t optimal_buffer_size) {
589 // Set max to the optimal buffer level (normalized by target BR),
590 // and scaled by a scale_par.
591 // Max target size = scale_par * optimal_buffer_size * targetBR[Kbps].
592 // This value is presented in percentage of perFrameBw:
593 // perFrameBw = targetBR[Kbps] * 1000 / framerate.
594 // The target in % is as follows:
595 float scale_par = 0.5;
596 uint32_t target_pct =
597 optimal_buffer_size * scale_par * codec_.maxFramerate / 10;
598 // Don't go below 3 times the per frame bandwidth.
599 const uint32_t min_intra_size = 300;
philipelcce46fc2015-12-21 03:04:49 -0800600 return (target_pct < min_intra_size) ? min_intra_size : target_pct;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000601}
602
Miguel Casas-Sanchez47650702015-05-29 17:21:40 -0700603int VP9EncoderImpl::Encode(const VideoFrame& input_image,
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000604 const CodecSpecificInfo* codec_specific_info,
pbos22993e12015-10-19 02:39:06 -0700605 const std::vector<FrameType>* frame_types) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000606 if (!inited_) {
607 return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
608 }
sprang3958ed82017-08-17 08:12:10 -0700609 if (encoded_complete_callback_ == nullptr) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000610 return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
611 }
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200612
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000613 // We only support one stream at the moment.
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200614 if (frame_types && !frame_types->empty()) {
615 if ((*frame_types)[0] == kVideoFrameKey) {
616 force_key_frame_ = true;
617 }
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000618 }
Sergey Silkind902d582018-05-18 17:31:19 +0200619
Niels Möllere3cf3d02018-06-13 11:52:16 +0200620 if (VideoCodecMode::kScreensharing == codec_.mode && !force_key_frame_) {
Sergey Silkind902d582018-05-18 17:31:19 +0200621 if (DropFrame(input_image.timestamp())) {
622 return WEBRTC_VIDEO_CODEC_OK;
623 }
624 }
625
kwiberg352444f2016-11-28 15:58:53 -0800626 RTC_DCHECK_EQ(input_image.width(), raw_->d_w);
627 RTC_DCHECK_EQ(input_image.height(), raw_->d_h);
asaperssona9455ab2015-07-31 06:10:09 -0700628
629 // Set input image for use in the callback.
630 // This was necessary since you need some information from input_image.
631 // You can save only the necessary information (such as timestamp) instead of
632 // doing this.
633 input_image_ = &input_image;
634
Emircan Uysaler0823eec2018-07-13 17:10:00 -0700635 // Keep reference to buffer until encode completes.
636 rtc::scoped_refptr<I420BufferInterface> i420_buffer;
637 rtc::scoped_refptr<I010BufferInterface> i010_buffer;
638 switch (profile_) {
639 case VP9Profile::kProfile0: {
640 i420_buffer = input_image.video_frame_buffer()->ToI420();
641 // Image in vpx_image_t format.
642 // Input image is const. VPX's raw image is not defined as const.
643 raw_->planes[VPX_PLANE_Y] = const_cast<uint8_t*>(i420_buffer->DataY());
644 raw_->planes[VPX_PLANE_U] = const_cast<uint8_t*>(i420_buffer->DataU());
645 raw_->planes[VPX_PLANE_V] = const_cast<uint8_t*>(i420_buffer->DataV());
646 raw_->stride[VPX_PLANE_Y] = i420_buffer->StrideY();
647 raw_->stride[VPX_PLANE_U] = i420_buffer->StrideU();
648 raw_->stride[VPX_PLANE_V] = i420_buffer->StrideV();
649 break;
650 }
651 case VP9Profile::kProfile2: {
652 // We can inject kI010 frames directly for encode. All other formats
653 // should be converted to it.
654 switch (input_image.video_frame_buffer()->type()) {
655 case VideoFrameBuffer::Type::kI010: {
656 i010_buffer = input_image.video_frame_buffer()->GetI010();
657 break;
658 }
659 default: {
660 i010_buffer =
661 I010Buffer::Copy(*input_image.video_frame_buffer()->ToI420());
662 }
663 }
664 raw_->planes[VPX_PLANE_Y] = const_cast<uint8_t*>(
665 reinterpret_cast<const uint8_t*>(i010_buffer->DataY()));
666 raw_->planes[VPX_PLANE_U] = const_cast<uint8_t*>(
667 reinterpret_cast<const uint8_t*>(i010_buffer->DataU()));
668 raw_->planes[VPX_PLANE_V] = const_cast<uint8_t*>(
669 reinterpret_cast<const uint8_t*>(i010_buffer->DataV()));
670 raw_->stride[VPX_PLANE_Y] = i010_buffer->StrideY() * 2;
671 raw_->stride[VPX_PLANE_U] = i010_buffer->StrideU() * 2;
672 raw_->stride[VPX_PLANE_V] = i010_buffer->StrideV() * 2;
673 break;
674 }
675 }
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000676
philipelcfc319b2015-11-10 07:17:23 -0800677 vpx_enc_frame_flags_t flags = 0;
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200678 if (force_key_frame_) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000679 flags = VPX_EFLAG_FORCE_KF;
680 }
philipelcfc319b2015-11-10 07:17:23 -0800681
sprang3958ed82017-08-17 08:12:10 -0700682 RTC_CHECK_GT(codec_.maxFramerate, 0);
Sergey Silkind902d582018-05-18 17:31:19 +0200683 uint32_t duration =
684 90000 / target_framerate_fps_.value_or(codec_.maxFramerate);
Emircan Uysaler0823eec2018-07-13 17:10:00 -0700685 const vpx_codec_err_t rv = vpx_codec_encode(encoder_, raw_, timestamp_,
686 duration, flags, VPX_DL_REALTIME);
687 if (rv != VPX_CODEC_OK) {
688 RTC_LOG(LS_ERROR) << "Encoding error: " << vpx_codec_err_to_string(rv)
689 << "\n"
690 << "Details: " << vpx_codec_error(encoder_) << "\n"
691 << vpx_codec_error_detail(encoder_);
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000692 return WEBRTC_VIDEO_CODEC_ERROR;
693 }
694 timestamp_ += duration;
asaperssona9455ab2015-07-31 06:10:09 -0700695
Sergey Silkinbc0f0d32018-04-24 21:29:14 +0200696 const bool end_of_picture = true;
697 DeliverBufferedFrame(end_of_picture);
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200698
asaperssona9455ab2015-07-31 06:10:09 -0700699 return WEBRTC_VIDEO_CODEC_OK;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000700}
701
702void VP9EncoderImpl::PopulateCodecSpecific(CodecSpecificInfo* codec_specific,
philipelcce46fc2015-12-21 03:04:49 -0800703 const vpx_codec_cx_pkt& pkt,
Sergey Silkin07f80cc2018-04-09 13:11:59 +0200704 uint32_t timestamp,
705 bool first_frame_in_picture) {
sprang3958ed82017-08-17 08:12:10 -0700706 RTC_CHECK(codec_specific != nullptr);
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000707 codec_specific->codecType = kVideoCodecVP9;
perkj275afc52016-09-01 00:21:16 -0700708 codec_specific->codec_name = ImplementationName();
philipelcce46fc2015-12-21 03:04:49 -0800709 CodecSpecificInfoVP9* vp9_info = &(codec_specific->codecSpecific.VP9);
Sergey Silkin07f80cc2018-04-09 13:11:59 +0200710
711 vp9_info->first_frame_in_picture = first_frame_in_picture;
hta257dc392016-10-25 09:05:06 -0700712 vp9_info->flexible_mode = codec_.VP9()->flexibleMode;
713 vp9_info->ss_data_available =
714 ((pkt.data.frame.flags & VPX_FRAME_IS_KEY) && !codec_.VP9()->flexibleMode)
715 ? true
716 : false;
asaperssona9455ab2015-07-31 06:10:09 -0700717
718 vpx_svc_layer_id_t layer_id = {0};
719 vpx_codec_control(encoder_, VP9E_GET_SVC_LAYER_ID, &layer_id);
720
sprang3958ed82017-08-17 08:12:10 -0700721 RTC_CHECK_GT(num_temporal_layers_, 0);
“Michael23c5a992018-06-21 11:07:21 -0500722 RTC_CHECK_GT(num_active_spatial_layers_, 0);
asaperssona9455ab2015-07-31 06:10:09 -0700723 if (num_temporal_layers_ == 1) {
sprang3958ed82017-08-17 08:12:10 -0700724 RTC_CHECK_EQ(layer_id.temporal_layer_id, 0);
asaperssona9455ab2015-07-31 06:10:09 -0700725 vp9_info->temporal_idx = kNoTemporalIdx;
726 } else {
727 vp9_info->temporal_idx = layer_id.temporal_layer_id;
728 }
“Michael23c5a992018-06-21 11:07:21 -0500729 if (num_active_spatial_layers_ == 1) {
sprang3958ed82017-08-17 08:12:10 -0700730 RTC_CHECK_EQ(layer_id.spatial_layer_id, 0);
asaperssona9455ab2015-07-31 06:10:09 -0700731 vp9_info->spatial_idx = kNoSpatialIdx;
732 } else {
733 vp9_info->spatial_idx = layer_id.spatial_layer_id;
734 }
735 if (layer_id.spatial_layer_id != 0) {
736 vp9_info->ss_data_available = false;
737 }
738
asaperssona9455ab2015-07-31 06:10:09 -0700739 // TODO(asapersson): this info has to be obtained from the encoder.
asaperssoncb50c962015-11-18 01:58:55 -0800740 vp9_info->temporal_up_switch = false;
asaperssona9455ab2015-07-31 06:10:09 -0700741
Sergey Silkin6a8f30e2018-04-26 11:03:49 +0200742 if (pkt.data.frame.flags & VPX_FRAME_IS_KEY) {
743 pics_since_key_ = 0;
744 } else if (first_frame_in_picture) {
745 ++pics_since_key_;
asaperssona9455ab2015-07-31 06:10:09 -0700746 }
747
Sergey Silkin6a8f30e2018-04-26 11:03:49 +0200748 const bool is_key_pic = (pics_since_key_ == 0);
749 const bool is_inter_layer_pred_allowed =
750 (inter_layer_pred_ == InterLayerPredMode::kOn ||
751 (inter_layer_pred_ == InterLayerPredMode::kOnKeyPic && is_key_pic));
752
753 // Always set inter_layer_predicted to true on high layer frame if inter-layer
754 // prediction (ILP) is allowed even if encoder didn't actually use it.
755 // Setting inter_layer_predicted to false would allow receiver to decode high
756 // layer frame without decoding low layer frame. If that would happen (e.g.
757 // if low layer frame is lost) then receiver won't be able to decode next high
758 // layer frame which uses ILP.
759 vp9_info->inter_layer_predicted =
760 first_frame_in_picture ? false : is_inter_layer_pred_allowed;
761
762 const bool is_last_layer =
“Michael23c5a992018-06-21 11:07:21 -0500763 (layer_id.spatial_layer_id + 1 == num_active_spatial_layers_);
Sergey Silkin6a8f30e2018-04-26 11:03:49 +0200764 vp9_info->non_ref_for_inter_layer_pred =
765 is_last_layer ? true : !is_inter_layer_pred_allowed;
asapersson00ac85e2015-11-11 05:30:48 -0800766
ivica7f6a6fc2015-09-08 02:40:29 -0700767 // Always populate this, so that the packetizer can properly set the marker
768 // bit.
“Michael23c5a992018-06-21 11:07:21 -0500769 vp9_info->num_spatial_layers = num_active_spatial_layers_;
philipelcfc319b2015-11-10 07:17:23 -0800770
Sergey Silkinbe71a1e2018-05-17 16:46:43 +0200771 RTC_DCHECK(!vp9_info->flexible_mode);
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +0200772
773 vp9_info->num_ref_pics = 0;
774 if (vp9_info->flexible_mode) {
775 vp9_info->gof_idx = kNoGofIdx;
776 FillReferenceIndices(pkt, pics_since_key_, vp9_info->inter_layer_predicted,
777 vp9_info);
778 } else {
779 vp9_info->gof_idx =
780 static_cast<uint8_t>(pics_since_key_ % gof_.num_frames_in_gof);
781 vp9_info->temporal_up_switch = gof_.temporal_up_switch[vp9_info->gof_idx];
782 vp9_info->num_ref_pics = gof_.num_ref_pics[vp9_info->gof_idx];
783 }
784
785 vp9_info->inter_pic_predicted = (!is_key_pic && vp9_info->num_ref_pics > 0);
786
asaperssona9455ab2015-07-31 06:10:09 -0700787 if (vp9_info->ss_data_available) {
asaperssona9455ab2015-07-31 06:10:09 -0700788 vp9_info->spatial_layer_resolution_present = true;
“Michael23c5a992018-06-21 11:07:21 -0500789 for (size_t i = 0; i < num_active_spatial_layers_; ++i) {
Yves Gerey665174f2018-06-19 15:03:05 +0200790 vp9_info->width[i] = codec_.width * svc_params_.scaling_factor_num[i] /
johannkoenig8225c402017-01-26 13:23:44 -0800791 svc_params_.scaling_factor_den[i];
Yves Gerey665174f2018-06-19 15:03:05 +0200792 vp9_info->height[i] = codec_.height * svc_params_.scaling_factor_num[i] /
johannkoenig8225c402017-01-26 13:23:44 -0800793 svc_params_.scaling_factor_den[i];
asaperssona9455ab2015-07-31 06:10:09 -0700794 }
795 if (!vp9_info->flexible_mode) {
796 vp9_info->gof.CopyGofInfoVP9(gof_);
797 }
798 }
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000799}
800
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +0200801void VP9EncoderImpl::FillReferenceIndices(const vpx_codec_cx_pkt& pkt,
802 const size_t pic_num,
803 const bool inter_layer_predicted,
804 CodecSpecificInfoVP9* vp9_info) {
805 vpx_svc_layer_id_t layer_id = {0};
806 vpx_codec_control(encoder_, VP9E_GET_SVC_LAYER_ID, &layer_id);
807
808 vpx_svc_ref_frame_config_t enc_layer_conf = {{0}};
809 vpx_codec_control(encoder_, VP9E_GET_SVC_REF_FRAME_CONFIG, &enc_layer_conf);
810
811 std::vector<RefFrameBuffer> ref_buf_list;
812 if (enc_layer_conf.reference_last[layer_id.spatial_layer_id]) {
813 const size_t fb_idx = enc_layer_conf.lst_fb_idx[layer_id.spatial_layer_id];
814 RTC_DCHECK(ref_buf_.find(fb_idx) != ref_buf_.end());
815 ref_buf_list.push_back(ref_buf_.at(fb_idx));
816 }
817
818 if (enc_layer_conf.reference_alt_ref[layer_id.spatial_layer_id]) {
819 const size_t fb_idx = enc_layer_conf.alt_fb_idx[layer_id.spatial_layer_id];
820 RTC_DCHECK(ref_buf_.find(fb_idx) != ref_buf_.end());
821 ref_buf_list.push_back(ref_buf_.at(fb_idx));
822 }
823
824 if (enc_layer_conf.reference_golden[layer_id.spatial_layer_id]) {
825 const size_t fb_idx = enc_layer_conf.gld_fb_idx[layer_id.spatial_layer_id];
826 RTC_DCHECK(ref_buf_.find(fb_idx) != ref_buf_.end());
827 ref_buf_list.push_back(ref_buf_.at(fb_idx));
828 }
829
830 size_t max_ref_temporal_layer_id = 0;
831
832 vp9_info->num_ref_pics = 0;
833 for (const RefFrameBuffer& ref_buf : ref_buf_list) {
834 RTC_DCHECK_LE(ref_buf.pic_num, pic_num);
835 if (ref_buf.pic_num < pic_num) {
836 if (inter_layer_pred_ != InterLayerPredMode::kOn) {
837 // RTP spec limits temporal prediction to the same spatial layer.
838 // It is safe to ignore this requirement if inter-layer prediction is
839 // enabled for all frames when all base frames are relayed to receiver.
840 RTC_DCHECK_EQ(ref_buf.spatial_layer_id, layer_id.spatial_layer_id);
841 }
842 RTC_DCHECK_LE(ref_buf.temporal_layer_id, layer_id.temporal_layer_id);
843
844 const size_t p_diff = pic_num - ref_buf.pic_num;
845 RTC_DCHECK_LE(p_diff, 127UL);
846
847 vp9_info->p_diff[vp9_info->num_ref_pics] = static_cast<uint8_t>(p_diff);
848 ++vp9_info->num_ref_pics;
849
850 max_ref_temporal_layer_id =
851 std::max(max_ref_temporal_layer_id, ref_buf.temporal_layer_id);
852 } else {
853 RTC_DCHECK(inter_layer_predicted);
854 // RTP spec only allows to use previous spatial layer for inter-layer
855 // prediction.
856 RTC_DCHECK_EQ(ref_buf.spatial_layer_id + 1, layer_id.spatial_layer_id);
857 }
858 }
859
860 vp9_info->temporal_up_switch =
861 (max_ref_temporal_layer_id <
862 static_cast<size_t>(layer_id.temporal_layer_id));
863}
864
865void VP9EncoderImpl::UpdateReferenceBuffers(const vpx_codec_cx_pkt& pkt,
866 const size_t pic_num) {
867 vpx_svc_layer_id_t layer_id = {0};
868 vpx_codec_control(encoder_, VP9E_GET_SVC_LAYER_ID, &layer_id);
869
870 vpx_svc_ref_frame_config_t enc_layer_conf = {{0}};
871 vpx_codec_control(encoder_, VP9E_GET_SVC_REF_FRAME_CONFIG, &enc_layer_conf);
872
873 const bool is_key_frame =
874 (pkt.data.frame.flags & VPX_FRAME_IS_KEY) ? true : false;
875
876 RefFrameBuffer frame_buf(pic_num, layer_id.spatial_layer_id,
877 layer_id.temporal_layer_id);
878
879 if (is_key_frame && layer_id.spatial_layer_id == 0) {
880 // Key frame updates all ref buffers.
881 for (size_t i = 0; i < kNumVp9Buffers; ++i) {
882 ref_buf_[i] = frame_buf;
883 }
884 } else {
885 if (enc_layer_conf.update_last[layer_id.spatial_layer_id]) {
886 ref_buf_[enc_layer_conf.lst_fb_idx[layer_id.spatial_layer_id]] =
887 frame_buf;
888 }
889
890 if (enc_layer_conf.update_alt_ref[layer_id.spatial_layer_id]) {
891 ref_buf_[enc_layer_conf.alt_fb_idx[layer_id.spatial_layer_id]] =
892 frame_buf;
893 }
894
895 if (enc_layer_conf.update_golden[layer_id.spatial_layer_id]) {
896 ref_buf_[enc_layer_conf.gld_fb_idx[layer_id.spatial_layer_id]] =
897 frame_buf;
898 }
899 }
900}
901
asaperssona9455ab2015-07-31 06:10:09 -0700902int VP9EncoderImpl::GetEncodedLayerFrame(const vpx_codec_cx_pkt* pkt) {
asapersson86956de2016-01-26 01:05:20 -0800903 RTC_DCHECK_EQ(pkt->kind, VPX_CODEC_CX_FRAME_PKT);
asaperssona9455ab2015-07-31 06:10:09 -0700904
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200905 if (pkt->data.frame.sz == 0) {
906 // Ignore dropped frame.
907 return WEBRTC_VIDEO_CODEC_OK;
908 }
909
Sergey Silkin07f80cc2018-04-09 13:11:59 +0200910 vpx_svc_layer_id_t layer_id = {0};
911 vpx_codec_control(encoder_, VP9E_GET_SVC_LAYER_ID, &layer_id);
912
913 const bool first_frame_in_picture = encoded_image_._length == 0;
914 // Ensure we don't buffer layers of previous picture (superframe).
915 RTC_DCHECK(first_frame_in_picture || layer_id.spatial_layer_id > 0);
916
Sergey Silkinbc0f0d32018-04-24 21:29:14 +0200917 const bool end_of_picture = false;
918 DeliverBufferedFrame(end_of_picture);
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200919
asaperssond9f641e2016-01-21 01:11:35 -0800920 if (pkt->data.frame.sz > encoded_image_._size) {
921 delete[] encoded_image_._buffer;
922 encoded_image_._size = pkt->data.frame.sz;
923 encoded_image_._buffer = new uint8_t[encoded_image_._size];
924 }
asapersson86956de2016-01-26 01:05:20 -0800925 memcpy(encoded_image_._buffer, pkt->data.frame.buf, pkt->data.frame.sz);
926 encoded_image_._length = pkt->data.frame.sz;
asaperssond9f641e2016-01-21 01:11:35 -0800927
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200928 const bool is_key_frame =
929 (pkt->data.frame.flags & VPX_FRAME_IS_KEY) ? true : false;
930 // Ensure encoder issued key frame on request.
931 RTC_DCHECK(is_key_frame || !force_key_frame_);
932
asaperssona9455ab2015-07-31 06:10:09 -0700933 // Check if encoded frame is a key frame.
asapersson86956de2016-01-26 01:05:20 -0800934 encoded_image_._frameType = kVideoFrameDelta;
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200935 if (is_key_frame) {
Peter Boström49e196a2015-10-23 15:58:18 +0200936 encoded_image_._frameType = kVideoFrameKey;
Sergey Silkinbd0954e2018-05-03 14:14:09 +0200937 force_key_frame_ = false;
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000938 }
asapersson86956de2016-01-26 01:05:20 -0800939 RTC_DCHECK_LE(encoded_image_._length, encoded_image_._size);
940
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200941 memset(&codec_specific_, 0, sizeof(codec_specific_));
Sergey Silkin07f80cc2018-04-09 13:11:59 +0200942 PopulateCodecSpecific(&codec_specific_, *pkt, input_image_->timestamp(),
943 first_frame_in_picture);
asaperssona9455ab2015-07-31 06:10:09 -0700944
Sergey Silkin4e6cd5e2018-05-28 12:26:36 +0200945 if (is_flexible_mode_) {
946 UpdateReferenceBuffers(*pkt, pics_since_key_);
947 }
948
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200949 TRACE_COUNTER1("webrtc", "EncodedFrameSize", encoded_image_._length);
950 encoded_image_._timeStamp = input_image_->timestamp();
951 encoded_image_.capture_time_ms_ = input_image_->render_time_ms();
952 encoded_image_.rotation_ = input_image_->rotation();
Niels Möllere3cf3d02018-06-13 11:52:16 +0200953 encoded_image_.content_type_ = (codec_.mode == VideoCodecMode::kScreensharing)
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200954 ? VideoContentType::SCREENSHARE
955 : VideoContentType::UNSPECIFIED;
956 encoded_image_._encodedHeight =
957 pkt->data.frame.height[layer_id.spatial_layer_id];
958 encoded_image_._encodedWidth =
959 pkt->data.frame.width[layer_id.spatial_layer_id];
Ilya Nikolaevskiyb6c462d2018-06-05 15:21:32 +0200960 encoded_image_.timing_.flags = VideoSendTiming::kInvalid;
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200961 int qp = -1;
962 vpx_codec_control(encoder_, VP8E_GET_LAST_QUANTIZER, &qp);
963 encoded_image_.qp_ = qp;
ilnik04f4d122017-06-19 07:18:55 -0700964
marpan@webrtc.org5b883172014-11-01 06:10:48 +0000965 return WEBRTC_VIDEO_CODEC_OK;
966}
967
Sergey Silkinbc0f0d32018-04-24 21:29:14 +0200968void VP9EncoderImpl::DeliverBufferedFrame(bool end_of_picture) {
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200969 if (encoded_image_._length > 0) {
Sergey Silkinbc0f0d32018-04-24 21:29:14 +0200970 codec_specific_.codecSpecific.VP9.end_of_picture = end_of_picture;
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200971
972 // No data partitioning in VP9, so 1 partition only.
973 int part_idx = 0;
974 RTPFragmentationHeader frag_info;
975 frag_info.VerifyAndAllocateFragmentationHeader(1);
976 frag_info.fragmentationOffset[part_idx] = 0;
977 frag_info.fragmentationLength[part_idx] = encoded_image_._length;
978 frag_info.fragmentationPlType[part_idx] = 0;
979 frag_info.fragmentationTimeDiff[part_idx] = 0;
980
981 encoded_complete_callback_->OnEncodedImage(encoded_image_, &codec_specific_,
982 &frag_info);
983 encoded_image_._length = 0;
Sergey Silkind902d582018-05-18 17:31:19 +0200984
985 if (end_of_picture) {
986 const uint32_t timestamp_ms =
987 1000 * encoded_image_._timeStamp / kVideoPayloadTypeFrequency;
988 output_framerate_.Update(1, timestamp_ms);
989 last_encoded_frame_rtp_timestamp_ = encoded_image_._timeStamp;
990 }
Sergey Silkin2a1f1832018-04-04 11:45:41 +0200991 }
992}
993
Sergey Silkind902d582018-05-18 17:31:19 +0200994bool VP9EncoderImpl::DropFrame(uint32_t rtp_timestamp) {
995 if (target_framerate_fps_) {
996 if (rtp_timestamp < last_encoded_frame_rtp_timestamp_) {
997 // Timestamp has wrapped around. Reset framerate statistic.
998 output_framerate_.Reset();
999 return false;
1000 }
1001
1002 const uint32_t timestamp_ms =
1003 1000 * rtp_timestamp / kVideoPayloadTypeFrequency;
1004 const uint32_t framerate_fps =
1005 output_framerate_.Rate(timestamp_ms).value_or(0);
1006 if (framerate_fps > *target_framerate_fps_) {
1007 return true;
1008 }
1009
1010 // Primarily check if frame interval is too short using frame timestamps,
1011 // as if they are correct they won't be affected by queuing in webrtc.
1012 const uint32_t expected_frame_interval =
1013 kVideoPayloadTypeFrequency / *target_framerate_fps_;
1014
1015 const uint32_t ts_diff = rtp_timestamp - last_encoded_frame_rtp_timestamp_;
1016 if (ts_diff < 85 * expected_frame_interval / 100) {
1017 return true;
1018 }
1019 }
1020
1021 return false;
1022}
1023
pkasting@chromium.org16825b12015-01-12 21:51:21 +00001024int VP9EncoderImpl::SetChannelParameters(uint32_t packet_loss, int64_t rtt) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001025 return WEBRTC_VIDEO_CODEC_OK;
1026}
1027
1028int VP9EncoderImpl::RegisterEncodeCompleteCallback(
1029 EncodedImageCallback* callback) {
1030 encoded_complete_callback_ = callback;
1031 return WEBRTC_VIDEO_CODEC_OK;
1032}
1033
Peter Boströmb7d9a972015-12-18 16:01:11 +01001034const char* VP9EncoderImpl::ImplementationName() const {
1035 return "libvpx";
1036}
1037
Magnus Jedvert46a27652017-11-13 14:10:02 +01001038std::unique_ptr<VP9Decoder> VP9Decoder::Create() {
Karl Wiberg918f50c2018-07-05 11:40:33 +02001039 return absl::make_unique<VP9DecoderImpl>();
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001040}
1041
1042VP9DecoderImpl::VP9DecoderImpl()
sprang3958ed82017-08-17 08:12:10 -07001043 : decode_complete_callback_(nullptr),
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001044 inited_(false),
sprang3958ed82017-08-17 08:12:10 -07001045 decoder_(nullptr),
philipel9d7d75b2018-04-04 13:03:01 +02001046 key_frame_required_(true) {}
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001047
1048VP9DecoderImpl::~VP9DecoderImpl() {
1049 inited_ = true; // in order to do the actual release
1050 Release();
Henrik Boström9695d852015-05-06 10:42:15 +02001051 int num_buffers_in_use = frame_buffer_pool_.GetNumBuffersInUse();
1052 if (num_buffers_in_use > 0) {
1053 // The frame buffers are reference counted and frames are exposed after
1054 // decoding. There may be valid usage cases where previous frames are still
1055 // referenced after ~VP9DecoderImpl that is not a leak.
Mirko Bonadei675513b2017-11-09 11:09:25 +01001056 RTC_LOG(LS_INFO) << num_buffers_in_use << " Vp9FrameBuffers are still "
1057 << "referenced during ~VP9DecoderImpl.";
Henrik Boström9695d852015-05-06 10:42:15 +02001058 }
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001059}
1060
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001061int VP9DecoderImpl::InitDecode(const VideoCodec* inst, int number_of_cores) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001062 int ret_val = Release();
1063 if (ret_val < 0) {
1064 return ret_val;
1065 }
sprang3958ed82017-08-17 08:12:10 -07001066 if (decoder_ == nullptr) {
pbos@webrtc.orge728ee02014-12-17 13:43:55 +00001067 decoder_ = new vpx_codec_ctx_t;
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001068 }
philipelcce46fc2015-12-21 03:04:49 -08001069 vpx_codec_dec_cfg_t cfg;
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001070 // Setting number of threads to a constant value (1)
1071 cfg.threads = 1;
1072 cfg.h = cfg.w = 0; // set after decode
1073 vpx_codec_flags_t flags = 0;
1074 if (vpx_codec_dec_init(decoder_, vpx_codec_vp9_dx(), &cfg, flags)) {
1075 return WEBRTC_VIDEO_CODEC_MEMORY;
1076 }
Henrik Boström9695d852015-05-06 10:42:15 +02001077
1078 if (!frame_buffer_pool_.InitializeVpxUsePool(decoder_)) {
1079 return WEBRTC_VIDEO_CODEC_MEMORY;
1080 }
1081
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001082 inited_ = true;
1083 // Always start with a complete key frame.
1084 key_frame_required_ = true;
1085 return WEBRTC_VIDEO_CODEC_OK;
1086}
1087
1088int VP9DecoderImpl::Decode(const EncodedImage& input_image,
1089 bool missing_frames,
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001090 const CodecSpecificInfo* codec_specific_info,
1091 int64_t /*render_time_ms*/) {
1092 if (!inited_) {
1093 return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
1094 }
sprang3958ed82017-08-17 08:12:10 -07001095 if (decode_complete_callback_ == nullptr) {
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001096 return WEBRTC_VIDEO_CODEC_UNINITIALIZED;
1097 }
1098 // Always start with a complete key frame.
1099 if (key_frame_required_) {
Peter Boström49e196a2015-10-23 15:58:18 +02001100 if (input_image._frameType != kVideoFrameKey)
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001101 return WEBRTC_VIDEO_CODEC_ERROR;
1102 // We have a key frame - is it complete?
1103 if (input_image._completeFrame) {
1104 key_frame_required_ = false;
1105 } else {
1106 return WEBRTC_VIDEO_CODEC_ERROR;
1107 }
1108 }
sprang3958ed82017-08-17 08:12:10 -07001109 vpx_codec_iter_t iter = nullptr;
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001110 vpx_image_t* img;
1111 uint8_t* buffer = input_image._buffer;
1112 if (input_image._length == 0) {
sprang3958ed82017-08-17 08:12:10 -07001113 buffer = nullptr; // Triggers full frame concealment.
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001114 }
Henrik Boström9695d852015-05-06 10:42:15 +02001115 // During decode libvpx may get and release buffers from |frame_buffer_pool_|.
1116 // In practice libvpx keeps a few (~3-4) buffers alive at a time.
philipelcce46fc2015-12-21 03:04:49 -08001117 if (vpx_codec_decode(decoder_, buffer,
1118 static_cast<unsigned int>(input_image._length), 0,
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001119 VPX_DL_REALTIME)) {
1120 return WEBRTC_VIDEO_CODEC_ERROR;
1121 }
Henrik Boström9695d852015-05-06 10:42:15 +02001122 // |img->fb_priv| contains the image data, a reference counted Vp9FrameBuffer.
1123 // It may be released by libvpx during future vpx_codec_decode or
1124 // vpx_codec_destroy calls.
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001125 img = vpx_codec_get_frame(decoder_, &iter);
sakal7adadb12017-02-23 02:54:57 -08001126 int qp;
1127 vpx_codec_err_t vpx_ret =
1128 vpx_codec_control(decoder_, VPXD_GET_LAST_QUANTIZER, &qp);
1129 RTC_DCHECK_EQ(vpx_ret, VPX_CODEC_OK);
1130 int ret =
1131 ReturnFrame(img, input_image._timeStamp, input_image.ntp_time_ms_, qp);
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001132 if (ret != 0) {
1133 return ret;
1134 }
1135 return WEBRTC_VIDEO_CODEC_OK;
1136}
1137
asapersson1490f7a2016-09-23 02:09:46 -07001138int VP9DecoderImpl::ReturnFrame(const vpx_image_t* img,
1139 uint32_t timestamp,
sakal7adadb12017-02-23 02:54:57 -08001140 int64_t ntp_time_ms,
1141 int qp) {
sprang3958ed82017-08-17 08:12:10 -07001142 if (img == nullptr) {
1143 // Decoder OK and nullptr image => No show frame.
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001144 return WEBRTC_VIDEO_CODEC_NO_OUTPUT;
1145 }
Henrik Boström9695d852015-05-06 10:42:15 +02001146
1147 // This buffer contains all of |img|'s image data, a reference counted
perkj14f41442015-11-30 22:15:45 -08001148 // Vp9FrameBuffer. (libvpx is done with the buffers after a few
Henrik Boström9695d852015-05-06 10:42:15 +02001149 // vpx_codec_decode calls or vpx_codec_destroy).
1150 Vp9FrameBufferPool::Vp9FrameBuffer* img_buffer =
1151 static_cast<Vp9FrameBufferPool::Vp9FrameBuffer*>(img->fb_priv);
Emircan Uysaler0823eec2018-07-13 17:10:00 -07001152
Miguel Casas-Sanchez47650702015-05-29 17:21:40 -07001153 // The buffer can be used directly by the VideoFrame (without copy) by
Emircan Uysaler0823eec2018-07-13 17:10:00 -07001154 // using a Wrapped*Buffer.
1155 rtc::scoped_refptr<VideoFrameBuffer> img_wrapped_buffer;
1156 switch (img->bit_depth) {
1157 case 8:
1158 img_wrapped_buffer = WrapI420Buffer(
philipelcce46fc2015-12-21 03:04:49 -08001159 img->d_w, img->d_h, img->planes[VPX_PLANE_Y],
1160 img->stride[VPX_PLANE_Y], img->planes[VPX_PLANE_U],
1161 img->stride[VPX_PLANE_U], img->planes[VPX_PLANE_V],
1162 img->stride[VPX_PLANE_V],
Henrik Boström9695d852015-05-06 10:42:15 +02001163 // WrappedI420Buffer's mechanism for allowing the release of its frame
1164 // buffer is through a callback function. This is where we should
1165 // release |img_buffer|.
Emircan Uysaler0823eec2018-07-13 17:10:00 -07001166 rtc::KeepRefUntilDone(img_buffer));
1167 break;
1168 case 10:
1169 img_wrapped_buffer = WrapI010Buffer(
1170 img->d_w, img->d_h,
1171 reinterpret_cast<const uint16_t*>(img->planes[VPX_PLANE_Y]),
1172 img->stride[VPX_PLANE_Y] / 2,
1173 reinterpret_cast<const uint16_t*>(img->planes[VPX_PLANE_U]),
1174 img->stride[VPX_PLANE_U] / 2,
1175 reinterpret_cast<const uint16_t*>(img->planes[VPX_PLANE_V]),
1176 img->stride[VPX_PLANE_V] / 2, rtc::KeepRefUntilDone(img_buffer));
1177 break;
1178 default:
1179 RTC_NOTREACHED();
1180 return WEBRTC_VIDEO_CODEC_NO_OUTPUT;
1181 }
nisseca6d5d12016-06-17 05:03:04 -07001182
Emircan Uysaler800787f2018-07-16 10:01:49 -07001183 ColorSpace::PrimaryID primaries = ColorSpace::PrimaryID::kInvalid;
1184 ColorSpace::TransferID transfer = ColorSpace::TransferID::kInvalid;
1185 ColorSpace::MatrixID matrix = ColorSpace::MatrixID::kInvalid;
1186 switch (img->cs) {
1187 case VPX_CS_BT_601:
1188 case VPX_CS_SMPTE_170:
1189 primaries = ColorSpace::PrimaryID::kSMPTE170M;
1190 transfer = ColorSpace::TransferID::kSMPTE170M;
1191 matrix = ColorSpace::MatrixID::kSMPTE170M;
1192 break;
1193 case VPX_CS_SMPTE_240:
1194 primaries = ColorSpace::PrimaryID::kSMPTE240M;
1195 transfer = ColorSpace::TransferID::kSMPTE240M;
1196 matrix = ColorSpace::MatrixID::kSMPTE240M;
1197 break;
1198 case VPX_CS_BT_709:
1199 primaries = ColorSpace::PrimaryID::kBT709;
1200 transfer = ColorSpace::TransferID::kBT709;
1201 matrix = ColorSpace::MatrixID::kBT709;
1202 break;
1203 case VPX_CS_BT_2020:
1204 primaries = ColorSpace::PrimaryID::kBT2020;
1205 switch (img->bit_depth) {
1206 case 8:
1207 transfer = ColorSpace::TransferID::kBT709;
1208 break;
1209 case 10:
1210 transfer = ColorSpace::TransferID::kBT2020_10;
1211 break;
1212 default:
1213 RTC_NOTREACHED();
1214 break;
1215 }
1216 matrix = ColorSpace::MatrixID::kBT2020_NCL;
1217 break;
1218 case VPX_CS_SRGB:
1219 primaries = ColorSpace::PrimaryID::kBT709;
1220 transfer = ColorSpace::TransferID::kIEC61966_2_1;
1221 matrix = ColorSpace::MatrixID::kBT709;
1222 break;
1223 default:
1224 break;
1225 }
1226
1227 ColorSpace::RangeID range = ColorSpace::RangeID::kInvalid;
1228 switch (img->range) {
1229 case VPX_CR_STUDIO_RANGE:
1230 range = ColorSpace::RangeID::kLimited;
1231 break;
1232 case VPX_CR_FULL_RANGE:
1233 range = ColorSpace::RangeID::kFull;
1234 break;
1235 default:
1236 break;
1237 }
1238
1239 VideoFrame decoded_image =
1240 VideoFrame::Builder()
1241 .set_video_frame_buffer(img_wrapped_buffer)
1242 .set_timestamp_ms(0)
1243 .set_timestamp_rtp(timestamp)
1244 .set_ntp_time_ms(ntp_time_ms)
1245 .set_rotation(webrtc::kVideoRotation_0)
1246 .set_color_space(ColorSpace(primaries, transfer, matrix, range))
1247 .build();
Danil Chapovalov0040b662018-06-18 10:48:16 +02001248 decode_complete_callback_->Decoded(decoded_image, absl::nullopt, qp);
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001249 return WEBRTC_VIDEO_CODEC_OK;
1250}
1251
1252int VP9DecoderImpl::RegisterDecodeCompleteCallback(
1253 DecodedImageCallback* callback) {
1254 decode_complete_callback_ = callback;
1255 return WEBRTC_VIDEO_CODEC_OK;
1256}
1257
1258int VP9DecoderImpl::Release() {
Sergey Silkin3e871ea2018-03-02 13:11:04 +01001259 int ret_val = WEBRTC_VIDEO_CODEC_OK;
1260
sprang3958ed82017-08-17 08:12:10 -07001261 if (decoder_ != nullptr) {
Sergey Silkin90399692018-03-02 14:44:10 +01001262 if (inited_) {
1263 // When a codec is destroyed libvpx will release any buffers of
1264 // |frame_buffer_pool_| it is currently using.
1265 if (vpx_codec_destroy(decoder_)) {
1266 ret_val = WEBRTC_VIDEO_CODEC_MEMORY;
1267 }
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001268 }
1269 delete decoder_;
sprang3958ed82017-08-17 08:12:10 -07001270 decoder_ = nullptr;
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001271 }
Henrik Boström9695d852015-05-06 10:42:15 +02001272 // Releases buffers from the pool. Any buffers not in use are deleted. Buffers
1273 // still referenced externally are deleted once fully released, not returning
1274 // to the pool.
1275 frame_buffer_pool_.ClearPool();
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001276 inited_ = false;
Sergey Silkin3e871ea2018-03-02 13:11:04 +01001277 return ret_val;
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001278}
Peter Boströmb7d9a972015-12-18 16:01:11 +01001279
1280const char* VP9DecoderImpl::ImplementationName() const {
1281 return "libvpx";
1282}
1283
marpan@webrtc.org5b883172014-11-01 06:10:48 +00001284} // namespace webrtc