blob: 93ef6548e5bb4fd5b86f6137873f6d54e8b47e1c [file] [log] [blame]
Stefan Holmerf7044682018-07-17 10:16:41 +02001/*
2 * Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11#include "call/rtp_payload_params.h"
12
Yves Gerey3e707812018-11-28 16:47:49 +010013#include <stddef.h>
Elad Alonf5b216a2019-01-28 14:25:17 +010014#include <algorithm>
Yves Gerey3e707812018-11-28 16:47:49 +010015
16#include "absl/container/inlined_vector.h"
Yves Gerey3e707812018-11-28 16:47:49 +010017#include "absl/types/variant.h"
18#include "api/video/video_timing.h"
19#include "common_types.h" // NOLINT(build/include)
20#include "modules/video_coding/codecs/h264/include/h264_globals.h"
21#include "modules/video_coding/codecs/interface/common_constants.h"
22#include "modules/video_coding/codecs/vp8/include/vp8_globals.h"
23#include "modules/video_coding/codecs/vp9/include/vp9_globals.h"
Elad Alonf5b216a2019-01-28 14:25:17 +010024#include "rtc_base/arraysize.h"
Stefan Holmerf7044682018-07-17 10:16:41 +020025#include "rtc_base/checks.h"
philipelbf2b6202018-08-27 14:33:18 +020026#include "rtc_base/logging.h"
Stefan Holmerf7044682018-07-17 10:16:41 +020027#include "rtc_base/random.h"
Steve Anton10542f22019-01-11 09:11:00 -080028#include "rtc_base/time_utils.h"
philipelbf2b6202018-08-27 14:33:18 +020029#include "system_wrappers/include/field_trial.h"
Stefan Holmerf7044682018-07-17 10:16:41 +020030
31namespace webrtc {
32
33namespace {
34void PopulateRtpWithCodecSpecifics(const CodecSpecificInfo& info,
Niels Möllerd3b8c632018-08-27 15:33:42 +020035 absl::optional<int> spatial_index,
Stefan Holmerf7044682018-07-17 10:16:41 +020036 RTPVideoHeader* rtp) {
37 rtp->codec = info.codecType;
38 switch (info.codecType) {
39 case kVideoCodecVP8: {
Philip Eliassond52a1a62018-09-07 13:03:55 +000040 auto& vp8_header = rtp->video_type_header.emplace<RTPVideoHeaderVP8>();
41 vp8_header.InitRTPVideoHeaderVP8();
42 vp8_header.nonReference = info.codecSpecific.VP8.nonReference;
43 vp8_header.temporalIdx = info.codecSpecific.VP8.temporalIdx;
44 vp8_header.layerSync = info.codecSpecific.VP8.layerSync;
45 vp8_header.keyIdx = info.codecSpecific.VP8.keyIdx;
Niels Möllerd3b8c632018-08-27 15:33:42 +020046 rtp->simulcastIdx = spatial_index.value_or(0);
Stefan Holmerf7044682018-07-17 10:16:41 +020047 return;
48 }
49 case kVideoCodecVP9: {
philipel29d88462018-08-08 14:26:00 +020050 auto& vp9_header = rtp->video_type_header.emplace<RTPVideoHeaderVP9>();
51 vp9_header.InitRTPVideoHeaderVP9();
52 vp9_header.inter_pic_predicted =
Stefan Holmerf7044682018-07-17 10:16:41 +020053 info.codecSpecific.VP9.inter_pic_predicted;
philipel29d88462018-08-08 14:26:00 +020054 vp9_header.flexible_mode = info.codecSpecific.VP9.flexible_mode;
55 vp9_header.ss_data_available = info.codecSpecific.VP9.ss_data_available;
56 vp9_header.non_ref_for_inter_layer_pred =
Stefan Holmerf7044682018-07-17 10:16:41 +020057 info.codecSpecific.VP9.non_ref_for_inter_layer_pred;
philipel29d88462018-08-08 14:26:00 +020058 vp9_header.temporal_idx = info.codecSpecific.VP9.temporal_idx;
philipel29d88462018-08-08 14:26:00 +020059 vp9_header.temporal_up_switch = info.codecSpecific.VP9.temporal_up_switch;
60 vp9_header.inter_layer_predicted =
Stefan Holmerf7044682018-07-17 10:16:41 +020061 info.codecSpecific.VP9.inter_layer_predicted;
philipel29d88462018-08-08 14:26:00 +020062 vp9_header.gof_idx = info.codecSpecific.VP9.gof_idx;
63 vp9_header.num_spatial_layers = info.codecSpecific.VP9.num_spatial_layers;
Niels Möllerd3b8c632018-08-27 15:33:42 +020064 if (vp9_header.num_spatial_layers > 1) {
65 vp9_header.spatial_idx = spatial_index.value_or(kNoSpatialIdx);
66 } else {
67 vp9_header.spatial_idx = kNoSpatialIdx;
68 }
Stefan Holmerf7044682018-07-17 10:16:41 +020069 if (info.codecSpecific.VP9.ss_data_available) {
philipel29d88462018-08-08 14:26:00 +020070 vp9_header.spatial_layer_resolution_present =
Stefan Holmerf7044682018-07-17 10:16:41 +020071 info.codecSpecific.VP9.spatial_layer_resolution_present;
72 if (info.codecSpecific.VP9.spatial_layer_resolution_present) {
73 for (size_t i = 0; i < info.codecSpecific.VP9.num_spatial_layers;
74 ++i) {
philipel29d88462018-08-08 14:26:00 +020075 vp9_header.width[i] = info.codecSpecific.VP9.width[i];
76 vp9_header.height[i] = info.codecSpecific.VP9.height[i];
Stefan Holmerf7044682018-07-17 10:16:41 +020077 }
78 }
philipel29d88462018-08-08 14:26:00 +020079 vp9_header.gof.CopyGofInfoVP9(info.codecSpecific.VP9.gof);
Stefan Holmerf7044682018-07-17 10:16:41 +020080 }
81
philipel29d88462018-08-08 14:26:00 +020082 vp9_header.num_ref_pics = info.codecSpecific.VP9.num_ref_pics;
Stefan Holmerf7044682018-07-17 10:16:41 +020083 for (int i = 0; i < info.codecSpecific.VP9.num_ref_pics; ++i) {
philipel29d88462018-08-08 14:26:00 +020084 vp9_header.pid_diff[i] = info.codecSpecific.VP9.p_diff[i];
Stefan Holmerf7044682018-07-17 10:16:41 +020085 }
philipel29d88462018-08-08 14:26:00 +020086 vp9_header.end_of_picture = info.codecSpecific.VP9.end_of_picture;
Stefan Holmerf7044682018-07-17 10:16:41 +020087 return;
88 }
89 case kVideoCodecH264: {
philipel7d745e52018-08-02 14:03:53 +020090 auto& h264_header = rtp->video_type_header.emplace<RTPVideoHeaderH264>();
91 h264_header.packetization_mode =
Stefan Holmerf7044682018-07-17 10:16:41 +020092 info.codecSpecific.H264.packetization_mode;
Niels Möllerd3b8c632018-08-27 15:33:42 +020093 rtp->simulcastIdx = spatial_index.value_or(0);
Stefan Holmerf7044682018-07-17 10:16:41 +020094 return;
95 }
96 case kVideoCodecMultiplex:
97 case kVideoCodecGeneric:
98 rtp->codec = kVideoCodecGeneric;
Niels Möllerd3b8c632018-08-27 15:33:42 +020099 rtp->simulcastIdx = spatial_index.value_or(0);
Stefan Holmerf7044682018-07-17 10:16:41 +0200100 return;
101 default:
102 return;
103 }
104}
105
106void SetVideoTiming(const EncodedImage& image, VideoSendTiming* timing) {
107 if (image.timing_.flags == VideoSendTiming::TimingFrameFlags::kInvalid ||
108 image.timing_.flags == VideoSendTiming::TimingFrameFlags::kNotTriggered) {
109 timing->flags = VideoSendTiming::TimingFrameFlags::kInvalid;
110 return;
111 }
112
113 timing->encode_start_delta_ms = VideoSendTiming::GetDeltaCappedMs(
114 image.capture_time_ms_, image.timing_.encode_start_ms);
115 timing->encode_finish_delta_ms = VideoSendTiming::GetDeltaCappedMs(
116 image.capture_time_ms_, image.timing_.encode_finish_ms);
117 timing->packetization_finish_delta_ms = 0;
118 timing->pacer_exit_delta_ms = 0;
119 timing->network_timestamp_delta_ms = 0;
120 timing->network2_timestamp_delta_ms = 0;
121 timing->flags = image.timing_.flags;
122}
123} // namespace
124
125RtpPayloadParams::RtpPayloadParams(const uint32_t ssrc,
126 const RtpPayloadState* state)
philipelbf2b6202018-08-27 14:33:18 +0200127 : ssrc_(ssrc),
128 generic_picture_id_experiment_(
philipel569397f2018-09-26 12:25:31 +0200129 field_trial::IsEnabled("WebRTC-GenericPictureId")),
130 generic_descriptor_experiment_(
131 field_trial::IsEnabled("WebRTC-GenericDescriptor")) {
philipelbf2b6202018-08-27 14:33:18 +0200132 for (auto& spatial_layer : last_shared_frame_id_)
133 spatial_layer.fill(-1);
134
Elad Alonf5b216a2019-01-28 14:25:17 +0100135 buffer_id_to_frame_id_.fill(-1);
136
Stefan Holmerf7044682018-07-17 10:16:41 +0200137 Random random(rtc::TimeMicros());
138 state_.picture_id =
139 state ? state->picture_id : (random.Rand<int16_t>() & 0x7FFF);
140 state_.tl0_pic_idx = state ? state->tl0_pic_idx : (random.Rand<uint8_t>());
141}
philipelbf2b6202018-08-27 14:33:18 +0200142
143RtpPayloadParams::RtpPayloadParams(const RtpPayloadParams& other) = default;
144
Stefan Holmerf7044682018-07-17 10:16:41 +0200145RtpPayloadParams::~RtpPayloadParams() {}
146
147RTPVideoHeader RtpPayloadParams::GetRtpVideoHeader(
148 const EncodedImage& image,
philipelbf2b6202018-08-27 14:33:18 +0200149 const CodecSpecificInfo* codec_specific_info,
150 int64_t shared_frame_id) {
Stefan Holmerf7044682018-07-17 10:16:41 +0200151 RTPVideoHeader rtp_video_header;
152 if (codec_specific_info) {
Niels Möllerd3b8c632018-08-27 15:33:42 +0200153 PopulateRtpWithCodecSpecifics(*codec_specific_info, image.SpatialIndex(),
154 &rtp_video_header);
Stefan Holmerf7044682018-07-17 10:16:41 +0200155 }
156 rtp_video_header.rotation = image.rotation_;
157 rtp_video_header.content_type = image.content_type_;
158 rtp_video_header.playout_delay = image.playout_delay_;
philipelfab91292018-10-17 14:36:08 +0200159 rtp_video_header.width = image._encodedWidth;
160 rtp_video_header.height = image._encodedHeight;
Johannes Krond0b69a82018-12-03 14:18:53 +0100161 rtp_video_header.color_space = image.ColorSpace()
162 ? absl::make_optional(*image.ColorSpace())
163 : absl::nullopt;
Stefan Holmerf7044682018-07-17 10:16:41 +0200164 SetVideoTiming(image, &rtp_video_header.video_timing);
165
philipelbf2b6202018-08-27 14:33:18 +0200166 const bool is_keyframe = image._frameType == kVideoFrameKey;
Stefan Holmerf7044682018-07-17 10:16:41 +0200167 const bool first_frame_in_picture =
168 (codec_specific_info && codec_specific_info->codecType == kVideoCodecVP9)
169 ? codec_specific_info->codecSpecific.VP9.first_frame_in_picture
170 : true;
philipelbf2b6202018-08-27 14:33:18 +0200171
172 SetCodecSpecific(&rtp_video_header, first_frame_in_picture);
philipel569397f2018-09-26 12:25:31 +0200173
174 if (generic_descriptor_experiment_)
Elad Alonf5b216a2019-01-28 14:25:17 +0100175 SetGeneric(codec_specific_info, shared_frame_id, is_keyframe,
176 &rtp_video_header);
philipelbf2b6202018-08-27 14:33:18 +0200177
Stefan Holmerf7044682018-07-17 10:16:41 +0200178 return rtp_video_header;
179}
180
181uint32_t RtpPayloadParams::ssrc() const {
182 return ssrc_;
183}
184
185RtpPayloadState RtpPayloadParams::state() const {
186 return state_;
187}
188
philipelbf2b6202018-08-27 14:33:18 +0200189void RtpPayloadParams::SetCodecSpecific(RTPVideoHeader* rtp_video_header,
190 bool first_frame_in_picture) {
Stefan Holmerf7044682018-07-17 10:16:41 +0200191 // Always set picture id. Set tl0_pic_idx iff temporal index is set.
192 if (first_frame_in_picture) {
193 state_.picture_id = (static_cast<uint16_t>(state_.picture_id) + 1) & 0x7FFF;
194 }
195 if (rtp_video_header->codec == kVideoCodecVP8) {
Philip Eliassond52a1a62018-09-07 13:03:55 +0000196 auto& vp8_header =
197 absl::get<RTPVideoHeaderVP8>(rtp_video_header->video_type_header);
198 vp8_header.pictureId = state_.picture_id;
Stefan Holmerf7044682018-07-17 10:16:41 +0200199
Philip Eliassond52a1a62018-09-07 13:03:55 +0000200 if (vp8_header.temporalIdx != kNoTemporalIdx) {
201 if (vp8_header.temporalIdx == 0) {
Stefan Holmerf7044682018-07-17 10:16:41 +0200202 ++state_.tl0_pic_idx;
203 }
Philip Eliassond52a1a62018-09-07 13:03:55 +0000204 vp8_header.tl0PicIdx = state_.tl0_pic_idx;
Stefan Holmerf7044682018-07-17 10:16:41 +0200205 }
206 }
207 if (rtp_video_header->codec == kVideoCodecVP9) {
philipel29d88462018-08-08 14:26:00 +0200208 auto& vp9_header =
209 absl::get<RTPVideoHeaderVP9>(rtp_video_header->video_type_header);
210 vp9_header.picture_id = state_.picture_id;
Stefan Holmerf7044682018-07-17 10:16:41 +0200211
212 // Note that in the case that we have no temporal layers but we do have
213 // spatial layers, packets will carry layering info with a temporal_idx of
214 // zero, and we then have to set and increment tl0_pic_idx.
philipel29d88462018-08-08 14:26:00 +0200215 if (vp9_header.temporal_idx != kNoTemporalIdx ||
216 vp9_header.spatial_idx != kNoSpatialIdx) {
Stefan Holmerf7044682018-07-17 10:16:41 +0200217 if (first_frame_in_picture &&
philipel29d88462018-08-08 14:26:00 +0200218 (vp9_header.temporal_idx == 0 ||
219 vp9_header.temporal_idx == kNoTemporalIdx)) {
Stefan Holmerf7044682018-07-17 10:16:41 +0200220 ++state_.tl0_pic_idx;
221 }
philipel29d88462018-08-08 14:26:00 +0200222 vp9_header.tl0_pic_idx = state_.tl0_pic_idx;
Stefan Holmerf7044682018-07-17 10:16:41 +0200223 }
224 }
philipelbf2b6202018-08-27 14:33:18 +0200225 // There are currently two generic descriptors in WebRTC. The old descriptor
226 // can not share a picture id space between simulcast streams, so we use the
227 // |picture_id| in this case. We let the |picture_id| tag along in |frame_id|
228 // until the old generic format can be removed.
229 // TODO(philipel): Remove this when the new generic format has been fully
230 // implemented.
231 if (generic_picture_id_experiment_ &&
232 rtp_video_header->codec == kVideoCodecGeneric) {
233 rtp_video_header->generic.emplace().frame_id = state_.picture_id;
234 }
Stefan Holmerf7044682018-07-17 10:16:41 +0200235}
philipelbf2b6202018-08-27 14:33:18 +0200236
Elad Alonf5b216a2019-01-28 14:25:17 +0100237void RtpPayloadParams::SetGeneric(const CodecSpecificInfo* codec_specific_info,
238 int64_t frame_id,
philipelbf2b6202018-08-27 14:33:18 +0200239 bool is_keyframe,
240 RTPVideoHeader* rtp_video_header) {
Elad Alonf5b216a2019-01-28 14:25:17 +0100241 switch (rtp_video_header->codec) {
242 case VideoCodecType::kVideoCodecGeneric:
243 // TODO(philipel): Implement generic codec to new generic descriptor.
244 return;
245 case VideoCodecType::kVideoCodecVP8:
246 if (codec_specific_info) {
247 Vp8ToGeneric(codec_specific_info->codecSpecific.VP8, frame_id,
248 is_keyframe, rtp_video_header);
249 }
250 return;
251 case VideoCodecType::kVideoCodecVP9:
252 // TODO(philipel): Implement VP9 to new generic descriptor.
253 return;
254 case VideoCodecType::kVideoCodecH264:
255 // TODO(philipel): Implement H264 to new generic descriptor.
256 case VideoCodecType::kVideoCodecMultiplex:
257 return;
philipelbf2b6202018-08-27 14:33:18 +0200258 }
Elad Alonf5b216a2019-01-28 14:25:17 +0100259 RTC_NOTREACHED() << "Unsupported codec.";
philipelbf2b6202018-08-27 14:33:18 +0200260}
261
Elad Alonf5b216a2019-01-28 14:25:17 +0100262void RtpPayloadParams::Vp8ToGeneric(const CodecSpecificInfoVP8& vp8_info,
263 int64_t shared_frame_id,
philipelbf2b6202018-08-27 14:33:18 +0200264 bool is_keyframe,
265 RTPVideoHeader* rtp_video_header) {
266 const auto& vp8_header =
267 absl::get<RTPVideoHeaderVP8>(rtp_video_header->video_type_header);
268 const int spatial_index = 0;
269 const int temporal_index =
270 vp8_header.temporalIdx != kNoTemporalIdx ? vp8_header.temporalIdx : 0;
271
272 if (temporal_index >= RtpGenericFrameDescriptor::kMaxTemporalLayers ||
273 spatial_index >= RtpGenericFrameDescriptor::kMaxSpatialLayers) {
274 RTC_LOG(LS_WARNING) << "Temporal and/or spatial index is too high to be "
275 "used with generic frame descriptor.";
276 return;
277 }
278
279 RTPVideoHeader::GenericDescriptorInfo& generic =
280 rtp_video_header->generic.emplace();
281
282 generic.frame_id = shared_frame_id;
283 generic.spatial_index = spatial_index;
284 generic.temporal_index = temporal_index;
285
Elad Alonf5b216a2019-01-28 14:25:17 +0100286 if (vp8_info.useExplicitDependencies) {
287 SetDependenciesVp8New(vp8_info, shared_frame_id, is_keyframe,
288 vp8_header.layerSync, &generic);
289 } else {
290 SetDependenciesVp8Deprecated(vp8_info, shared_frame_id, is_keyframe,
291 spatial_index, temporal_index,
292 vp8_header.layerSync, &generic);
293 }
294}
295
296void RtpPayloadParams::SetDependenciesVp8Deprecated(
297 const CodecSpecificInfoVP8& vp8_info,
298 int64_t shared_frame_id,
299 bool is_keyframe,
300 int spatial_index,
301 int temporal_index,
302 bool layer_sync,
303 RTPVideoHeader::GenericDescriptorInfo* generic) {
304 RTC_DCHECK(!vp8_info.useExplicitDependencies);
305 RTC_DCHECK(!new_version_used_.has_value() || !new_version_used_.value());
306 new_version_used_ = false;
307
philipelbf2b6202018-08-27 14:33:18 +0200308 if (is_keyframe) {
309 RTC_DCHECK_EQ(temporal_index, 0);
310 last_shared_frame_id_[spatial_index].fill(-1);
311 last_shared_frame_id_[spatial_index][temporal_index] = shared_frame_id;
312 return;
313 }
314
Elad Alonf5b216a2019-01-28 14:25:17 +0100315 if (layer_sync) {
philipelbf2b6202018-08-27 14:33:18 +0200316 int64_t tl0_frame_id = last_shared_frame_id_[spatial_index][0];
317
318 for (int i = 1; i < RtpGenericFrameDescriptor::kMaxTemporalLayers; ++i) {
319 if (last_shared_frame_id_[spatial_index][i] < tl0_frame_id) {
320 last_shared_frame_id_[spatial_index][i] = -1;
321 }
322 }
323
324 RTC_DCHECK_GE(tl0_frame_id, 0);
325 RTC_DCHECK_LT(tl0_frame_id, shared_frame_id);
Elad Alonf5b216a2019-01-28 14:25:17 +0100326 generic->dependencies.push_back(tl0_frame_id);
philipelbf2b6202018-08-27 14:33:18 +0200327 } else {
328 for (int i = 0; i <= temporal_index; ++i) {
329 int64_t frame_id = last_shared_frame_id_[spatial_index][i];
330
331 if (frame_id != -1) {
332 RTC_DCHECK_LT(frame_id, shared_frame_id);
Elad Alonf5b216a2019-01-28 14:25:17 +0100333 generic->dependencies.push_back(frame_id);
philipelbf2b6202018-08-27 14:33:18 +0200334 }
335 }
336 }
337
338 last_shared_frame_id_[spatial_index][temporal_index] = shared_frame_id;
339}
340
Elad Alonf5b216a2019-01-28 14:25:17 +0100341void RtpPayloadParams::SetDependenciesVp8New(
342 const CodecSpecificInfoVP8& vp8_info,
343 int64_t shared_frame_id,
344 bool is_keyframe,
345 bool layer_sync,
346 RTPVideoHeader::GenericDescriptorInfo* generic) {
347 RTC_DCHECK(vp8_info.useExplicitDependencies);
348 RTC_DCHECK(!new_version_used_.has_value() || new_version_used_.value());
349 new_version_used_ = true;
350
351 if (is_keyframe) {
352 RTC_DCHECK_EQ(vp8_info.referencedBuffersCount, 0u);
353 buffer_id_to_frame_id_.fill(shared_frame_id);
354 return;
355 }
356
357 constexpr size_t kBuffersCountVp8 = CodecSpecificInfoVP8::kBuffersCount;
358
359 RTC_DCHECK_GT(vp8_info.referencedBuffersCount, 0u);
360 RTC_DCHECK_LE(vp8_info.referencedBuffersCount,
361 arraysize(vp8_info.referencedBuffers));
362
363 for (size_t i = 0; i < vp8_info.referencedBuffersCount; ++i) {
364 const size_t referenced_buffer = vp8_info.referencedBuffers[i];
365 RTC_DCHECK_LT(referenced_buffer, kBuffersCountVp8);
366 RTC_DCHECK_LT(referenced_buffer, buffer_id_to_frame_id_.size());
367
368 const int64_t dependency_frame_id =
369 buffer_id_to_frame_id_[referenced_buffer];
370 RTC_DCHECK_GE(dependency_frame_id, 0);
371 RTC_DCHECK_LT(dependency_frame_id, shared_frame_id);
372
373 const bool is_new_dependency =
374 std::find(generic->dependencies.begin(), generic->dependencies.end(),
375 dependency_frame_id) == generic->dependencies.end();
376 if (is_new_dependency) {
377 generic->dependencies.push_back(dependency_frame_id);
378 }
379 }
380
381 RTC_DCHECK_LE(vp8_info.updatedBuffersCount, kBuffersCountVp8);
382 for (size_t i = 0; i < vp8_info.updatedBuffersCount; ++i) {
383 const size_t updated_id = vp8_info.updatedBuffers[i];
384 buffer_id_to_frame_id_[updated_id] = shared_frame_id;
385 }
386
387 RTC_DCHECK_LE(buffer_id_to_frame_id_.size(), kBuffersCountVp8);
388}
389
Stefan Holmerf7044682018-07-17 10:16:41 +0200390} // namespace webrtc