webrtc/modules/video_coding/packet_buffer.cc - Issue 1903523003: Convert Vp9 Rtp headers to frame references.

Unified Diff: webrtc/modules/video_coding/packet_buffer.cc

Issue 1903523003: Convert Vp9 Rtp headers to frame references. (Closed) Base URL: https://chromium.googlesource.com/external/webrtc.git@master

Patch Set: Includes in alphabetical order. Created 4 years, 7 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: webrtc/modules/video_coding/packet_buffer.cc

diff --git a/webrtc/modules/video_coding/packet_buffer.cc b/webrtc/modules/video_coding/packet_buffer.cc

index d7b4f449e7be065f1bb2872678f0863f9fe0de56..71ab3e57d859fe20a5d518cb3a96856280c3fc1e 100644

--- a/webrtc/modules/video_coding/packet_buffer.cc

+++ b/webrtc/modules/video_coding/packet_buffer.cc

@@ -14,6 +14,7 @@

#include <limits>

#include "webrtc/base/checks.h"

+#include "webrtc/base/logging.h"

#include "webrtc/modules/video_coding/frame_object.h"

namespace webrtc {

@@ -31,7 +32,8 @@ PacketBuffer::PacketBuffer(size_t start_buffer_size,

sequence_buffer_(start_buffer_size),

frame_callback_(frame_callback),

last_picture_id_(-1),

- last_unwrap_(-1) {

+ last_unwrap_(-1),

+ current_ss_idx_(0) {

RTC_DCHECK_LE(start_buffer_size, max_buffer_size);

// Buffer size must always be a power of 2.

RTC_DCHECK((start_buffer_size & (start_buffer_size - 1)) == 0);

@@ -216,7 +218,7 @@ void PacketBuffer::ManageFrame(std::unique_ptr<RtpFrameObject> frame) {

ManageFrameVp8(std::move(frame));

break;

case kVideoCodecVP9:

- // TODO(philipel): ManageFrameVp9(std::move(frame));

+ ManageFrameVp9(std::move(frame));

break;

case kVideoCodecH264:

case kVideoCodecI420:

@@ -316,7 +318,7 @@ void PacketBuffer::ManageFrameVp8(std::unique_ptr<RtpFrameObject> frame) {

// Find if there has been a gap in fully received frames and save the picture

// id of those frames in |not_yet_received_frames_|.

- if (AheadOf<uint8_t, kPicIdLength>(frame->picture_id, last_picture_id_)) {

+ if (AheadOf<uint16_t, kPicIdLength>(frame->picture_id, last_picture_id_)) {

last_picture_id_ = Add<kPicIdLength>(last_picture_id_, 1);

while (last_picture_id_ != frame->picture_id) {

not_yet_received_frames_.insert(last_picture_id_);

@@ -386,10 +388,10 @@ void PacketBuffer::ManageFrameVp8(std::unique_ptr<RtpFrameObject> frame) {

auto not_received_frame_it =

not_yet_received_frames_.upper_bound(layer_info_it->second[layer]);

if (not_received_frame_it != not_yet_received_frames_.end() &&

- AheadOf<uint8_t, kPicIdLength>(frame->picture_id,

- *not_received_frame_it)) {

- stashed_frames_.emplace(std::move(frame));

- return;

+ AheadOf<uint16_t, kPicIdLength>(frame->picture_id,

+ *not_received_frame_it)) {

+ stashed_frames_.emplace(std::move(frame));

+ return;

}

++frame->num_references;

@@ -425,22 +427,228 @@ void PacketBuffer::CompletedFrameVp8(std::unique_ptr<RtpFrameObject> frame) {

}

not_yet_received_frames_.erase(frame->picture_id);

- for (size_t r = 0; r < frame->num_references; ++r)

- frame->references[r] = UnwrapPictureId(frame->references[r]);

+ for (size_t i = 0; i < frame->num_references; ++i)

+ frame->references[i] = UnwrapPictureId(frame->references[i]);

frame->picture_id = UnwrapPictureId(frame->picture_id);

frame_callback_->OnCompleteFrame(std::move(frame));

RetryStashedFrames();

}

-uint16_t PacketBuffer::UnwrapPictureId(uint16_t picture_id) {

+void PacketBuffer::ManageFrameVp9(std::unique_ptr<RtpFrameObject> frame) {

+ size_t index = frame->first_seq_num() % size_;

+ const VCMPacket& packet = data_buffer_[index];

+ const RTPVideoHeaderVP9& codec_header =

+ packet.codecSpecificHeader.codecHeader.VP9;

+ if (codec_header.picture_id == kNoPictureId) {

+ ManageFrameGeneric(std::move(frame));

+ return;

+ }

+ frame->spatial_layer = codec_header.spatial_idx;

+ frame->inter_layer_predicted = codec_header.inter_layer_predicted;

+ frame->picture_id = codec_header.picture_id % kPicIdLength;

if (last_unwrap_ == -1)

- last_unwrap_ = picture_id;

+ last_unwrap_ = codec_header.picture_id;

+ if (last_picture_id_ == -1)

+ last_picture_id_ = frame->picture_id;

+ if (codec_header.flexible_mode) {

+ frame->num_references = codec_header.num_ref_pics;

+ for (size_t i = 0; i < frame->num_references; ++i) {

+ frame->references[i] =

+ Subtract<1 << 16>(frame->picture_id, codec_header.pid_diff[i]);

+ }

+ CompletedFrameVp9(std::move(frame));

+ return;

+ }

+ if (codec_header.ss_data_available) {

+ // Scalability structures can only be sent with tl0 frames.

+ if (codec_header.temporal_idx != 0) {

+ LOG(LS_WARNING) << "Received scalability structure on a non base layer"

+ " frame. Scalability structure ignored.";

+ } else {

+ current_ss_idx_ = Add<kMaxGofSaved>(current_ss_idx_, 1);

+ scalability_structures_[current_ss_idx_] = codec_header.gof;

+ scalability_structures_[current_ss_idx_].pid_start = frame->picture_id;

+ auto pid_and_gof = std::make_pair(

+ frame->picture_id, &scalability_structures_[current_ss_idx_]);

+ gof_info_.insert(std::make_pair(codec_header.tl0_pic_idx, pid_and_gof));

+ }

+ // Clean up info for base layers that are too old.

+ uint8_t old_tl0_pic_idx = codec_header.tl0_pic_idx - kMaxGofSaved;

+ auto clean_gof_info_to = gof_info_.lower_bound(old_tl0_pic_idx);

+ gof_info_.erase(gof_info_.begin(), clean_gof_info_to);

+ if (packet.frameType == kVideoFrameKey) {

+ // When using GOF all keyframes must include the scalability structure.

+ if (!codec_header.ss_data_available)

+ LOG(LS_WARNING) << "Received keyframe without scalability structure";

+ frame->num_references = 0;

+ GofInfoVP9* gof = gof_info_.find(codec_header.tl0_pic_idx)->second.second;

+ FrameReceivedVp9(frame->picture_id, *gof);

+ CompletedFrameVp9(std::move(frame));

+ return;

+ }

+ auto gof_info_it = gof_info_.find(

+ (codec_header.temporal_idx == 0 && !codec_header.ss_data_available)

+ ? codec_header.tl0_pic_idx - 1

+ : codec_header.tl0_pic_idx);

+ // Gof info for this frame is not available yet, stash this frame.

+ if (gof_info_it == gof_info_.end()) {

+ stashed_frames_.emplace(std::move(frame));

+ return;

+ }

+ GofInfoVP9* gof = gof_info_it->second.second;

+ uint16_t picture_id_tl0 = gof_info_it->second.first;

+ FrameReceivedVp9(frame->picture_id, *gof);

+ // Make sure we don't miss any frame that could potentially have the

+ // up switch flag set.

+ if (MissingRequiredFrameVp9(frame->picture_id, *gof)) {

+ stashed_frames_.emplace(std::move(frame));

+ return;

+ }

+ if (codec_header.temporal_up_switch) {

+ auto pid_tidx =

+ std::make_pair(frame->picture_id, codec_header.temporal_idx);

+ up_switch_.insert(pid_tidx);

+ }

+ // If this is a base layer frame that contains a scalability structure

+ // then gof info has already been inserted earlier, so we only want to

+ // insert if we haven't done so already.

+ if (codec_header.temporal_idx == 0 && !codec_header.ss_data_available) {

+ auto pid_and_gof = std::make_pair(frame->picture_id, gof);

+ gof_info_.insert(std::make_pair(codec_header.tl0_pic_idx, pid_and_gof));

+ }

+ // Clean out old info about up switch frames.

+ uint16_t old_picture_id = Subtract<kPicIdLength>(last_picture_id_, 50);

+ auto up_switch_erase_to = up_switch_.lower_bound(old_picture_id);

+ up_switch_.erase(up_switch_.begin(), up_switch_erase_to);

+ RTC_DCHECK(

+ (AheadOrAt<uint16_t, kPicIdLength>(frame->picture_id, picture_id_tl0)));

+ size_t diff =

+ ForwardDiff<uint16_t, kPicIdLength>(gof->pid_start, frame->picture_id);

+ size_t gof_idx = diff % gof->num_frames_in_gof;

+ // Populate references according to the scalability structure.

+ frame->num_references = gof->num_ref_pics[gof_idx];

+ for (size_t i = 0; i < frame->num_references; ++i) {

+ frame->references[i] =

+ Subtract<kPicIdLength>(frame->picture_id, gof->pid_diff[gof_idx][i]);

+ // If this is a reference to a frame earlier than the last up switch point,

+ // then ignore this reference.

+ if (UpSwitchInIntervalVp9(frame->picture_id, codec_header.temporal_idx,

+ frame->references[i])) {

+ --frame->num_references;

+ }

+ CompletedFrameVp9(std::move(frame));

+bool PacketBuffer::MissingRequiredFrameVp9(uint16_t picture_id,

+ const GofInfoVP9& gof) {

+ size_t diff = ForwardDiff<uint16_t, kPicIdLength>(gof.pid_start, picture_id);

+ size_t gof_idx = diff % gof.num_frames_in_gof;

+ size_t temporal_idx = gof.temporal_idx[gof_idx];

+ // For every reference this frame has, check if there is a frame missing in

+ // the interval (|ref_pid|, |picture_id|) in any of the lower temporal

+ // layers. If so, we are missing a required frame.

+ uint8_t num_references = gof.num_ref_pics[gof_idx];

+ for (size_t i = 0; i < num_references; ++i) {

+ uint16_t ref_pid =

+ Subtract<kPicIdLength>(picture_id, gof.pid_diff[gof_idx][i]);

+ for (size_t l = 0; l < temporal_idx; ++l) {

+ auto missing_frame_it = missing_frames_for_layer_[l].lower_bound(ref_pid);

+ if (missing_frame_it != missing_frames_for_layer_[l].end() &&

+ AheadOf<uint16_t, kPicIdLength>(picture_id, *missing_frame_it)) {

+ return true;

+ }

+ return false;

+void PacketBuffer::FrameReceivedVp9(uint16_t picture_id,

+ const GofInfoVP9& gof) {

+ RTC_DCHECK_NE(-1, last_picture_id_);

+ // If there is a gap, find which temporal layer the missing frames

+ // belong to and add the frame as missing for that temporal layer.

+ // Otherwise, remove this frame from the set of missing frames.

+ if (AheadOf<uint16_t, kPicIdLength>(picture_id, last_picture_id_)) {

+ size_t diff =

+ ForwardDiff<uint16_t, kPicIdLength>(gof.pid_start, last_picture_id_);

+ size_t gof_idx = diff % gof.num_frames_in_gof;

+ last_picture_id_ = Add<kPicIdLength>(last_picture_id_, 1);

+ while (last_picture_id_ != picture_id) {

+ ++gof_idx;

+ RTC_DCHECK_NE(0ul, gof_idx % gof.num_frames_in_gof);

+ size_t temporal_idx = gof.temporal_idx[gof_idx];

+ missing_frames_for_layer_[temporal_idx].insert(last_picture_id_);

+ last_picture_id_ = Add<kPicIdLength>(last_picture_id_, 1);

+ }

+ } else {

+ size_t diff =

+ ForwardDiff<uint16_t, kPicIdLength>(gof.pid_start, picture_id);

+ size_t gof_idx = diff % gof.num_frames_in_gof;

+ size_t temporal_idx = gof.temporal_idx[gof_idx];

+ missing_frames_for_layer_[temporal_idx].erase(picture_id);

+ }

+bool PacketBuffer::UpSwitchInIntervalVp9(uint16_t picture_id,

+ uint8_t temporal_idx,

+ uint16_t pid_ref) {

+ for (auto up_switch_it = up_switch_.upper_bound(pid_ref);

+ up_switch_it != up_switch_.end() &&

+ AheadOf<uint16_t, kPicIdLength>(picture_id, up_switch_it->first);

+ ++up_switch_it) {

+ if (up_switch_it->second < temporal_idx)

+ return true;

+ }

+ return false;

+void PacketBuffer::CompletedFrameVp9(std::unique_ptr<RtpFrameObject> frame) {

+ for (size_t i = 0; i < frame->num_references; ++i)

+ frame->references[i] = UnwrapPictureId(frame->references[i]);

+ frame->picture_id = UnwrapPictureId(frame->picture_id);

+ frame_callback_->OnCompleteFrame(std::move(frame));

+ RetryStashedFrames();

+uint16_t PacketBuffer::UnwrapPictureId(uint16_t picture_id) {

+ RTC_DCHECK_NE(-1, last_unwrap_);

uint16_t unwrap_truncated = last_unwrap_ % kPicIdLength;

- uint16_t diff = MinDiff<uint8_t, kPicIdLength>(unwrap_truncated, picture_id);

+ uint16_t diff = MinDiff<uint16_t, kPicIdLength>(unwrap_truncated, picture_id);

- if (AheadOf<uint8_t, kPicIdLength>(picture_id, unwrap_truncated))

+ if (AheadOf<uint16_t, kPicIdLength>(picture_id, unwrap_truncated))

last_unwrap_ = Add<1 << 16>(last_unwrap_, diff);

else

last_unwrap_ = Subtract<1 << 16>(last_unwrap_, diff);

« no previous file with comments | « webrtc/modules/video_coding/packet_buffer.h ('k') | webrtc/modules/video_coding/packet_buffer_unittest.cc » ('j') | no next file with comments »