| Index: webrtc/modules/video_coding/packet_buffer.cc
|
| diff --git a/webrtc/modules/video_coding/packet_buffer.cc b/webrtc/modules/video_coding/packet_buffer.cc
|
| index d7b4f449e7be065f1bb2872678f0863f9fe0de56..71ab3e57d859fe20a5d518cb3a96856280c3fc1e 100644
|
| --- a/webrtc/modules/video_coding/packet_buffer.cc
|
| +++ b/webrtc/modules/video_coding/packet_buffer.cc
|
| @@ -14,6 +14,7 @@
|
| #include <limits>
|
|
|
| #include "webrtc/base/checks.h"
|
| +#include "webrtc/base/logging.h"
|
| #include "webrtc/modules/video_coding/frame_object.h"
|
|
|
| namespace webrtc {
|
| @@ -31,7 +32,8 @@ PacketBuffer::PacketBuffer(size_t start_buffer_size,
|
| sequence_buffer_(start_buffer_size),
|
| frame_callback_(frame_callback),
|
| last_picture_id_(-1),
|
| - last_unwrap_(-1) {
|
| + last_unwrap_(-1),
|
| + current_ss_idx_(0) {
|
| RTC_DCHECK_LE(start_buffer_size, max_buffer_size);
|
| // Buffer size must always be a power of 2.
|
| RTC_DCHECK((start_buffer_size & (start_buffer_size - 1)) == 0);
|
| @@ -216,7 +218,7 @@ void PacketBuffer::ManageFrame(std::unique_ptr<RtpFrameObject> frame) {
|
| ManageFrameVp8(std::move(frame));
|
| break;
|
| case kVideoCodecVP9:
|
| - // TODO(philipel): ManageFrameVp9(std::move(frame));
|
| + ManageFrameVp9(std::move(frame));
|
| break;
|
| case kVideoCodecH264:
|
| case kVideoCodecI420:
|
| @@ -316,7 +318,7 @@ void PacketBuffer::ManageFrameVp8(std::unique_ptr<RtpFrameObject> frame) {
|
|
|
| // Find if there has been a gap in fully received frames and save the picture
|
| // id of those frames in |not_yet_received_frames_|.
|
| - if (AheadOf<uint8_t, kPicIdLength>(frame->picture_id, last_picture_id_)) {
|
| + if (AheadOf<uint16_t, kPicIdLength>(frame->picture_id, last_picture_id_)) {
|
| last_picture_id_ = Add<kPicIdLength>(last_picture_id_, 1);
|
| while (last_picture_id_ != frame->picture_id) {
|
| not_yet_received_frames_.insert(last_picture_id_);
|
| @@ -386,10 +388,10 @@ void PacketBuffer::ManageFrameVp8(std::unique_ptr<RtpFrameObject> frame) {
|
| auto not_received_frame_it =
|
| not_yet_received_frames_.upper_bound(layer_info_it->second[layer]);
|
| if (not_received_frame_it != not_yet_received_frames_.end() &&
|
| - AheadOf<uint8_t, kPicIdLength>(frame->picture_id,
|
| - *not_received_frame_it)) {
|
| - stashed_frames_.emplace(std::move(frame));
|
| - return;
|
| + AheadOf<uint16_t, kPicIdLength>(frame->picture_id,
|
| + *not_received_frame_it)) {
|
| + stashed_frames_.emplace(std::move(frame));
|
| + return;
|
| }
|
|
|
| ++frame->num_references;
|
| @@ -425,22 +427,228 @@ void PacketBuffer::CompletedFrameVp8(std::unique_ptr<RtpFrameObject> frame) {
|
| }
|
| not_yet_received_frames_.erase(frame->picture_id);
|
|
|
| - for (size_t r = 0; r < frame->num_references; ++r)
|
| - frame->references[r] = UnwrapPictureId(frame->references[r]);
|
| + for (size_t i = 0; i < frame->num_references; ++i)
|
| + frame->references[i] = UnwrapPictureId(frame->references[i]);
|
| frame->picture_id = UnwrapPictureId(frame->picture_id);
|
|
|
| frame_callback_->OnCompleteFrame(std::move(frame));
|
| RetryStashedFrames();
|
| }
|
|
|
| -uint16_t PacketBuffer::UnwrapPictureId(uint16_t picture_id) {
|
| +// Resolves the picture id and the references of a VP9 frame and passes it
|
| +// on to CompletedFrameVp9(), or stashes the frame while the information
|
| +// needed to resolve its references is still missing. Frames without a
|
| +// picture id are handed to ManageFrameGeneric() instead.
|
| +void PacketBuffer::ManageFrameVp9(std::unique_ptr<RtpFrameObject> frame) {
|
| + size_t index = frame->first_seq_num() % size_;
|
| + const VCMPacket& packet = data_buffer_[index];
|
| + const RTPVideoHeaderVP9& codec_header =
|
| + packet.codecSpecificHeader.codecHeader.VP9;
|
| +
|
| + if (codec_header.picture_id == kNoPictureId) {
|
| + ManageFrameGeneric(std::move(frame));
|
| + return;
|
| + }
|
| +
|
| + frame->spatial_layer = codec_header.spatial_idx;
|
| + frame->inter_layer_predicted = codec_header.inter_layer_predicted;
|
| + frame->picture_id = codec_header.picture_id % kPicIdLength;
|
| +
|
| if (last_unwrap_ == -1)
|
| - last_unwrap_ = picture_id;
|
| + last_unwrap_ = codec_header.picture_id;
|
| +
|
| + if (last_picture_id_ == -1)
|
| + last_picture_id_ = frame->picture_id;
|
| +
|
| + if (codec_header.flexible_mode) {
|
| + // In flexible mode the references are signaled as picture id differences.
|
| + // |frame->picture_id| has been reduced modulo kPicIdLength above, so the
|
| + // subtraction has to wrap in that same domain; CompletedFrameVp9() passes
|
| + // the results to UnwrapPictureId().
|
| + frame->num_references = codec_header.num_ref_pics;
|
| + for (size_t i = 0; i < frame->num_references; ++i) {
|
| + frame->references[i] =
|
| + Subtract<kPicIdLength>(frame->picture_id, codec_header.pid_diff[i]);
|
| + }
|
| +
|
| + CompletedFrameVp9(std::move(frame));
|
| + return;
|
| + }
|
| +
|
| + if (codec_header.ss_data_available) {
|
| + // Scalability structures can only be sent with tl0 frames.
|
| + if (codec_header.temporal_idx != 0) {
|
| + LOG(LS_WARNING) << "Received scalability structure on a non base layer"
|
| + " frame. Scalability structure ignored.";
|
| + } else if (codec_header.gof.num_frames_in_gof == 0) {
|
| + // |num_frames_in_gof| is used as a modulo divisor further down, so a
|
| + // structure without frames must never be stored.
|
| + LOG(LS_WARNING) << "Received scalability structure without any frames."
|
| + " Scalability structure ignored.";
|
| + } else {
|
| + current_ss_idx_ = Add<kMaxGofSaved>(current_ss_idx_, 1);
|
| + scalability_structures_[current_ss_idx_] = codec_header.gof;
|
| + scalability_structures_[current_ss_idx_].pid_start = frame->picture_id;
|
| +
|
| + auto pid_and_gof = std::make_pair(
|
| + frame->picture_id, &scalability_structures_[current_ss_idx_]);
|
| + gof_info_.insert(std::make_pair(codec_header.tl0_pic_idx, pid_and_gof));
|
| + }
|
| + }
|
| +
|
| + // Clean up info for base layers that are too old.
|
| + uint8_t old_tl0_pic_idx = codec_header.tl0_pic_idx - kMaxGofSaved;
|
| + auto clean_gof_info_to = gof_info_.lower_bound(old_tl0_pic_idx);
|
| + gof_info_.erase(gof_info_.begin(), clean_gof_info_to);
|
| +
|
| + if (packet.frameType == kVideoFrameKey) {
|
| + // When using GOF all keyframes must include the scalability structure.
|
| + if (!codec_header.ss_data_available)
|
| + LOG(LS_WARNING) << "Received keyframe without scalability structure";
|
| +
|
| + // If no structure is stored for this tl0 index there is nothing valid to
|
| + // dereference, so the keyframe is dropped.
|
| + auto keyframe_gof_it = gof_info_.find(codec_header.tl0_pic_idx);
|
| + if (keyframe_gof_it == gof_info_.end()) {
|
| + LOG(LS_WARNING) << "No scalability structure available for keyframe."
|
| + " Frame dropped.";
|
| + return;
|
| + }
|
| +
|
| + frame->num_references = 0;
|
| + GofInfoVP9* gof = keyframe_gof_it->second.second;
|
| + FrameReceivedVp9(frame->picture_id, *gof);
|
| + CompletedFrameVp9(std::move(frame));
|
| + return;
|
| + }
|
| +
|
| + // A base layer frame without its own scalability structure uses the gof
|
| + // info stored for the previous tl0 index.
|
| + auto gof_info_it = gof_info_.find(
|
| + (codec_header.temporal_idx == 0 && !codec_header.ss_data_available)
|
| + ? codec_header.tl0_pic_idx - 1
|
| + : codec_header.tl0_pic_idx);
|
| +
|
| + // Gof info for this frame is not available yet, stash this frame.
|
| + if (gof_info_it == gof_info_.end()) {
|
| + stashed_frames_.emplace(std::move(frame));
|
| + return;
|
| + }
|
| +
|
| + GofInfoVP9* gof = gof_info_it->second.second;
|
| + uint16_t picture_id_tl0 = gof_info_it->second.first;
|
| +
|
| + FrameReceivedVp9(frame->picture_id, *gof);
|
| +
|
| + // Make sure we don't miss any frame that could potentially have the
|
| + // up switch flag set.
|
| + if (MissingRequiredFrameVp9(frame->picture_id, *gof)) {
|
| + stashed_frames_.emplace(std::move(frame));
|
| + return;
|
| + }
|
| +
|
| + if (codec_header.temporal_up_switch) {
|
| + auto pid_tidx =
|
| + std::make_pair(frame->picture_id, codec_header.temporal_idx);
|
| + up_switch_.insert(pid_tidx);
|
| + }
|
| +
|
| + // If this is a base layer frame that contains a scalability structure
|
| + // then gof info has already been inserted earlier, so we only want to
|
| + // insert if we haven't done so already.
|
| + if (codec_header.temporal_idx == 0 && !codec_header.ss_data_available) {
|
| + auto pid_and_gof = std::make_pair(frame->picture_id, gof);
|
| + gof_info_.insert(std::make_pair(codec_header.tl0_pic_idx, pid_and_gof));
|
| + }
|
| +
|
| + // Clean out old info about up switch frames.
|
| + uint16_t old_picture_id = Subtract<kPicIdLength>(last_picture_id_, 50);
|
| + auto up_switch_erase_to = up_switch_.lower_bound(old_picture_id);
|
| + up_switch_.erase(up_switch_.begin(), up_switch_erase_to);
|
| +
|
| + RTC_DCHECK(
|
| + (AheadOrAt<uint16_t, kPicIdLength>(frame->picture_id, picture_id_tl0)));
|
| +
|
| + size_t diff =
|
| + ForwardDiff<uint16_t, kPicIdLength>(gof->pid_start, frame->picture_id);
|
| + size_t gof_idx = diff % gof->num_frames_in_gof;
|
| +
|
| + // Populate references according to the scalability structure. References
|
| + // to frames earlier than the last up switch point are skipped, and the
|
| + // remaining ones are stored contiguously so that |num_references| always
|
| + // matches the populated entries of |references|.
|
| + const size_t num_gof_references = gof->num_ref_pics[gof_idx];
|
| + frame->num_references = 0;
|
| + for (size_t i = 0; i < num_gof_references; ++i) {
|
| + uint16_t reference =
|
| + Subtract<kPicIdLength>(frame->picture_id, gof->pid_diff[gof_idx][i]);
|
| +
|
| + if (UpSwitchInIntervalVp9(frame->picture_id, codec_header.temporal_idx,
|
| + reference)) {
|
| + continue;
|
| + }
|
| +
|
| + frame->references[frame->num_references] = reference;
|
| + ++frame->num_references;
|
| + }
|
| +
|
| + CompletedFrameVp9(std::move(frame));
|
| +}
|
| +
|
| +// Returns true if, for any reference that |gof| assigns to |picture_id|, one
|
| +// of the temporal layers below the frame's own layer has a missing frame at
|
| +// or after the referenced picture id that |picture_id| is ahead of.
|
| +bool PacketBuffer::MissingRequiredFrameVp9(uint16_t picture_id,
|
| + const GofInfoVP9& gof) {
|
| + // Position of |picture_id| inside the group of frames.
|
| + const size_t pid_offset =
|
| + ForwardDiff<uint16_t, kPicIdLength>(gof.pid_start, picture_id);
|
| + const size_t pos_in_gof = pid_offset % gof.num_frames_in_gof;
|
| + const size_t frame_layer = gof.temporal_idx[pos_in_gof];
|
| + const uint8_t ref_count = gof.num_ref_pics[pos_in_gof];
|
| +
|
| + for (size_t ref = 0; ref < ref_count; ++ref) {
|
| + const uint16_t ref_pid =
|
| + Subtract<kPicIdLength>(picture_id, gof.pid_diff[pos_in_gof][ref]);
|
| +
|
| + // Only layers below the frame's own temporal layer are inspected.
|
| + for (size_t layer = 0; layer < frame_layer; ++layer) {
|
| + auto candidate = missing_frames_for_layer_[layer].lower_bound(ref_pid);
|
| + if (candidate == missing_frames_for_layer_[layer].end())
|
| + continue;
|
| +
|
| + if (AheadOf<uint16_t, kPicIdLength>(picture_id, *candidate))
|
| + return true;
|
| + }
|
| + }
|
| +
|
| + return false;
|
| +}
|
| +
|
| +// Updates the per temporal layer sets of missing frames. If |picture_id| is
|
| +// ahead of |last_picture_id_|, every picture id in between is recorded as
|
| +// missing for the temporal layer that |gof| assigns to it, and
|
| +// |last_picture_id_| is advanced until it equals |picture_id|. Otherwise
|
| +// |picture_id| is removed from the missing set of its temporal layer.
|
| +void PacketBuffer::FrameReceivedVp9(uint16_t picture_id,
|
| + const GofInfoVP9& gof) {
|
| + RTC_DCHECK_NE(-1, last_picture_id_);
|
| +
|
| + // If there is a gap, find which temporal layer the missing frames
|
| + // belong to and add the frame as missing for that temporal layer.
|
| + // Otherwise, remove this frame from the set of missing frames.
|
| + if (AheadOf<uint16_t, kPicIdLength>(picture_id, last_picture_id_)) {
|
| + size_t diff =
|
| + ForwardDiff<uint16_t, kPicIdLength>(gof.pid_start, last_picture_id_);
|
| + size_t gof_idx = diff % gof.num_frames_in_gof;
|
| +
|
| + last_picture_id_ = Add<kPicIdLength>(last_picture_id_, 1);
|
| + while (last_picture_id_ != picture_id) {
|
| + // A gap can extend past the end of the group of frames, so the index
|
| + // wraps around instead of running off the end of |gof.temporal_idx|.
|
| + gof_idx = (gof_idx + 1) % gof.num_frames_in_gof;
|
| + size_t temporal_idx = gof.temporal_idx[gof_idx];
|
| + missing_frames_for_layer_[temporal_idx].insert(last_picture_id_);
|
| + last_picture_id_ = Add<kPicIdLength>(last_picture_id_, 1);
|
| + }
|
| + } else {
|
| + size_t diff =
|
| + ForwardDiff<uint16_t, kPicIdLength>(gof.pid_start, picture_id);
|
| + size_t gof_idx = diff % gof.num_frames_in_gof;
|
| + size_t temporal_idx = gof.temporal_idx[gof_idx];
|
| + missing_frames_for_layer_[temporal_idx].erase(picture_id);
|
| + }
|
| +}
|
| +
|
| +// Walks |up_switch_| from upper_bound(|pid_ref|) for as long as |picture_id|
|
| +// is ahead of the visited entry, and returns true as soon as an entry with a
|
| +// temporal index lower than |temporal_idx| is found.
|
| +bool PacketBuffer::UpSwitchInIntervalVp9(uint16_t picture_id,
|
| + uint8_t temporal_idx,
|
| + uint16_t pid_ref) {
|
| + auto entry = up_switch_.upper_bound(pid_ref);
|
| + while (entry != up_switch_.end() &&
|
| + AheadOf<uint16_t, kPicIdLength>(picture_id, entry->first)) {
|
| + if (entry->second < temporal_idx) {
|
| + return true;
|
| + }
|
| + ++entry;
|
| + }
|
| +
|
| + return false;
|
| +}
|
| +
|
| +// Unwraps every reference of |frame| and then its picture id, delivers the
|
| +// frame to |frame_callback_| and retries the stashed frames.
|
| +void PacketBuffer::CompletedFrameVp9(std::unique_ptr<RtpFrameObject> frame) {
|
| + // UnwrapPictureId() updates |last_unwrap_| on each call, so the references
|
| + // are unwrapped in order before the picture id itself.
|
| + const size_t reference_count = frame->num_references;
|
| + for (size_t ref = 0; ref < reference_count; ++ref) {
|
| + auto& reference = frame->references[ref];
|
| + reference = UnwrapPictureId(reference);
|
| + }
|
| + frame->picture_id = UnwrapPictureId(frame->picture_id);
|
| +
|
| + frame_callback_->OnCompleteFrame(std::move(frame));
|
| + RetryStashedFrames();
|
| +}
|
| +
|
| +uint16_t PacketBuffer::UnwrapPictureId(uint16_t picture_id) {
|
| + RTC_DCHECK_NE(-1, last_unwrap_);
|
|
|
| uint16_t unwrap_truncated = last_unwrap_ % kPicIdLength;
|
| - uint16_t diff = MinDiff<uint8_t, kPicIdLength>(unwrap_truncated, picture_id);
|
| + uint16_t diff = MinDiff<uint16_t, kPicIdLength>(unwrap_truncated, picture_id);
|
|
|
| - if (AheadOf<uint8_t, kPicIdLength>(picture_id, unwrap_truncated))
|
| + if (AheadOf<uint16_t, kPicIdLength>(picture_id, unwrap_truncated))
|
| last_unwrap_ = Add<1 << 16>(last_unwrap_, diff);
|
| else
|
| last_unwrap_ = Subtract<1 << 16>(last_unwrap_, diff);
|
|
|