OLD | NEW |
---|---|
1 /* | 1 /* |
2 * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved. | 2 * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
11 #include "webrtc/modules/video_coding/decoding_state.h" | 11 #include "webrtc/modules/video_coding/decoding_state.h" |
12 | 12 |
13 #include "webrtc/base/logging.h" | |
14 #include "webrtc/common_video/h264/h264_common.h" | |
13 #include "webrtc/modules/include/module_common_types.h" | 15 #include "webrtc/modules/include/module_common_types.h" |
14 #include "webrtc/modules/video_coding/frame_buffer.h" | 16 #include "webrtc/modules/video_coding/frame_buffer.h" |
15 #include "webrtc/modules/video_coding/jitter_buffer_common.h" | 17 #include "webrtc/modules/video_coding/jitter_buffer_common.h" |
16 #include "webrtc/modules/video_coding/packet.h" | 18 #include "webrtc/modules/video_coding/packet.h" |
17 | 19 |
18 namespace webrtc { | 20 namespace webrtc { |
19 | 21 |
20 VCMDecodingState::VCMDecodingState() | 22 VCMDecodingState::VCMDecodingState() |
21 : sequence_num_(0), | 23 : sequence_num_(0), |
22 time_stamp_(0), | 24 time_stamp_(0), |
(...skipping 10 matching lines...) Expand all Loading... | |
// Restores the decoding state to its starting values: sequence_num_ and
// time_stamp_ become 0, picture_id_/temporal_id_/tl0_pic_id_ are set to
// their kNo* constants, full_sync_ and in_initial_state_ become true, and
// frame_decoded_ is zero-filled. frame_decoded_cleared_to_ is not assigned
// in this function.
33 void VCMDecodingState::Reset() { | 35 void VCMDecodingState::Reset() { |
34 // TODO(mikhal): Verify - not always would want to reset the sync | 36 // TODO(mikhal): Verify - not always would want to reset the sync |
35 sequence_num_ = 0; | 37 sequence_num_ = 0; |
36 time_stamp_ = 0; | 38 time_stamp_ = 0; |
37 picture_id_ = kNoPictureId; | 39 picture_id_ = kNoPictureId; |
38 temporal_id_ = kNoTemporalIdx; | 40 temporal_id_ = kNoTemporalIdx; |
39 tl0_pic_id_ = kNoTl0PicIdx; | 41 tl0_pic_id_ = kNoTl0PicIdx; |
40 full_sync_ = true; | 42 full_sync_ = true; |
41 in_initial_state_ = true; | 43 in_initial_state_ = true; |
42 memset(frame_decoded_, 0, sizeof(frame_decoded_)); | 44 memset(frame_decoded_, 0, sizeof(frame_decoded_)); |
// The next two rows exist on the NEW side only: the recorded SPS ids and
// the recorded PPS-id-to-SPS-id entries are emptied as part of the reset.
45 received_sps_.clear(); | |
46 received_pps_.clear(); | |
43 } | 47 } |
44 | 48 |
// Const accessor returning the stored time_stamp_ member. The rows are the
// same on the OLD and NEW sides apart from their line numbers.
45 uint32_t VCMDecodingState::time_stamp() const { | 49 uint32_t VCMDecodingState::time_stamp() const { |
46 return time_stamp_; | 50 return time_stamp_; |
47 } | 51 } |
48 | 52 |
// Const accessor returning the stored sequence_num_ member. The rows are the
// same on the OLD and NEW sides apart from their line numbers.
49 uint16_t VCMDecodingState::sequence_num() const { | 53 uint16_t VCMDecodingState::sequence_num() const { |
50 return sequence_num_; | 54 return sequence_num_; |
51 } | 55 } |
52 | 56 |
(...skipping 14 matching lines...) Expand all Loading... | |
67 void VCMDecodingState::SetState(const VCMFrameBuffer* frame) { | 71 void VCMDecodingState::SetState(const VCMFrameBuffer* frame) { |
68 assert(frame != NULL && frame->GetHighSeqNum() >= 0); | 72 assert(frame != NULL && frame->GetHighSeqNum() >= 0); |
69 if (!UsingFlexibleMode(frame)) | 73 if (!UsingFlexibleMode(frame)) |
70 UpdateSyncState(frame); | 74 UpdateSyncState(frame); |
71 sequence_num_ = static_cast<uint16_t>(frame->GetHighSeqNum()); | 75 sequence_num_ = static_cast<uint16_t>(frame->GetHighSeqNum()); |
72 time_stamp_ = frame->TimeStamp(); | 76 time_stamp_ = frame->TimeStamp(); |
73 picture_id_ = frame->PictureId(); | 77 picture_id_ = frame->PictureId(); |
74 temporal_id_ = frame->TemporalId(); | 78 temporal_id_ = frame->TemporalId(); |
75 tl0_pic_id_ = frame->Tl0PicId(); | 79 tl0_pic_id_ = frame->Tl0PicId(); |
76 | 80 |
81 for (const NaluInfo& nalu : frame->GetNaluInfos()) { | |
82 if (nalu.type == H264::NaluType::kPps) { | |
83 if (nalu.pps_id < 0) { | |
84 LOG(LS_WARNING) << "Received pps without pps id."; | |
85 } else if (nalu.sps_id < 0) { | |
86 LOG(LS_WARNING) << "Received pps without sps id."; | |
87 } else { | |
88 received_pps_[nalu.pps_id] = nalu.sps_id; | |
89 } | |
90 } else if (nalu.type == H264::NaluType::kSps) { | |
91 if (nalu.sps_id < 0) { | |
92 LOG(LS_WARNING) << "Received sps without sps id."; | |
93 } else { | |
94 received_sps_.insert(nalu.sps_id); | |
95 } | |
96 } | |
97 } | |
98 | |
77 if (UsingFlexibleMode(frame)) { | 99 if (UsingFlexibleMode(frame)) { |
78 uint16_t frame_index = picture_id_ % kFrameDecodedLength; | 100 uint16_t frame_index = picture_id_ % kFrameDecodedLength; |
79 if (in_initial_state_) { | 101 if (in_initial_state_) { |
80 frame_decoded_cleared_to_ = frame_index; | 102 frame_decoded_cleared_to_ = frame_index; |
81 } else if (frame->FrameType() == kVideoFrameKey) { | 103 } else if (frame->FrameType() == kVideoFrameKey) { |
82 memset(frame_decoded_, 0, sizeof(frame_decoded_)); | 104 memset(frame_decoded_, 0, sizeof(frame_decoded_)); |
83 frame_decoded_cleared_to_ = frame_index; | 105 frame_decoded_cleared_to_ = frame_index; |
84 } else { | 106 } else { |
85 if (AheadOfFramesDecodedClearedTo(frame_index)) { | 107 if (AheadOfFramesDecodedClearedTo(frame_index)) { |
86 while (frame_decoded_cleared_to_ != frame_index) { | 108 while (frame_decoded_cleared_to_ != frame_index) { |
(...skipping 12 matching lines...) Expand all Loading... | |
// Overwrites this object's fields with the corresponding fields of |state|.
// The scalar members are assigned one by one and frame_decoded_ is copied
// with memcpy over sizeof(frame_decoded_) bytes. Unlike Reset(), this also
// transfers frame_decoded_cleared_to_.
99 void VCMDecodingState::CopyFrom(const VCMDecodingState& state) { | 121 void VCMDecodingState::CopyFrom(const VCMDecodingState& state) { |
100 sequence_num_ = state.sequence_num_; | 122 sequence_num_ = state.sequence_num_; |
101 time_stamp_ = state.time_stamp_; | 123 time_stamp_ = state.time_stamp_; |
102 picture_id_ = state.picture_id_; | 124 picture_id_ = state.picture_id_; |
103 temporal_id_ = state.temporal_id_; | 125 temporal_id_ = state.temporal_id_; |
104 tl0_pic_id_ = state.tl0_pic_id_; | 126 tl0_pic_id_ = state.tl0_pic_id_; |
105 full_sync_ = state.full_sync_; | 127 full_sync_ = state.full_sync_; |
106 in_initial_state_ = state.in_initial_state_; | 128 in_initial_state_ = state.in_initial_state_; |
107 frame_decoded_cleared_to_ = state.frame_decoded_cleared_to_; | 129 frame_decoded_cleared_to_ = state.frame_decoded_cleared_to_; |
108 memcpy(frame_decoded_, state.frame_decoded_, sizeof(frame_decoded_)); | 130 memcpy(frame_decoded_, state.frame_decoded_, sizeof(frame_decoded_)); |
// The next two rows exist on the NEW side only: the recorded SPS ids and
// the recorded PPS-id-to-SPS-id entries are copied along with the rest.
131 received_sps_ = state.received_sps_; | |
132 received_pps_ = state.received_pps_; | |
109 } | 133 } |
110 | 134 |
111 bool VCMDecodingState::UpdateEmptyFrame(const VCMFrameBuffer* frame) { | 135 bool VCMDecodingState::UpdateEmptyFrame(const VCMFrameBuffer* frame) { |
112 bool empty_packet = frame->GetHighSeqNum() == frame->GetLowSeqNum(); | 136 bool empty_packet = frame->GetHighSeqNum() == frame->GetLowSeqNum(); |
113 if (in_initial_state_ && empty_packet) { | 137 if (in_initial_state_ && empty_packet) { |
114 // Drop empty packets as long as we are in the initial state. | 138 // Drop empty packets as long as we are in the initial state. |
115 return true; | 139 return true; |
116 } | 140 } |
117 if ((empty_packet && ContinuousSeqNum(frame->GetHighSeqNum())) || | 141 if ((empty_packet && ContinuousSeqNum(frame->GetHighSeqNum())) || |
118 ContinuousFrame(frame)) { | 142 ContinuousFrame(frame)) { |
(...skipping 57 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
176 // Check continuity based on the following hierarchy: | 200 // Check continuity based on the following hierarchy: |
177 // - Temporal layers (stop here if out of sync). | 201 // - Temporal layers (stop here if out of sync). |
178 // - Picture Id when available. | 202 // - Picture Id when available. |
179 // - Sequence numbers. | 203 // - Sequence numbers. |
180 // Return true when in initial state. | 204 // Return true when in initial state. |
181 // Note that when a method is not applicable it will return false. | 205 // Note that when a method is not applicable it will return false. |
182 assert(frame != NULL); | 206 assert(frame != NULL); |
183 // A key frame is always considered continuous as it doesn't refer to any | 207 // A key frame is always considered continuous as it doesn't refer to any |
184 // frames and therefore won't introduce any errors even if prior frames are | 208 // frames and therefore won't introduce any errors even if prior frames are |
185 // missing. | 209 // missing. |
186 if (frame->FrameType() == kVideoFrameKey) | 210 if (frame->FrameType() == kVideoFrameKey && |
211 HaveSpsAndPps(frame->GetNaluInfos())) { | |
philipel
2016/10/06 10:49:47
Can a h264 frame ever not have nalus? In that case
stefan-webrtc
2016/10/06 11:00:02
Right, it shouldn't be possible, except if we'd pa
philipel
2016/10/06 11:10:51
Right, so if we have a valid h264 frame then it mu
| |
187 return true; | 212 return true; |
213 } | |
188 // When in the initial state we always require a key frame to start decoding. | 214 // When in the initial state we always require a key frame to start decoding. |
189 if (in_initial_state_) | 215 if (in_initial_state_) |
190 return false; | 216 return false; |
191 if (ContinuousLayer(frame->TemporalId(), frame->Tl0PicId())) | 217 if (ContinuousLayer(frame->TemporalId(), frame->Tl0PicId())) |
192 return true; | 218 return true; |
193 // tl0picId is either not used, or should remain unchanged. | 219 // tl0picId is either not used, or should remain unchanged. |
194 if (frame->Tl0PicId() != tl0_pic_id_) | 220 if (frame->Tl0PicId() != tl0_pic_id_) |
195 return false; | 221 return false; |
196 // Base layers are not continuous or temporal layers are inactive. | 222 // Base layers are not continuous or temporal layers are inactive. |
197 // In the presence of temporal layers, check for Picture ID/sequence number | 223 // In the presence of temporal layers, check for Picture ID/sequence number |
198 // continuity if sync can be restored by this frame. | 224 // continuity if sync can be restored by this frame. |
199 if (!full_sync_ && !frame->LayerSync()) | 225 if (!full_sync_ && !frame->LayerSync()) |
200 return false; | 226 return false; |
201 if (UsingPictureId(frame)) { | 227 if (UsingPictureId(frame)) { |
202 if (UsingFlexibleMode(frame)) { | 228 if (UsingFlexibleMode(frame)) { |
203 return ContinuousFrameRefs(frame); | 229 return ContinuousFrameRefs(frame); |
204 } else { | 230 } else { |
205 return ContinuousPictureId(frame->PictureId()); | 231 return ContinuousPictureId(frame->PictureId()); |
206 } | 232 } |
207 } else { | 233 } else { |
208 return ContinuousSeqNum(static_cast<uint16_t>(frame->GetLowSeqNum())); | 234 return ContinuousSeqNum(static_cast<uint16_t>(frame->GetLowSeqNum())) && |
235 HaveSpsAndPps(frame->GetNaluInfos()); | |
209 } | 236 } |
210 } | 237 } |
211 | 238 |
212 bool VCMDecodingState::ContinuousPictureId(int picture_id) const { | 239 bool VCMDecodingState::ContinuousPictureId(int picture_id) const { |
213 int next_picture_id = picture_id_ + 1; | 240 int next_picture_id = picture_id_ + 1; |
214 if (picture_id < picture_id_) { | 241 if (picture_id < picture_id_) { |
215 // Wrap | 242 // Wrap |
216 if (picture_id_ >= 0x80) { | 243 if (picture_id_ >= 0x80) { |
217 // 15 bits used for picture id | 244 // 15 bits used for picture id |
218 return ((next_picture_id & 0x7FFF) == picture_id); | 245 return ((next_picture_id & 0x7FFF) == picture_id); |
(...skipping 56 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
275 // frame_decoded_cleared_to_. We just make the assumption | 302 // frame_decoded_cleared_to_. We just make the assumption |
276 // that we are not trying to reference back to a very old | 303 // that we are not trying to reference back to a very old |
277 // index, but instead are referencing a newer index. | 304 // index, but instead are referencing a newer index. |
278 uint16_t diff = | 305 uint16_t diff = |
279 index > frame_decoded_cleared_to_ | 306 index > frame_decoded_cleared_to_ |
280 ? kFrameDecodedLength - (index - frame_decoded_cleared_to_) | 307 ? kFrameDecodedLength - (index - frame_decoded_cleared_to_) |
281 : frame_decoded_cleared_to_ - index; | 308 : frame_decoded_cleared_to_ - index; |
282 return diff > kFrameDecodedLength / 2; | 309 return diff > kFrameDecodedLength / 2; |
283 } | 310 } |
284 | 311 |
// Present on the NEW side only. Reports whether every entry of |nalus| that
// refers to a parameter set can resolve it. |nalus| is walked in order:
//  - entries whose sps_id and pps_id are both -1 are skipped;
//  - kPps entries with non-negative ids are recorded in the local new_pps
//    (pps_id -> sps_id), kSps entries with a non-negative id are recorded in
//    the local new_sps; a negative id only produces a warning log;
//  - any other type must find its pps_id in new_pps or, failing that, in
//    received_pps_, and the SPS id mapped from that PPS must be in new_sps
//    or received_sps_; if either lookup fails the function returns false.
// Returns true when no entry fails, which includes an empty |nalus|.
// Because new_pps/new_sps are filled during the walk, a parameter set
// carried in |nalus| is visible only to the entries that follow it.
// The method is const: received_sps_/received_pps_ are read, never written.
// NOTE(review): std::set/std::map are presumably made available through
// decoding_state.h; no <set>/<map> include is visible here - confirm.
312 bool VCMDecodingState::HaveSpsAndPps(const std::vector<NaluInfo>& nalus) const { | |
313 std::set<int> new_sps; | |
314 std::map<int, int> new_pps; | |
315 for (const NaluInfo& nalu : nalus) { | |
316 // Check if this nalu actually contains sps/pps information or dependencies. | |
// NOTE(review): this guard compares against -1 exactly, while the branches
// below treat any negative id as missing (< 0).
317 if (nalu.sps_id == -1 && nalu.pps_id == -1) | |
318 continue; | |
319 switch (nalu.type) { | |
320 case H264::NaluType::kPps: | |
321 if (nalu.pps_id < 0) { | |
322 LOG(LS_WARNING) << "Received pps without pps id."; | |
323 } else if (nalu.sps_id < 0) { | |
324 LOG(LS_WARNING) << "Received pps without sps id."; | |
325 } else { | |
326 new_pps[nalu.pps_id] = nalu.sps_id; | |
327 } | |
328 break; | |
329 case H264::NaluType::kSps: | |
330 if (nalu.sps_id < 0) { | |
331 LOG(LS_WARNING) << "Received sps without sps id."; | |
332 } else { | |
333 new_sps.insert(nalu.sps_id); | |
334 } | |
335 break; | |
// Every type other than kPps/kSps: map pps_id to an SPS id, preferring a PPS
// seen earlier in |nalus| over the stored received_pps_, then require that
// SPS id to be known either from |nalus| or from received_sps_.
336 default: { | |
337 int sps_needed = -1; | |
philipel
2016/10/06 10:49:47
|sps_needed| sounds like you want to determine if
stefan-webrtc
2016/10/06 11:00:02
Done.
| |
338 auto pps_it = new_pps.find(nalu.pps_id); | |
339 if (pps_it != new_pps.end()) { | |
340 sps_needed = pps_it->second; | |
341 } else { | |
342 auto pps_it2 = received_pps_.find(nalu.pps_id); | |
343 if (pps_it2 == received_pps_.end()) { | |
344 return false; | |
345 } | |
346 sps_needed = pps_it2->second; | |
347 } | |
348 if (new_sps.find(sps_needed) == new_sps.end() && | |
349 received_sps_.find(sps_needed) == received_sps_.end()) { | |
350 return false; | |
351 } | |
352 break; | |
353 } | |
354 } | |
355 } | |
356 return true; | |
357 } | |
358 | |
285 } // namespace webrtc | 359 } // namespace webrtc |
OLD | NEW |