webrtc/common_video/h264/sps_parser_unittest.cc - Issue 1979443004: Add H264 bitstream rewriting to limit frame reordering marker in header

Side by Side Diff: webrtc/common_video/h264/sps_parser_unittest.cc

Issue 1979443004: Add H264 bitstream rewriting to limit frame reordering marker in header (Closed) Base URL: https://chromium.googlesource.com/external/webrtc.git@master

Patch Set: Addressed comments Created 4 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
1 /*	1 /*

2 * Copyright (c) 2015 The WebRTC project authors. All Rights Reserved.	2 * Copyright (c) 2015 The WebRTC project authors. All Rights Reserved.

3 *	3 *

4 * Use of this source code is governed by a BSD-style license	4 * Use of this source code is governed by a BSD-style license

5 * that can be found in the LICENSE file in the root of the source	5 * that can be found in the LICENSE file in the root of the source

6 * tree. An additional intellectual property rights grant can be found	6 * tree. An additional intellectual property rights grant can be found

7 * in the file PATENTS. All contributing project authors may	7 * in the file PATENTS. All contributing project authors may

8 * be found in the AUTHORS file in the root of the source tree.	8 * be found in the AUTHORS file in the root of the source tree.

9 */	9 */

10	10

11 #include "webrtc/modules/rtp_rtcp/source/h264_sps_parser.h"	11 #include "webrtc/common_video/h264/sps_parser.h"

12	12

13 #include "testing/gtest/include/gtest/gtest.h"	13 #include "testing/gtest/include/gtest/gtest.h"

14	14

15 #include "webrtc/base/arraysize.h"	15 #include "webrtc/base/arraysize.h"

16 #include "webrtc/base/bitbuffer.h"	16 #include "webrtc/base/bitbuffer.h"

	17 #include "webrtc/base/buffer.h"

	18 #include "webrtc/common_video/h264/h264_common.h"

17	19

18 namespace webrtc {	20 namespace webrtc {

19	21

20 // Example SPS can be generated with ffmpeg. Here's an example set of commands,	22 // Example SPS can be generated with ffmpeg. Here's an example set of commands,

21 // runnable on OS X:	23 // runnable on OS X:

22 // 1) Generate a video, from the camera:	24 // 1) Generate a video, from the camera:

23 // ffmpeg -f avfoundation -i "0" -video_size 640x360 camera.mov	25 // ffmpeg -f avfoundation -i "0" -video_size 640x360 camera.mov

24 //	26 //

25 // 2) Scale the video to the desired size:	27 // 2) Scale the video to the desired size:

26 // ffmpeg -i camera.mov -vf scale=640x360 scaled.mov	28 // ffmpeg -i camera.mov -vf scale=640x360 scaled.mov

27 //	29 //

28 // 3) Get just the H.264 bitstream in AnnexB:	30 // 3) Get just the H.264 bitstream in AnnexB:

29 // ffmpeg -i scaled.mov -vcodec copy -vbsf h264_mp4toannexb -an out.h264	31 // ffmpeg -i scaled.mov -vcodec copy -vbsf h264_mp4toannexb -an out.h264

30 //	32 //

31 // 4) Open out.h264 and find the SPS, generally everything between the first	33 // 4) Open out.h264 and find the SPS, generally everything between the first

32 // two start codes (0 0 0 1 or 0 0 1). The first byte should be 0x67,	34 // two start codes (0 0 0 1 or 0 0 1). The first byte should be 0x67,

33 // which should be stripped out before being passed to the parser.	35 // which should be stripped out before being passed to the parser.

34	36

35 static const size_t kSpsBufferMaxSize = 256;	37 static const size_t kSpsBufferMaxSize = 256;

36	38

37 // Generates a fake SPS with basically everything empty but the width/height.	39 // Generates a fake SPS with basically everything empty but the width/height.

38 // Pass in a buffer of at least kSpsBufferMaxSize.	40 // Pass in a buffer of at least kSpsBufferMaxSize.

39 // The fake SPS that this generates also always has at least one emulation byte	41 // The fake SPS that this generates also always has at least one emulation byte

40 // at offset 2, since the first two bytes are always 0, and has a 0x3 as the	42 // at offset 2, since the first two bytes are always 0, and has a 0x3 as the

41 // level_idc, to make sure the parser doesn't eat all 0x3 bytes.	43 // level_idc, to make sure the parser doesn't eat all 0x3 bytes.

42 void GenerateFakeSps(uint16_t width, uint16_t height, uint8_t buffer[]) {	44 void GenerateFakeSps(uint16_t width, uint16_t height, rtc::Buffer* out_buffer) {

43 uint8_t rbsp[kSpsBufferMaxSize] = {0};	45 uint8_t rbsp[kSpsBufferMaxSize] = {0};

44 rtc::BitBufferWriter writer(rbsp, kSpsBufferMaxSize);	46 rtc::BitBufferWriter writer(rbsp, kSpsBufferMaxSize);

45 // Profile byte.	47 // Profile byte.

46 writer.WriteUInt8(0);	48 writer.WriteUInt8(0);

47 // Constraint sets and reserved zero bits.	49 // Constraint sets and reserved zero bits.

48 writer.WriteUInt8(0);	50 writer.WriteUInt8(0);

49 // level_idc.	51 // level_idc.

50 writer.WriteUInt8(0x3u);	52 writer.WriteUInt8(0x3u);

51 // seq_paramter_set_id.	53 // seq_paramter_set_id.

52 writer.WriteExponentialGolomb(0);	54 writer.WriteExponentialGolomb(0);

(...skipping 30 matching lines...) Expand all Loading...
83 // Now we write the left/right/top/bottom crop. For simplicity, we'll put all	85 // Now we write the left/right/top/bottom crop. For simplicity, we'll put all

84 // the crop at the left/top.	86 // the crop at the left/top.

85 // We picked a 4:2:0 format, so the crops are 1/2 the pixel crop values.	87 // We picked a 4:2:0 format, so the crops are 1/2 the pixel crop values.

86 // Left/right.	88 // Left/right.

87 writer.WriteExponentialGolomb(((16 - (width % 16)) % 16) / 2);	89 writer.WriteExponentialGolomb(((16 - (width % 16)) % 16) / 2);

88 writer.WriteExponentialGolomb(0);	90 writer.WriteExponentialGolomb(0);

89 // Top/bottom.	91 // Top/bottom.

90 writer.WriteExponentialGolomb(((16 - (height % 16)) % 16) / 2);	92 writer.WriteExponentialGolomb(((16 - (height % 16)) % 16) / 2);

91 writer.WriteExponentialGolomb(0);	93 writer.WriteExponentialGolomb(0);

92	94

	95 // vui_parameters_present_flag: u(1)

	96 writer.WriteBits(0, 1);

	97

93 // Get the number of bytes written (including the last partial byte).	98 // Get the number of bytes written (including the last partial byte).

94 size_t byte_count, bit_offset;	99 size_t byte_count, bit_offset;

95 writer.GetCurrentOffset(&byte_count, &bit_offset);	100 writer.GetCurrentOffset(&byte_count, &bit_offset);

96 if (bit_offset > 0) {	101 if (bit_offset > 0) {

97 byte_count++;	102 byte_count++;

98 }	103 }

99	104

100 // Now, we need to write the rbsp into bytes. To do that, we'll need to add	105 H264::WriteRbsp(rbsp, byte_count, out_buffer);

101 // emulation 0x03 bytes if there's ever a sequence of 00 00 01 or 00 00 00 01.

102 // To be simple, just add a 0x03 after every 0x00. Extra emulation doesn't

103 // hurt.

104 for (size_t i = 0; i < byte_count;) {

105 // The -3 is intentional; we never need to write an emulation byte if the 00

106 // is at the end.

107 if (i < byte_count - 3 && rbsp[i] == 0 && rbsp[i + 1] == 0) {

108 *buffer++ = rbsp[i];

109 *buffer++ = rbsp[i + 1];

110 *buffer++ = 0x3u;

111 i += 2;

112 } else {

113 *buffer++ = rbsp[i];

114 ++i;

115 }

116 }

117 }	106 }

118	107

119 TEST(H264SpsParserTest, TestSampleSPSHdLandscape) {	108 class H264SpsParserTest : public ::testing::Test {

	109 public:

	110 H264SpsParserTest() {}

	111 virtual ~H264SpsParserTest() {}

	112

	113 rtc::Optional<SpsParser::SpsState> sps_;

	114 };

	115

	116 TEST_F(H264SpsParserTest, TestSampleSPSHdLandscape) {

120 // SPS for a 1280x720 camera capture from ffmpeg on osx. Contains	117 // SPS for a 1280x720 camera capture from ffmpeg on osx. Contains

121 // emulation bytes but no cropping.	118 // emulation bytes but no cropping.

122 const uint8_t buffer[] = {0x7A, 0x00, 0x1F, 0xBC, 0xD9, 0x40, 0x50, 0x05,	119 const uint8_t buffer[] = {0x7A, 0x00, 0x1F, 0xBC, 0xD9, 0x40, 0x50, 0x05,

123 0xBA, 0x10, 0x00, 0x00, 0x03, 0x00, 0xC0, 0x00,	120 0xBA, 0x10, 0x00, 0x00, 0x03, 0x00, 0xC0, 0x00,

124 0x00, 0x2A, 0xE0, 0xF1, 0x83, 0x19, 0x60};	121 0x00, 0x2A, 0xE0, 0xF1, 0x83, 0x19, 0x60};

125 H264SpsParser parser = H264SpsParser(buffer, arraysize(buffer));	122 EXPECT_TRUE(

126 EXPECT_TRUE(parser.Parse());	123 static_cast<bool>(sps_ = SpsParser::ParseSps(buffer, arraysize(buffer))));

127 EXPECT_EQ(1280u, parser.width());	124 EXPECT_EQ(1280u, sps_->width);

128 EXPECT_EQ(720u, parser.height());	125 EXPECT_EQ(720u, sps_->height);

129 }	126 }

130	127

131 TEST(H264SpsParserTest, TestSampleSPSVgaLandscape) {	128 TEST_F(H264SpsParserTest, TestSampleSPSVgaLandscape) {

132 // SPS for a 640x360 camera capture from ffmpeg on osx. Contains emulation	129 // SPS for a 640x360 camera capture from ffmpeg on osx. Contains emulation

133 // bytes and cropping (360 isn't divisible by 16).	130 // bytes and cropping (360 isn't divisible by 16).

134 const uint8_t buffer[] = {0x7A, 0x00, 0x1E, 0xBC, 0xD9, 0x40, 0xA0, 0x2F,	131 const uint8_t buffer[] = {0x7A, 0x00, 0x1E, 0xBC, 0xD9, 0x40, 0xA0, 0x2F,

135 0xF8, 0x98, 0x40, 0x00, 0x00, 0x03, 0x01, 0x80,	132 0xF8, 0x98, 0x40, 0x00, 0x00, 0x03, 0x01, 0x80,

136 0x00, 0x00, 0x56, 0x83, 0xC5, 0x8B, 0x65, 0x80};	133 0x00, 0x00, 0x56, 0x83, 0xC5, 0x8B, 0x65, 0x80};

137 H264SpsParser parser = H264SpsParser(buffer, arraysize(buffer));	134 EXPECT_TRUE(

138 EXPECT_TRUE(parser.Parse());	135 static_cast<bool>(sps_ = SpsParser::ParseSps(buffer, arraysize(buffer))));

139 EXPECT_EQ(640u, parser.width());	136 EXPECT_EQ(640u, sps_->width);

140 EXPECT_EQ(360u, parser.height());	137 EXPECT_EQ(360u, sps_->height);

141 }	138 }

142	139

143 TEST(H264SpsParserTest, TestSampleSPSWeirdResolution) {	140 TEST_F(H264SpsParserTest, TestSampleSPSWeirdResolution) {

144 // SPS for a 200x400 camera capture from ffmpeg on osx. Horizontal and	141 // SPS for a 200x400 camera capture from ffmpeg on osx. Horizontal and

145 // veritcal crop (neither dimension is divisible by 16).	142 // veritcal crop (neither dimension is divisible by 16).

146 const uint8_t buffer[] = {0x7A, 0x00, 0x0D, 0xBC, 0xD9, 0x43, 0x43, 0x3E,	143 const uint8_t buffer[] = {0x7A, 0x00, 0x0D, 0xBC, 0xD9, 0x43, 0x43, 0x3E,

147 0x5E, 0x10, 0x00, 0x00, 0x03, 0x00, 0x60, 0x00,	144 0x5E, 0x10, 0x00, 0x00, 0x03, 0x00, 0x60, 0x00,

148 0x00, 0x15, 0xA0, 0xF1, 0x42, 0x99, 0x60};	145 0x00, 0x15, 0xA0, 0xF1, 0x42, 0x99, 0x60};

149 H264SpsParser parser = H264SpsParser(buffer, arraysize(buffer));	146 EXPECT_TRUE(

150 EXPECT_TRUE(parser.Parse());	147 static_cast<bool>(sps_ = SpsParser::ParseSps(buffer, arraysize(buffer))));

151 EXPECT_EQ(200u, parser.width());	148 EXPECT_EQ(200u, sps_->width);

152 EXPECT_EQ(400u, parser.height());	149 EXPECT_EQ(400u, sps_->height);

153 }	150 }

154	151

155 TEST(H264SpsParserTest, TestSyntheticSPSQvgaLandscape) {	152 TEST_F(H264SpsParserTest, TestSyntheticSPSQvgaLandscape) {

156 uint8_t buffer[kSpsBufferMaxSize] = {0};	153 rtc::Buffer buffer;

157 GenerateFakeSps(320u, 180u, buffer);	154 GenerateFakeSps(320u, 180u, &buffer);

158 H264SpsParser parser = H264SpsParser(buffer, arraysize(buffer));	155 EXPECT_TRUE(static_cast<bool>(

159 EXPECT_TRUE(parser.Parse());	156 sps_ = SpsParser::ParseSps(buffer.data(), buffer.size())));

160 EXPECT_EQ(320u, parser.width());	157 EXPECT_EQ(320u, sps_->width);

161 EXPECT_EQ(180u, parser.height());	158 EXPECT_EQ(180u, sps_->height);

162 }	159 }

163	160

164 TEST(H264SpsParserTest, TestSyntheticSPSWeirdResolution) {	161 TEST_F(H264SpsParserTest, TestSyntheticSPSWeirdResolution) {

165 uint8_t buffer[kSpsBufferMaxSize] = {0};	162 rtc::Buffer buffer;

166 GenerateFakeSps(156u, 122u, buffer);	163 GenerateFakeSps(156u, 122u, &buffer);

167 H264SpsParser parser = H264SpsParser(buffer, arraysize(buffer));	164 EXPECT_TRUE(static_cast<bool>(

168 EXPECT_TRUE(parser.Parse());	165 sps_ = SpsParser::ParseSps(buffer.data(), buffer.size())));

169 EXPECT_EQ(156u, parser.width());	166 EXPECT_EQ(156u, sps_->width);

170 EXPECT_EQ(122u, parser.height());	167 EXPECT_EQ(122u, sps_->height);

171 }	168 }

172	169

173 } // namespace webrtc	170 } // namespace webrtc

OLD	NEW

« no previous file with comments | « webrtc/common_video/h264/sps_parser.cc ('k') | webrtc/common_video/h264/sps_vui_rewriter.h » ('j') | no next file with comments »