webrtc/media/base/videoadapter.cc - Issue 2555483005: Add ability to scale to arbitrary factors

Side by Side Diff: webrtc/media/base/videoadapter.cc

Issue 2555483005: Add ability to scale to arbitrary factors (Closed)

Patch Set: rebase Created 4 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

« webrtc/media/base/videoadapter.h ('K') | « webrtc/media/base/videoadapter.h ('k') | webrtc/sdk/android/src/jni/androidvideotracksource.h » ('j') | webrtc/sdk/android/src/jni/androidvideotracksource.h » ('J')
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

OLD	NEW
1 /*	1 /*

2 * Copyright (c) 2010 The WebRTC project authors. All Rights Reserved.	2 * Copyright (c) 2010 The WebRTC project authors. All Rights Reserved.

3 *	3 *

4 * Use of this source code is governed by a BSD-style license	4 * Use of this source code is governed by a BSD-style license

5 * that can be found in the LICENSE file in the root of the source	5 * that can be found in the LICENSE file in the root of the source

6 * tree. An additional intellectual property rights grant can be found	6 * tree. An additional intellectual property rights grant can be found

7 * in the file PATENTS. All contributing project authors may	7 * in the file PATENTS. All contributing project authors may

8 * be found in the AUTHORS file in the root of the source tree.	8 * be found in the AUTHORS file in the root of the source tree.

9 */	9 */

10	10

11 #include "webrtc/media/base/videoadapter.h"	11 #include "webrtc/media/base/videoadapter.h"

12	12

13 #include <algorithm>	13 #include <algorithm>

	14 #include <cmath>

14 #include <cstdlib>	15 #include <cstdlib>

15 #include <limits>	16 #include <limits>

16	17

	18 #include "webrtc/base/arraysize.h"

17 #include "webrtc/base/checks.h"	19 #include "webrtc/base/checks.h"

18 #include "webrtc/base/logging.h"	20 #include "webrtc/base/logging.h"

	21 #include "webrtc/base/optional.h"

19 #include "webrtc/media/base/mediaconstants.h"	22 #include "webrtc/media/base/mediaconstants.h"

20 #include "webrtc/media/base/videocommon.h"	23 #include "webrtc/media/base/videocommon.h"

21	24

22 namespace {	25 namespace {

23

24 struct Fraction {	26 struct Fraction {

25 int numerator;	27 int numerator;

26 int denominator;	28 int denominator;

27 };	29 };

28	30

29 // Scale factors optimized for in libYUV that we accept.	31 // Scale factors optimized for in libYUV that we accept.

30 // Must be sorted in decreasing scale factors for FindScaleLargerThan to work.	32 // Must be sorted in decreasing scale factors for FindScaleLargerThan to work.

31 const Fraction kScaleFractions[] = {	33 const Fraction kScaleFractions[] = {

32 {1, 1},	34 {1, 1},

33 {3, 4},	35 {3, 4},

34 {1, 2},	36 {1, 2},

35 {3, 8},	37 {3, 8},

36 {1, 4},	38 {1, 4},

37 {3, 16},	39 {3, 16},

38 };	40 };

39	41

40 // Round |valueToRound| to a multiple of |multiple|. Prefer rounding upwards,	42 // Round |valueToRound| to a multiple of |multiple|. Prefer rounding upwards,

41 // but never more than |maxValue|.	43 // but never more than |maxValue|.

42 int roundUp(int valueToRound, int multiple, int maxValue) {	44 int roundUp(int valueToRound, int multiple, int maxValue) {
	magjed_webrtc 2016/12/07 13:44:51: nit: I know it's unrelated but can you please clean up my naming mistake, i.e. rename |valueToRound| to |value_to_round| and same for |maxValue|.
	kthelgason 2016/12/08 08:42:03: Done.
43 const int roundedValue = (valueToRound + multiple - 1) / multiple * multiple;	45 const int roundedValue = (valueToRound + multiple - 1) / multiple * multiple;

44 return roundedValue <= maxValue ? roundedValue	46 return roundedValue <= maxValue ? roundedValue

45 : (maxValue / multiple * multiple);	47 : (maxValue / multiple * multiple);

46 }	48 }

47	49

48 Fraction FindScaleLessThanOrEqual(int input_num_pixels, int target_num_pixels) {	50 Fraction FindScaleLessThanOrEqual(int input_num_pixels, int target_num_pixels) {

	51 // Start searching from the last of the optimal fractions;
	magjed_webrtc 2016/12/07 13:44:51: It would be nice to have a high-level comment explaining what this function does.
	kthelgason 2016/12/08 08:42:03: Done.
	52 Fraction best_scale = kScaleFractions[arraysize(kScaleFractions) - 1];

	53 while (true) {

	54 const float scale =

	55 best_scale.numerator / static_cast<float>(best_scale.denominator);

	56 float test_num_pixels = input_num_pixels * scale * scale;

	57 if (target_num_pixels >= test_num_pixels) {
	magjed_webrtc 2016/12/07 13:44:51: Can we do it like this instead?
	    const float target_scale =
	        sqrt(target_num_pixels / static_cast<float>(input_num_pixels));
	    Fraction best_scale = kScaleFractions[arraysize(kScaleFractions) - 1];
	    while (best_scale.numerator > target_scale * best_scale.denominator) {
	      ...
	    }
	kthelgason 2016/12/08 08:42:03: Done.
	58 if (best_scale.numerator == 1) {
	magjed_webrtc 2016/12/07 13:44:51: nit: I think this makes the intent clearer:
	    if (best_scale.numerator % 3 == 0 && best_scale.denominator % 2 == 0) {
	      // Multiply with 2/3.
	      best_scale.numerator /= 3;
	      best_scale.denominator /= 2;
	    } else {
	      // Multiply with 3/4.
	      best_scale.numerator = 3;
	      best_scale.denominator = 4;
	    }
	kthelgason 2016/12/08 08:42:03: Done.
	59 best_scale.numerator = 3;

	60 best_scale.denominator *= 4;

	61 } else {

	62 best_scale.numerator = 1;

	63 best_scale.denominator /= 2;

	64 }

	65 } else {

	66 return best_scale;

	67 }

	68 }

	69 }

	70

	71 rtc::Optional<Fraction> FindOptimizedScaleLessThanOrEqual(

	72 int input_num_pixels,

	73 int target_num_pixels) {

49 float best_distance = std::numeric_limits<float>::max();	74 float best_distance = std::numeric_limits<float>::max();

50 Fraction best_scale = {0, 1}; // Default to 0 if nothing matches.	75 rtc::Optional<Fraction> best_scale;

51 for (const auto& fraction : kScaleFractions) {	76 for (const auto& fraction : kScaleFractions) {

52 const float scale =	77 const float scale =

53 fraction.numerator / static_cast<float>(fraction.denominator);	78 fraction.numerator / static_cast<float>(fraction.denominator);

54 float test_num_pixels = input_num_pixels * scale * scale;	79 float test_num_pixels = input_num_pixels * scale * scale;

55 float diff = target_num_pixels - test_num_pixels;	80 float diff = target_num_pixels - test_num_pixels;

56 if (diff < 0) {	81 if (diff < 0) {

57 continue;	82 continue;

58 }	83 }

59 if (diff < best_distance) {	84 if (diff < best_distance) {

60 best_distance = diff;	85 best_distance = diff;

61 best_scale = fraction;	86 best_scale = rtc::Optional<Fraction>(fraction);

62 if (best_distance == 0) { // Found exact match.	87 if (best_distance == 0) { // Found exact match.

63 break;	88 break;

64 }	89 }

65 }	90 }

66 }	91 }

67 return best_scale;	92 return best_scale;

68 }	93 }

69	94

70 Fraction FindScaleLargerThan(int input_num_pixels,	95 Fraction FindOptimizedScaleLargerThan(int input_num_pixels,

71 int target_num_pixels,	96 int target_num_pixels,

72 int* resulting_number_of_pixels) {	97 int* resulting_number_of_pixels) {

73 float best_distance = std::numeric_limits<float>::max();	98 float best_distance = std::numeric_limits<float>::max();

74 Fraction best_scale = {1, 1}; // Default to unscaled if nothing matches.	99 Fraction best_scale = {1, 1}; // Default to unscaled if nothing matches.

75 // Default to input number of pixels.	100 // Default to input number of pixels.

76 float best_number_of_pixels = input_num_pixels;	101 float best_number_of_pixels = input_num_pixels;

77 for (const auto& fraction : kScaleFractions) {	102 for (const auto& fraction : kScaleFractions) {

78 const float scale =	103 const float scale =

79 fraction.numerator / static_cast<float>(fraction.denominator);	104 fraction.numerator / static_cast<float>(fraction.denominator);

80 float test_num_pixels = input_num_pixels * scale * scale;	105 float test_num_pixels = input_num_pixels * scale * scale;

81 float diff = test_num_pixels - target_num_pixels;	106 float diff = test_num_pixels - target_num_pixels;

82 if (diff <= 0) {	107 if (diff <= 0) {

83 break;	108 break;

84 }	109 }

85 if (diff < best_distance) {	110 if (diff < best_distance) {

86 best_distance = diff;	111 best_distance = diff;

87 best_scale = fraction;	112 best_scale = fraction;

88 best_number_of_pixels = test_num_pixels;	113 best_number_of_pixels = test_num_pixels;

89 }	114 }

90 }	115 }

91	116

92 *resulting_number_of_pixels = static_cast<int>(best_number_of_pixels + .5f);	117 *resulting_number_of_pixels = static_cast<int>(best_number_of_pixels + .5f);

93 return best_scale;	118 return best_scale;

94 }	119 }

95	120

	121 rtc::Optional<Fraction> FindOptimizedScale(int input_num_pixels,

	122 int max_pixel_count_step_up,

	123 int max_pixel_count) {

	124 // Try scale just above |max_pixel_count_step_up_|.
	magjed_webrtc 2016/12/07 13:44:51: I find the code in the existing FindOptimizedScaleLessThanOrEqual and FindOptimizedScaleLargerThan really ugly. I think it would be cleaner to remove them and do std::upper_bound on kScaleFractions directly here + logic for handling the max_pixel_count_step_up. But this is totally unrelated so do it only if you want and have time.
	kthelgason 2016/12/08 08:42:03: I agree that this code is more complex than it needs to be, but in the interest of keeping this CL small and landing it sooner, as it does fix an actual crash, I'd like to do it in a follow-up CL. I filed 6848 and assigned it to myself to track it.
	125 if (max_pixel_count_step_up > 0) {

	126 int resulting_pixel_count;

	127 const Fraction scale = FindOptimizedScaleLargerThan(

	128 input_num_pixels, max_pixel_count_step_up, &resulting_pixel_count);

	129 if (resulting_pixel_count <= max_pixel_count)

	130 return rtc::Optional<Fraction>(scale);

	131 }

	132 // Return largest scale below |max_pixel_count|.

	133 return FindOptimizedScaleLessThanOrEqual(input_num_pixels, max_pixel_count);

	134 }

	135

96 Fraction FindScale(int input_num_pixels,	136 Fraction FindScale(int input_num_pixels,

97 int max_pixel_count_step_up,	137 int max_pixel_count_step_up,

98 int max_pixel_count) {	138 int max_pixel_count) {

99 // Try scale just above |max_pixel_count_step_up_|.	139 const rtc::Optional<Fraction> optimized_scale = FindOptimizedScale(

100 if (max_pixel_count_step_up > 0) {	140 input_num_pixels, max_pixel_count_step_up, max_pixel_count);

101 int resulting_pixel_count;	141 if (optimized_scale)

102 const Fraction scale = FindScaleLargerThan(	142 return *optimized_scale;

103 input_num_pixels, max_pixel_count_step_up, &resulting_pixel_count);

104 if (resulting_pixel_count <= max_pixel_count)

105 return scale;

106 }

107 // Return largest scale below |max_pixel_count|.

108 return FindScaleLessThanOrEqual(input_num_pixels, max_pixel_count);	143 return FindScaleLessThanOrEqual(input_num_pixels, max_pixel_count);

109 }	144 }

110

111 } // namespace	145 } // namespace

112	146

113 namespace cricket {	147 namespace cricket {

114	148

115 VideoAdapter::VideoAdapter()	149 VideoAdapter::VideoAdapter(int required_resolution_divisor)

116 : frames_in_(0),	150 : frames_in_(0),

117 frames_out_(0),	151 frames_out_(0),

118 frames_scaled_(0),	152 frames_scaled_(0),

119 adaption_changes_(0),	153 adaption_changes_(0),

120 previous_width_(0),	154 previous_width_(0),

121 previous_height_(0),	155 previous_height_(0),

	156 required_resolution_divisor_(required_resolution_divisor),

122 resolution_request_max_pixel_count_(std::numeric_limits<int>::max()),	157 resolution_request_max_pixel_count_(std::numeric_limits<int>::max()),

123 resolution_request_max_pixel_count_step_up_(0) {}	158 resolution_request_max_pixel_count_step_up_(0) {}

124	159

	160 VideoAdapter::VideoAdapter() : VideoAdapter(1) {}

	161

125 VideoAdapter::~VideoAdapter() {}	162 VideoAdapter::~VideoAdapter() {}

126	163

127 bool VideoAdapter::KeepFrame(int64_t in_timestamp_ns) {	164 bool VideoAdapter::KeepFrame(int64_t in_timestamp_ns) {

128 rtc::CritScope cs(&critical_section_);	165 rtc::CritScope cs(&critical_section_);

129 if (!requested_format_ || requested_format_->interval == 0)	166 if (!requested_format_ || requested_format_->interval == 0)

130 return true;	167 return true;

131	168

132 if (next_frame_timestamp_ns_) {	169 if (next_frame_timestamp_ns_) {

133 // Time until next frame should be outputted.	170 // Time until next frame should be outputted.

134 const int64_t time_until_next_frame_ns =	171 const int64_t time_until_next_frame_ns =

(...skipping 69 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
204 std::swap(requested_format_->width, requested_format_->height);	241 std::swap(requested_format_->width, requested_format_->height);

205 }	242 }

206 const float requested_aspect =	243 const float requested_aspect =

207 requested_format_->width /	244 requested_format_->width /

208 static_cast<float>(requested_format_->height);	245 static_cast<float>(requested_format_->height);

209 *cropped_width =	246 *cropped_width =

210 std::min(in_width, static_cast<int>(in_height * requested_aspect));	247 std::min(in_width, static_cast<int>(in_height * requested_aspect));

211 *cropped_height =	248 *cropped_height =

212 std::min(in_height, static_cast<int>(in_width / requested_aspect));	249 std::min(in_height, static_cast<int>(in_width / requested_aspect));

213 }	250 }

214

215 // Find best scale factor.

216 const Fraction scale =	251 const Fraction scale =

217 FindScale(*cropped_width * *cropped_height,	252 FindScale(*cropped_width * *cropped_height,

218 resolution_request_max_pixel_count_step_up_, max_pixel_count);	253 resolution_request_max_pixel_count_step_up_, max_pixel_count);

219

220 // Adjust cropping slightly to get even integer output size and a perfect	254 // Adjust cropping slightly to get even integer output size and a perfect

221 // scale factor.	255 // scale factor. Make sure the resulting dimensions are a multiple of 4
	magjed_webrtc 2016/12/07 13:44:51: Update the comment.
	kthelgason 2016/12/08 08:42:03: Done.
222 *cropped_width = roundUp(*cropped_width, scale.denominator, in_width);	256 // to be nice to hardware encoders.

223 *cropped_height = roundUp(*cropped_height, scale.denominator, in_height);	257 *cropped_width =

224 RTC_DCHECK_EQ(0, *cropped_width % scale.denominator);	258 roundUp(cropped_width, scale.denominator required_resolution_divisor_,

225 RTC_DCHECK_EQ(0, *cropped_height % scale.denominator);	258 roundUp(*cropped_width, scale.denominator * required_resolution_divisor_,

	260 *cropped_height =

	261 roundUp(*cropped_height, scale.denominator * required_resolution_divisor_,

	262 in_height);

	263 RTC_DCHECK_EQ(
	magjed_webrtc 2016/12/07 13:44:51: I think it's more clear to do:
	    RTC_DCHECK_EQ(0, *cropped_width % scale.denominator);
	  and
	    RTC_DCHECK_EQ(0, *out_width % required_resolution_divisor_);
	kthelgason 2016/12/08 08:42:03: Done.
	264 0, *cropped_width % scale.denominator * required_resolution_divisor_);

	265 RTC_DCHECK_EQ(

	266 0, *cropped_height % scale.denominator * required_resolution_divisor_);

226	267

227 // Calculate final output size.	268 // Calculate final output size.

228 *out_width = *cropped_width / scale.denominator * scale.numerator;	269 *out_width = *cropped_width / scale.denominator * scale.numerator;

229 *out_height = *cropped_height / scale.denominator * scale.numerator;	270 *out_height = *cropped_height / scale.denominator * scale.numerator;

230

231 ++frames_out_;	271 ++frames_out_;

232 if (scale.numerator != scale.denominator)	272 if (scale.numerator != scale.denominator)

233 ++frames_scaled_;	273 ++frames_scaled_;

234	274

235 if (previous_width_ && (previous_width_ != *out_width ||	275 if (previous_width_ && (previous_width_ != *out_width ||

236 previous_height_ != *out_height)) {	276 previous_height_ != *out_height)) {

237 ++adaption_changes_;	277 ++adaption_changes_;

238 LOG(LS_INFO) << "Frame size changed: scaled " << frames_scaled_ << " / out "	278 LOG(LS_INFO) << "Frame size changed: scaled " << frames_scaled_ << " / out "

239 << frames_out_ << " / in " << frames_in_	279 << frames_out_ << " / in " << frames_in_

240 << " Changes: " << adaption_changes_ << " Input: " << in_width	280 << " Changes: " << adaption_changes_ << " Input: " << in_width

(...skipping 19 matching lines...) Expand all Loading...
260 rtc::Optional<int> max_pixel_count,	300 rtc::Optional<int> max_pixel_count,

261 rtc::Optional<int> max_pixel_count_step_up) {	301 rtc::Optional<int> max_pixel_count_step_up) {

262 rtc::CritScope cs(&critical_section_);	302 rtc::CritScope cs(&critical_section_);

263 resolution_request_max_pixel_count_ =	303 resolution_request_max_pixel_count_ =

264 max_pixel_count.value_or(std::numeric_limits<int>::max());	304 max_pixel_count.value_or(std::numeric_limits<int>::max());

265 resolution_request_max_pixel_count_step_up_ =	305 resolution_request_max_pixel_count_step_up_ =

266 max_pixel_count_step_up.value_or(0);	306 max_pixel_count_step_up.value_or(0);

267 }	307 }

268	308

269 } // namespace cricket	309 } // namespace cricket

OLD	NEW