Chromium Code Reviews

Side by Side Diff: webrtc/media/base/videoadapter.cc

Issue 2555483005: Add ability to scale to arbitrary factors (Closed)
Patch Set: rebase Created 4 years ago
Use n/p to move between diff chunks; N/P to move between comments.
Jump to:
View unified diff |
OLDNEW
1 /* 1 /*
2 * Copyright (c) 2010 The WebRTC project authors. All Rights Reserved. 2 * Copyright (c) 2010 The WebRTC project authors. All Rights Reserved.
3 * 3 *
4 * Use of this source code is governed by a BSD-style license 4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source 5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found 6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may 7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree. 8 * be found in the AUTHORS file in the root of the source tree.
9 */ 9 */
10 10
11 #include "webrtc/media/base/videoadapter.h" 11 #include "webrtc/media/base/videoadapter.h"
12 12
13 #include <algorithm> 13 #include <algorithm>
14 #include <cmath>
14 #include <cstdlib> 15 #include <cstdlib>
15 #include <limits> 16 #include <limits>
16 17
18 #include "webrtc/base/arraysize.h"
17 #include "webrtc/base/checks.h" 19 #include "webrtc/base/checks.h"
18 #include "webrtc/base/logging.h" 20 #include "webrtc/base/logging.h"
21 #include "webrtc/base/optional.h"
19 #include "webrtc/media/base/mediaconstants.h" 22 #include "webrtc/media/base/mediaconstants.h"
20 #include "webrtc/media/base/videocommon.h" 23 #include "webrtc/media/base/videocommon.h"
21 24
22 namespace { 25 namespace {
23
24 struct Fraction { 26 struct Fraction {
25 int numerator; 27 int numerator;
26 int denominator; 28 int denominator;
27 }; 29 };
28 30
29 // Scale factors optimized for in libYUV that we accept. 31 // Scale factors optimized for in libYUV that we accept.
30 // Must be sorted in decreasing scale factors for FindScaleLargerThan to work. 32 // Must be sorted in decreasing scale factors for FindScaleLargerThan to work.
31 const Fraction kScaleFractions[] = { 33 const Fraction kScaleFractions[] = {
32 {1, 1}, 34 {1, 1},
33 {3, 4}, 35 {3, 4},
34 {1, 2}, 36 {1, 2},
35 {3, 8}, 37 {3, 8},
36 {1, 4}, 38 {1, 4},
37 {3, 16}, 39 {3, 16},
38 }; 40 };
39 41
40 // Round |valueToRound| to a multiple of |multiple|. Prefer rounding upwards, 42 // Round |valueToRound| to a multiple of |multiple|. Prefer rounding upwards,
41 // but never more than |maxValue|. 43 // but never more than |maxValue|.
42 int roundUp(int valueToRound, int multiple, int maxValue) { 44 int roundUp(int valueToRound, int multiple, int maxValue) {
magjed_webrtc 2016/12/07 13:44:51 nit: I know it's unrelated but can you please clea...
kthelgason 2016/12/08 08:42:03 Done.
43 const int roundedValue = (valueToRound + multiple - 1) / multiple * multiple; 45 const int roundedValue = (valueToRound + multiple - 1) / multiple * multiple;
44 return roundedValue <= maxValue ? roundedValue 46 return roundedValue <= maxValue ? roundedValue
45 : (maxValue / multiple * multiple); 47 : (maxValue / multiple * multiple);
46 } 48 }
47 49
48 Fraction FindScaleLessThanOrEqual(int input_num_pixels, int target_num_pixels) { 50 Fraction FindScaleLessThanOrEqual(int input_num_pixels, int target_num_pixels) {
51 // Start searching from the last of the optimal fractions;
magjed_webrtc 2016/12/07 13:44:51 It would be nice with a high level comment explain...
kthelgason 2016/12/08 08:42:03 Done.
52 Fraction best_scale = kScaleFractions[arraysize(kScaleFractions) - 1];
53 while (true) {
54 const float scale =
55 best_scale.numerator / static_cast<float>(best_scale.denominator);
56 float test_num_pixels = input_num_pixels * scale * scale;
57 if (target_num_pixels >= test_num_pixels) {
magjed_webrtc 2016/12/07 13:44:51 Can we do like this instead: const float target_sc...
kthelgason 2016/12/08 08:42:03 Done.
58 if (best_scale.numerator == 1) {
magjed_webrtc 2016/12/07 13:44:51 nit: I think this makes the intent clearer: if (be...
kthelgason 2016/12/08 08:42:03 Done.
59 best_scale.numerator = 3;
60 best_scale.denominator *= 4;
61 } else {
62 best_scale.numerator = 1;
63 best_scale.denominator /= 2;
64 }
65 } else {
66 return best_scale;
67 }
68 }
69 }
70
71 rtc::Optional<Fraction> FindOptimizedScaleLessThanOrEqual(
72 int input_num_pixels,
73 int target_num_pixels) {
49 float best_distance = std::numeric_limits<float>::max(); 74 float best_distance = std::numeric_limits<float>::max();
50 Fraction best_scale = {0, 1}; // Default to 0 if nothing matches. 75 rtc::Optional<Fraction> best_scale;
51 for (const auto& fraction : kScaleFractions) { 76 for (const auto& fraction : kScaleFractions) {
52 const float scale = 77 const float scale =
53 fraction.numerator / static_cast<float>(fraction.denominator); 78 fraction.numerator / static_cast<float>(fraction.denominator);
54 float test_num_pixels = input_num_pixels * scale * scale; 79 float test_num_pixels = input_num_pixels * scale * scale;
55 float diff = target_num_pixels - test_num_pixels; 80 float diff = target_num_pixels - test_num_pixels;
56 if (diff < 0) { 81 if (diff < 0) {
57 continue; 82 continue;
58 } 83 }
59 if (diff < best_distance) { 84 if (diff < best_distance) {
60 best_distance = diff; 85 best_distance = diff;
61 best_scale = fraction; 86 best_scale = rtc::Optional<Fraction>(fraction);
62 if (best_distance == 0) { // Found exact match. 87 if (best_distance == 0) { // Found exact match.
63 break; 88 break;
64 } 89 }
65 } 90 }
66 } 91 }
67 return best_scale; 92 return best_scale;
68 } 93 }
69 94
70 Fraction FindScaleLargerThan(int input_num_pixels, 95 Fraction FindOptimizedScaleLargerThan(int input_num_pixels,
71 int target_num_pixels, 96 int target_num_pixels,
72 int* resulting_number_of_pixels) { 97 int* resulting_number_of_pixels) {
73 float best_distance = std::numeric_limits<float>::max(); 98 float best_distance = std::numeric_limits<float>::max();
74 Fraction best_scale = {1, 1}; // Default to unscaled if nothing matches. 99 Fraction best_scale = {1, 1}; // Default to unscaled if nothing matches.
75 // Default to input number of pixels. 100 // Default to input number of pixels.
76 float best_number_of_pixels = input_num_pixels; 101 float best_number_of_pixels = input_num_pixels;
77 for (const auto& fraction : kScaleFractions) { 102 for (const auto& fraction : kScaleFractions) {
78 const float scale = 103 const float scale =
79 fraction.numerator / static_cast<float>(fraction.denominator); 104 fraction.numerator / static_cast<float>(fraction.denominator);
80 float test_num_pixels = input_num_pixels * scale * scale; 105 float test_num_pixels = input_num_pixels * scale * scale;
81 float diff = test_num_pixels - target_num_pixels; 106 float diff = test_num_pixels - target_num_pixels;
82 if (diff <= 0) { 107 if (diff <= 0) {
83 break; 108 break;
84 } 109 }
85 if (diff < best_distance) { 110 if (diff < best_distance) {
86 best_distance = diff; 111 best_distance = diff;
87 best_scale = fraction; 112 best_scale = fraction;
88 best_number_of_pixels = test_num_pixels; 113 best_number_of_pixels = test_num_pixels;
89 } 114 }
90 } 115 }
91 116
92 *resulting_number_of_pixels = static_cast<int>(best_number_of_pixels + .5f); 117 *resulting_number_of_pixels = static_cast<int>(best_number_of_pixels + .5f);
93 return best_scale; 118 return best_scale;
94 } 119 }
95 120
121 rtc::Optional<Fraction> FindOptimizedScale(int input_num_pixels,
122 int max_pixel_count_step_up,
123 int max_pixel_count) {
124 // Try scale just above |max_pixel_count_step_up_|.
magjed_webrtc 2016/12/07 13:44:51 I find the code in the existing FindOptimizedScale...
kthelgason 2016/12/08 08:42:03 I agree that this code is more complex than it nee...
125 if (max_pixel_count_step_up > 0) {
126 int resulting_pixel_count;
127 const Fraction scale = FindOptimizedScaleLargerThan(
128 input_num_pixels, max_pixel_count_step_up, &resulting_pixel_count);
129 if (resulting_pixel_count <= max_pixel_count)
130 return rtc::Optional<Fraction>(scale);
131 }
132 // Return largest scale below |max_pixel_count|.
133 return FindOptimizedScaleLessThanOrEqual(input_num_pixels, max_pixel_count);
134 }
135
96 Fraction FindScale(int input_num_pixels, 136 Fraction FindScale(int input_num_pixels,
97 int max_pixel_count_step_up, 137 int max_pixel_count_step_up,
98 int max_pixel_count) { 138 int max_pixel_count) {
99 // Try scale just above |max_pixel_count_step_up_|. 139 const rtc::Optional<Fraction> optimized_scale = FindOptimizedScale(
100 if (max_pixel_count_step_up > 0) { 140 input_num_pixels, max_pixel_count_step_up, max_pixel_count);
101 int resulting_pixel_count; 141 if (optimized_scale)
102 const Fraction scale = FindScaleLargerThan( 142 return *optimized_scale;
103 input_num_pixels, max_pixel_count_step_up, &resulting_pixel_count);
104 if (resulting_pixel_count <= max_pixel_count)
105 return scale;
106 }
107 // Return largest scale below |max_pixel_count|.
108 return FindScaleLessThanOrEqual(input_num_pixels, max_pixel_count); 143 return FindScaleLessThanOrEqual(input_num_pixels, max_pixel_count);
109 } 144 }
110
111 } // namespace 145 } // namespace
112 146
113 namespace cricket { 147 namespace cricket {
114 148
115 VideoAdapter::VideoAdapter() 149 VideoAdapter::VideoAdapter(int required_resolution_divisor)
116 : frames_in_(0), 150 : frames_in_(0),
117 frames_out_(0), 151 frames_out_(0),
118 frames_scaled_(0), 152 frames_scaled_(0),
119 adaption_changes_(0), 153 adaption_changes_(0),
120 previous_width_(0), 154 previous_width_(0),
121 previous_height_(0), 155 previous_height_(0),
156 required_resolution_divisor_(required_resolution_divisor),
122 resolution_request_max_pixel_count_(std::numeric_limits<int>::max()), 157 resolution_request_max_pixel_count_(std::numeric_limits<int>::max()),
123 resolution_request_max_pixel_count_step_up_(0) {} 158 resolution_request_max_pixel_count_step_up_(0) {}
124 159
160 VideoAdapter::VideoAdapter() : VideoAdapter(1) {}
161
125 VideoAdapter::~VideoAdapter() {} 162 VideoAdapter::~VideoAdapter() {}
126 163
127 bool VideoAdapter::KeepFrame(int64_t in_timestamp_ns) { 164 bool VideoAdapter::KeepFrame(int64_t in_timestamp_ns) {
128 rtc::CritScope cs(&critical_section_); 165 rtc::CritScope cs(&critical_section_);
129 if (!requested_format_ || requested_format_->interval == 0) 166 if (!requested_format_ || requested_format_->interval == 0)
130 return true; 167 return true;
131 168
132 if (next_frame_timestamp_ns_) { 169 if (next_frame_timestamp_ns_) {
133 // Time until next frame should be outputted. 170 // Time until next frame should be outputted.
134 const int64_t time_until_next_frame_ns = 171 const int64_t time_until_next_frame_ns =
(...skipping 69 matching lines...)
204 std::swap(requested_format_->width, requested_format_->height); 241 std::swap(requested_format_->width, requested_format_->height);
205 } 242 }
206 const float requested_aspect = 243 const float requested_aspect =
207 requested_format_->width / 244 requested_format_->width /
208 static_cast<float>(requested_format_->height); 245 static_cast<float>(requested_format_->height);
209 *cropped_width = 246 *cropped_width =
210 std::min(in_width, static_cast<int>(in_height * requested_aspect)); 247 std::min(in_width, static_cast<int>(in_height * requested_aspect));
211 *cropped_height = 248 *cropped_height =
212 std::min(in_height, static_cast<int>(in_width / requested_aspect)); 249 std::min(in_height, static_cast<int>(in_width / requested_aspect));
213 } 250 }
214
215 // Find best scale factor.
216 const Fraction scale = 251 const Fraction scale =
217 FindScale(*cropped_width * *cropped_height, 252 FindScale(*cropped_width * *cropped_height,
218 resolution_request_max_pixel_count_step_up_, max_pixel_count); 253 resolution_request_max_pixel_count_step_up_, max_pixel_count);
219
220 // Adjust cropping slightly to get even integer output size and a perfect 254 // Adjust cropping slightly to get even integer output size and a perfect
221 // scale factor. 255 // scale factor. Make sure the resulting dimensions are a multiple of 4
magjed_webrtc 2016/12/07 13:44:51 Update the comment.
kthelgason 2016/12/08 08:42:03 Done.
222 *cropped_width = roundUp(*cropped_width, scale.denominator, in_width); 256 // to be nice to hardware encoders.
223 *cropped_height = roundUp(*cropped_height, scale.denominator, in_height); 257 *cropped_width =
224 RTC_DCHECK_EQ(0, *cropped_width % scale.denominator); 258 roundUp(*cropped_width, scale.denominator * required_resolution_divisor_,
225 RTC_DCHECK_EQ(0, *cropped_height % scale.denominator); 259 in_width);
260 *cropped_height =
261 roundUp(*cropped_height, scale.denominator * required_resolution_divisor_,
262 in_height);
263 RTC_DCHECK_EQ(
magjed_webrtc 2016/12/07 13:44:51 I think it's more clear to do: RTC_DCHECK_EQ(0, *c...
kthelgason 2016/12/08 08:42:03 Done.
264 0, *cropped_width % scale.denominator * required_resolution_divisor_);
265 RTC_DCHECK_EQ(
266 0, *cropped_height % scale.denominator * required_resolution_divisor_);
226 267
227 // Calculate final output size. 268 // Calculate final output size.
228 *out_width = *cropped_width / scale.denominator * scale.numerator; 269 *out_width = *cropped_width / scale.denominator * scale.numerator;
229 *out_height = *cropped_height / scale.denominator * scale.numerator; 270 *out_height = *cropped_height / scale.denominator * scale.numerator;
230
231 ++frames_out_; 271 ++frames_out_;
232 if (scale.numerator != scale.denominator) 272 if (scale.numerator != scale.denominator)
233 ++frames_scaled_; 273 ++frames_scaled_;
234 274
235 if (previous_width_ && (previous_width_ != *out_width || 275 if (previous_width_ && (previous_width_ != *out_width ||
236 previous_height_ != *out_height)) { 276 previous_height_ != *out_height)) {
237 ++adaption_changes_; 277 ++adaption_changes_;
238 LOG(LS_INFO) << "Frame size changed: scaled " << frames_scaled_ << " / out " 278 LOG(LS_INFO) << "Frame size changed: scaled " << frames_scaled_ << " / out "
239 << frames_out_ << " / in " << frames_in_ 279 << frames_out_ << " / in " << frames_in_
240 << " Changes: " << adaption_changes_ << " Input: " << in_width 280 << " Changes: " << adaption_changes_ << " Input: " << in_width
(...skipping 19 matching lines...)
260 rtc::Optional<int> max_pixel_count, 300 rtc::Optional<int> max_pixel_count,
261 rtc::Optional<int> max_pixel_count_step_up) { 301 rtc::Optional<int> max_pixel_count_step_up) {
262 rtc::CritScope cs(&critical_section_); 302 rtc::CritScope cs(&critical_section_);
263 resolution_request_max_pixel_count_ = 303 resolution_request_max_pixel_count_ =
264 max_pixel_count.value_or(std::numeric_limits<int>::max()); 304 max_pixel_count.value_or(std::numeric_limits<int>::max());
265 resolution_request_max_pixel_count_step_up_ = 305 resolution_request_max_pixel_count_step_up_ =
266 max_pixel_count_step_up.value_or(0); 306 max_pixel_count_step_up.value_or(0);
267 } 307 }
268 308
269 } // namespace cricket 309 } // namespace cricket
OLDNEW

Powered by Google App Engine