webrtc/modules/video_coding/main/source/qm_select.h - Issue 1417283007: modules/video_coding refactorings

Side by Side Diff: webrtc/modules/video_coding/main/source/qm_select.h

Issue 1417283007: modules/video_coding refactorings (Closed) Base URL: https://chromium.googlesource.com/external/webrtc.git@master

Patch Set: Fix the other copy of the mock include header Created 5 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
	(Empty)
1 /*

2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.

3 *

4 * Use of this source code is governed by a BSD-style license

5 * that can be found in the LICENSE file in the root of the source

6 * tree. An additional intellectual property rights grant can be found

7 * in the file PATENTS. All contributing project authors may

8 * be found in the AUTHORS file in the root of the source tree.

9 */

10

11 #ifndef WEBRTC_MODULES_VIDEO_CODING_QM_SELECT_H_

12 #define WEBRTC_MODULES_VIDEO_CODING_QM_SELECT_H_

13

14 #include "webrtc/common_types.h"

15 #include "webrtc/typedefs.h"

16

17 /******************************************************/

18 /* Quality Modes: Resolution and Robustness settings */

19 /******************************************************/

20

21 namespace webrtc {

22 struct VideoContentMetrics;

23

// Bundle of codec frame size, frame rate, spatial/temporal scale factors and
// two "change resolution" flags. VCMQmResolution::SelectResolution() hands a
// pointer to one of these back to its caller.
// NOTE(review): exact meaning of each field is defined by qm_select.cc, which
// is not visible here -- confirm before relying on the names alone.
24 struct VCMResolutionScale {

// Defaults: 640x480 at 30 fps, all scale factors 1.0, both change flags false.
25 VCMResolutionScale()

26 : codec_width(640),

27 codec_height(480),

28 frame_rate(30.0f),

29 spatial_width_fact(1.0f),

30 spatial_height_fact(1.0f),

31 temporal_fact(1.0f),

32 change_resolution_spatial(false),

33 change_resolution_temporal(false) {

34 }

35 uint16_t codec_width;

36 uint16_t codec_height;

37 float frame_rate;

38 float spatial_width_fact;

39 float spatial_height_fact;

40 float temporal_fact;

41 bool change_resolution_spatial;

42 bool change_resolution_temporal;

43 };

44

// Frame-size classes, listed in order of increasing pixel count.
// kNumImageTypes is the number of classes; it sizes kSizeOfImageType.
45 enum ImageType {

46 kQCIF = 0, // 176x144

47 kHCIF, // 264x216 = half(~3/4x3/4) CIF.

48 kQVGA, // 320x240 = quarter VGA.

49 kCIF, // 352x288

50 kHVGA, // 480x360 = half(~3/4x3/4) VGA.

51 kVGA, // 640x480

52 kQFULLHD, // 960x540 = quarter FULLHD, and half(~3/4x3/4) WHD.

53 kWHD, // 1280x720

54 kFULLHD, // 1920x1080

55 kNumImageTypes

56 };

57

// Pixel count (width * height) of each ImageType, indexed by the enum value;
// e.g. kQCIF -> 176 * 144 = 25344, kFULLHD -> 1920 * 1080 = 2073600.
58 const uint32_t kSizeOfImageType[kNumImageTypes] =

59 { 25344, 57024, 76800, 101376, 172800, 307200, 518400, 921600, 2073600 };

60

// Frame-rate classes; this is the return type of VCMQmMethod::FrameRateLevel().
// The frame-rate thresholds separating the classes are not defined in this
// header.
61 enum FrameRateLevelClass {

62 kFrameRateLow,

63 kFrameRateMiddle1,

64 kFrameRateMiddle2,

65 kFrameRateHigh

66 };

67

// Level attached to a content feature (see VCMContFeature::level).
// kDefault is the value a VCMContFeature holds after construction or Reset().
68 enum ContentLevelClass {

69 kLow,

70 kHigh,

71 kDefault

72 };

73

// A content feature: a float magnitude plus its ContentLevelClass.
// VCMQmMethod keeps one for motion and one for spatial content.
74 struct VCMContFeature {

// Starts at value 0.0 and level kDefault.
75 VCMContFeature()

76 : value(0.0f),

77 level(kDefault) {

78 }

// Restores the same state the constructor sets up.
79 void Reset() {

80 value = 0.0f;

81 level = kDefault;

82 }

83 float value;

84 ContentLevelClass level;

85 };

86

// Direction of a resolution change; the argument type of
// VCMQmResolution::UpdateDownsamplingState().
87 enum UpDownAction {

88 kUpResolution,

89 kDownResolution

90 };

91

// Spatial down-sampling modes. The values index kFactorWidthSpatial and
// kFactorHeightSpatial; kNumModesSpatial is the number of modes.
92 enum SpatialAction {

93 kNoChangeSpatial,

94 kOneHalfSpatialUniform, // 3/4 x 3/4: 9/16 ~1/2 pixel reduction.

95 kOneQuarterSpatialUniform, // 1/2 x 1/2: 1/4 pixel reduction.

96 kNumModesSpatial

97 };

98

// Temporal (frame-rate) down-sampling modes. The values index kFactorTemporal;
// kNumModesTemporal is the number of modes.
99 enum TemporalAction {

100 kNoChangeTemporal,

101 kTwoThirdsTemporal, // 2/3 frame rate reduction

102 kOneHalfTemporal, // 1/2 frame rate reduction

103 kNumModesTemporal

104 };

105

// A combined spatial + temporal action. VCMQmResolution stores the current
// one and a short history of past ones.
106 struct ResolutionAction {

// Starts as "no change" in both dimensions.
107 ResolutionAction()

108 : spatial(kNoChangeSpatial),

109 temporal(kNoChangeTemporal) {

110 }

111 SpatialAction spatial;

112 TemporalAction temporal;

113 };

114

115 // Down-sampling factors for spatial (width and height), and temporal.
// The spatial tables are indexed by SpatialAction and the temporal table by
// TemporalAction. Each entry is a divisor: 4/3 matches the "3/4" scaling and
// 2.0 the "1/2" scaling named in the enum comments.

116 const float kFactorWidthSpatial[kNumModesSpatial] =

117 { 1.0f, 4.0f / 3.0f, 2.0f };

118

119 const float kFactorHeightSpatial[kNumModesSpatial] =

120 { 1.0f, 4.0f / 3.0f, 2.0f };

121

122 const float kFactorTemporal[kNumModesTemporal] =

123 { 1.0f, 1.5f, 2.0f };

124

// Encoder rate-control state; returned by VCMQmResolution::GetEncoderState().
125 enum EncoderState {

126 kStableEncoding, // Low rate mis-match, stable buffer levels.

127 kStressedEncoding, // Significant over-shooting of target rate,

128 // Buffer under-flow, etc.

129 kEasyEncoding // Significant under-shooting of target rate.

130 };

131

132 // QmMethod class: main class for resolution and robustness settings.
// Abstract base of VCMQmResolution and VCMQmRobustness: Reset() is pure
// virtual, so the class cannot be instantiated directly.

133

134 class VCMQmMethod {

135 public:

136 VCMQmMethod();

137 virtual ~VCMQmMethod();

138

139 // Reset values. ResetQM() is non-virtual; Reset() must be provided by each subclass.

140 void ResetQM();

141 virtual void Reset() = 0;

142

143 // Compute content class.

144 uint8_t ComputeContentClass();

145

146 // Update with the content metrics.

147 void UpdateContent(const VideoContentMetrics* content_metrics);

148

149 // Compute spatial texture magnitude and level.

150 // Spatial texture is a spatial prediction error measure.

151 void ComputeSpatial();

152

153 // Compute motion magnitude and level for NFD metric.

154 // NFD is normalized frame difference (normalized by spatial variance).

155 void ComputeMotionNFD();

156

157 // Get the imageType (CIF, VGA, HD, etc) for the system width/height.

158 ImageType GetImageType(uint16_t width, uint16_t height);

159

160 // Return the closest image type.

161 ImageType FindClosestImageType(uint16_t width, uint16_t height);

162

163 // Get the frame rate level.

164 FrameRateLevelClass FrameRateLevel(float frame_rate);

165

166 protected:

167 // Content Data. NOTE(review): raw pointer; ownership is not visible in this header.

168 const VideoContentMetrics* content_metrics_;

169

170 // Encoder frame sizes and native frame sizes.

171 uint16_t width_;

172 uint16_t height_;

173 float user_frame_rate_;

174 uint16_t native_width_;

175 uint16_t native_height_;

176 float native_frame_rate_;

177 float aspect_ratio_;

178 // Image type and frame rate level, for the current encoder resolution.

179 ImageType image_type_;

180 FrameRateLevelClass framerate_level_;

181 // Content class data.

182 VCMContFeature motion_;

183 VCMContFeature spatial_;

184 uint8_t content_class_;

185 bool init_;

186 };

187

188 // Resolution settings class: selects spatial/temporal resolution actions.
// Derives from VCMQmMethod and supplies its pure-virtual Reset().

189

190 class VCMQmResolution : public VCMQmMethod {

191 public:

192 VCMQmResolution();

193 virtual ~VCMQmResolution();

194

195 // Reset all quantities.

196 virtual void Reset();

197

198 // Reset rate quantities and counters after every SelectResolution() call.

199 void ResetRates();

200

201 // Reset down-sampling state.

202 void ResetDownSamplingState();

203

204 // Get the encoder state.

205 EncoderState GetEncoderState();

206

207 // Initialize after SetEncodingData in media_opt.
// NOTE(review): the meaning of the int return value is not documented here.

208 int Initialize(float bitrate,

209 float user_framerate,

210 uint16_t width,

211 uint16_t height,

212 int num_layers);

213

214 // Update the encoder frame size.

215 void UpdateCodecParameters(float frame_rate, uint16_t width, uint16_t height);

216

217 // Update with actual bit rate (size of the latest encoded frame)

218 // and frame type, after every encoded frame.
// NOTE(review): only |encoded_size| is passed; the "frame type" mentioned
// above is not a parameter of this function -- the comment may be stale.

219 void UpdateEncodedSize(size_t encoded_size);

220

221 // Update with new target bitrate, actual encoder sent rate, frame_rate,

222 // loss rate: every ~1 sec from SetTargetRates in media_opt.

223 void UpdateRates(float target_bitrate,

224 float encoder_sent_rate,

225 float incoming_framerate,

226 uint8_t packet_loss);

227

228 // Extract ST (spatio-temporal) resolution action.

229 // Inputs: qm: Reference to the quality modes pointer.

230 // Output: the spatial and/or temporal scale change.
// NOTE(review): the meaning of the int return value is not documented here.

231 int SelectResolution(VCMResolutionScale** qm);

232

233 private:

234 // Set the default resolution action.

235 void SetDefaultAction();

236

237 // Compute rates for the selection of down-sampling action.

238 void ComputeRatesForSelection();

239

240 // Compute the encoder state.

241 void ComputeEncoderState();

242

243 // Return true if the action is to go back up in resolution.

244 bool GoingUpResolution();

245

246 // Return true if the action is to go down in resolution.

247 bool GoingDownResolution();

248

249 // Check the condition for going up in resolution by the scale factors:

250 // |fac_width|, |fac_height|, |fac_temp|.

251 // |scale_fac| is a scale factor for the transition rate.

252 bool ConditionForGoingUp(float fac_width,

253 float fac_height,

254 float fac_temp,

255 float scale_fac);

256

257 // Get the bitrate threshold for the resolution action.

258 // The case |fac_width|=|fac_height|=|fac_temp|==1 is for down-sampling action.

259 // |scale_fac| is a scale factor for the transition rate.

260 float GetTransitionRate(float fac_width,

261 float fac_height,

262 float fac_temp,

263 float scale_fac);

264

265 // Update the down-sampling state.

266 void UpdateDownsamplingState(UpDownAction up_down);

267

268 // Update the codec frame size and frame rate.

269 void UpdateCodecResolution();

270

271 // Return a state based on average target rate relative to the transition rate.

272 uint8_t RateClass(float transition_rate);

273

274 // Adjust the action selected from the table.

275 void AdjustAction();

276

277 // Convert 2 stages of 3/4 (=9/16) spatial decimation to 1/2.

278 void ConvertSpatialFractionalToWhole();

279

280 // Returns true if the new frame sizes, under the selected spatial action,

281 // are of even size.

282 bool EvenFrameSize();

283

284 // Insert latest down-sampling action into the history list.

285 void InsertLatestDownAction();

286

287 // Remove the last (first element) down-sampling action from the list.

288 void RemoveLastDownAction();

289

290 // Check constraints on the amount of down-sampling allowed.

291 void ConstrainAmountOfDownSampling();

292

293 // For going up in resolution: pick spatial or temporal action,

294 // if both actions were separately selected.

295 void PickSpatialOrTemporal();

296

297 // Select the directional (1x2 or 2x1) spatial down-sampling action.
// NOTE(review): SpatialAction in this header declares no 1x2/2x1 modes, so
// the wording above may be stale -- confirm against qm_select.cc.

298 void SelectSpatialDirectionMode(float transition_rate);

299

// Capacity of down_action_history_.
300 enum { kDownActionHistorySize = 10};

301

// NOTE(review): raw pointer; who allocates and frees it is not visible here.
302 VCMResolutionScale* qm_;

303 // Encoder rate control parameters.

304 float target_bitrate_;

305 float incoming_framerate_;

306 float per_frame_bandwidth_;

307 float buffer_level_;

308

309 // Data accumulated every ~1sec from MediaOpt.

310 float sum_target_rate_;

311 float sum_incoming_framerate_;

312 float sum_rate_MM_;

313 float sum_rate_MM_sgn_;

314 float sum_packet_loss_;

315 // Counters.

316 uint32_t frame_cnt_;

317 uint32_t frame_cnt_delta_;

318 uint32_t update_rate_cnt_;

319 uint32_t low_buffer_cnt_;

320

321 // Resolution state parameters.

322 float state_dec_factor_spatial_;

323 float state_dec_factor_temporal_;

324

325 // Quantities used for selection.

326 float avg_target_rate_;

327 float avg_incoming_framerate_;

328 float avg_ratio_buffer_low_;

329 float avg_rate_mismatch_;

330 float avg_rate_mismatch_sgn_;

331 float avg_packet_loss_;

332 EncoderState encoder_state_;

333 ResolutionAction action_;

334 // Short history of the down-sampling actions from the Initialize() state.

335 // This is needed for going up in resolution. Since the total amount of

336 // down-sampling actions is constrained, the length of the list need not be

337 // large: i.e., (4/3) ^{kDownActionHistorySize} <= kMaxDownSample.

338 ResolutionAction down_action_history_[kDownActionHistorySize];

339 int num_layers_;

340 };

341

342 // Robustness settings class: FEC adjustment and UEP protection on/off.
// Derives from VCMQmMethod and supplies its pure-virtual Reset().

343

344 class VCMQmRobustness : public VCMQmMethod {

345 public:

346 VCMQmRobustness();

// Implicitly virtual, because the base-class destructor is declared virtual.
347 ~VCMQmRobustness();

348

349 virtual void Reset();

350

351 // Adjust FEC rate based on content: every ~1 sec from SetTargetRates.

352 // Returns an adjustment factor.

353 float AdjustFecFactor(uint8_t code_rate_delta,

354 float total_rate,

355 float framerate,

356 int64_t rtt_time,

357 uint8_t packet_loss);

358

359 // Set the UEP protection on/off.
// NOTE(review): |frame_type| is a bool whose meaning, like that of the bool
// return value, is not visible in this header -- confirm in qm_select.cc.

360 bool SetUepProtection(uint8_t code_rate_delta,

361 float total_rate,

362 uint8_t packet_loss,

363 bool frame_type);

364

365 private:

366 // Previous state of network parameters.

367 float prev_total_rate_;

368 int64_t prev_rtt_time_;

369 uint8_t prev_packet_loss_;

370 uint8_t prev_code_rate_delta_;

371 };

372 } // namespace webrtc

373 #endif // WEBRTC_MODULES_VIDEO_CODING_QM_SELECT_H_

OLD	NEW

« no previous file with comments | « webrtc/modules/video_coding/main/source/packet.cc ('k') | webrtc/modules/video_coding/main/source/qm_select.cc » ('j') | no next file with comments »