webrtc/modules/video_processing/main/source/content_analysis.cc - Issue 1410663004: modules/video_processing: refactor interface->include + more.

Side by Side Diff: webrtc/modules/video_processing/main/source/content_analysis.cc

Issue 1410663004: modules/video_processing: refactor interface->include + more. (Closed) Base URL: https://chromium.googlesource.com/external/webrtc.git@master

Patch Set: Rebased Created 5 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

« no previous file with comments | « webrtc/modules/video_processing/main/source/content_analysis.h ('k') | webrtc/modules/video_processing/main/source/content_analysis_sse2.cc » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

OLD	NEW
	(Empty)
1 /*

2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.

3 *

4 * Use of this source code is governed by a BSD-style license

5 * that can be found in the LICENSE file in the root of the source

6 * tree. An additional intellectual property rights grant can be found

7 * in the file PATENTS. All contributing project authors may

8 * be found in the AUTHORS file in the root of the source tree.

9 */

10 #include "webrtc/modules/video_processing/main/source/content_analysis.h"

11

12 #include <math.h>

13 #include <stdlib.h>

14

15 #include "webrtc/system_wrappers/include/cpu_features_wrapper.h"

16 #include "webrtc/system_wrappers/include/tick_util.h"

17

18 namespace webrtc {

19

20 VPMContentAnalysis::VPMContentAnalysis(bool runtime_cpu_detection)

21 : orig_frame_(NULL),

22 prev_frame_(NULL),

23 width_(0),

24 height_(0),

25 skip_num_(1),

26 border_(8),

27 motion_magnitude_(0.0f),

28 spatial_pred_err_(0.0f),

29 spatial_pred_err_h_(0.0f),

30 spatial_pred_err_v_(0.0f),

31 first_frame_(true),

32 ca_Init_(false),

33 content_metrics_(NULL) {

34 ComputeSpatialMetrics = &VPMContentAnalysis::ComputeSpatialMetrics_C;

35 TemporalDiffMetric = &VPMContentAnalysis::TemporalDiffMetric_C;

36

37 if (runtime_cpu_detection) {

38 #if defined(WEBRTC_ARCH_X86_FAMILY)

39 if (WebRtc_GetCPUInfo(kSSE2)) {

40 ComputeSpatialMetrics = &VPMContentAnalysis::ComputeSpatialMetrics_SSE2;

41 TemporalDiffMetric = &VPMContentAnalysis::TemporalDiffMetric_SSE2;

42 }

43 #endif

44 }

45 Release();

46 }

47

48 VPMContentAnalysis::~VPMContentAnalysis() {

49 Release();

50 }

51

52 VideoContentMetrics* VPMContentAnalysis::ComputeContentMetrics(

53 const VideoFrame& inputFrame) {

54 if (inputFrame.IsZeroSize())

55 return NULL;

56

57 // Init if needed (native dimension change).

58 if (width_ != inputFrame.width() \|\| height_ != inputFrame.height()) {

59 if (VPM_OK != Initialize(inputFrame.width(), inputFrame.height()))

60 return NULL;

61 }

62 // Only interested in the Y plane.

63 orig_frame_ = inputFrame.buffer(kYPlane);

64

65 // Compute spatial metrics: 3 spatial prediction errors.

66 (this->*ComputeSpatialMetrics)();

67

68 // Compute motion metrics

69 if (first_frame_ == false)

70 ComputeMotionMetrics();

71

72 // Saving current frame as previous one: Y only.

73 memcpy(prev_frame_, orig_frame_, width_ * height_);

74

75 first_frame_ = false;

76 ca_Init_ = true;

77

78 return ContentMetrics();

79 }

80

81 int32_t VPMContentAnalysis::Release() {

82 if (content_metrics_ != NULL) {

83 delete content_metrics_;

84 content_metrics_ = NULL;

85 }

86

87 if (prev_frame_ != NULL) {

88 delete [] prev_frame_;

89 prev_frame_ = NULL;

90 }

91

92 width_ = 0;

93 height_ = 0;

94 first_frame_ = true;

95

96 return VPM_OK;

97 }

98

99 int32_t VPMContentAnalysis::Initialize(int width, int height) {

100 width_ = width;

101 height_ = height;

102 first_frame_ = true;

103

104 // skip parameter: # of skipped rows: for complexity reduction

105 // temporal also currently uses it for column reduction.

106 skip_num_ = 1;

107

108 // use skipNum = 2 for 4CIF, WHD

109 if ( (height_ >= 576) && (width_ >= 704) ) {

110 skip_num_ = 2;

111 }

112 // use skipNum = 4 for FULLL_HD images

113 if ( (height_ >= 1080) && (width_ >= 1920) ) {

114 skip_num_ = 4;

115 }

116

117 if (content_metrics_ != NULL) {

118 delete content_metrics_;

119 }

120

121 if (prev_frame_ != NULL) {

122 delete [] prev_frame_;

123 }

124

125 // Spatial Metrics don't work on a border of 8. Minimum processing

126 // block size is 16 pixels. So make sure the width and height support this.

127 if (width_ <= 32 \|\| height_ <= 32) {

128 ca_Init_ = false;

129 return VPM_PARAMETER_ERROR;

130 }

131

132 content_metrics_ = new VideoContentMetrics();

133 if (content_metrics_ == NULL) {

134 return VPM_MEMORY;

135 }

136

137 prev_frame_ = new uint8_t[width_ * height_]; // Y only.

138 if (prev_frame_ == NULL) return VPM_MEMORY;

139

140 return VPM_OK;

141 }

142

143

144 // Compute motion metrics: magnitude over non-zero motion vectors,

145 // and size of zero cluster

146 int32_t VPMContentAnalysis::ComputeMotionMetrics() {

147 // Motion metrics: only one is derived from normalized

148 // (MAD) temporal difference

149 (this->*TemporalDiffMetric)();

150 return VPM_OK;

151 }

152

153 // Normalized temporal difference (MAD): used as a motion level metric

154 // Normalize MAD by spatial contrast: images with more contrast

155 // (pixel variance) likely have larger temporal difference

156 // To reduce complexity, we compute the metric for a reduced set of points.

157 int32_t VPMContentAnalysis::TemporalDiffMetric_C() {

158 // size of original frame

159 int sizei = height_;

160 int sizej = width_;

161 uint32_t tempDiffSum = 0;

162 uint32_t pixelSum = 0;

163 uint64_t pixelSqSum = 0;

164

165 uint32_t num_pixels = 0; // Counter for # of pixels.

166 const int width_end = ((width_ - 2*border_) & -16) + border_;

167

168 for (int i = border_; i < sizei - border_; i += skip_num_) {

169 for (int j = border_; j < width_end; j++) {

170 num_pixels += 1;

171 int ssn = i * sizej + j;

172

173 uint8_t currPixel = orig_frame_[ssn];

174 uint8_t prevPixel = prev_frame_[ssn];

175

176 tempDiffSum += (uint32_t)abs((int16_t)(currPixel - prevPixel));

177 pixelSum += (uint32_t) currPixel;

178 pixelSqSum += (uint64_t) (currPixel * currPixel);

179 }

180 }

181

182 // Default.

183 motion_magnitude_ = 0.0f;

184

185 if (tempDiffSum == 0) return VPM_OK;

186

187 // Normalize over all pixels.

188 float const tempDiffAvg = (float)tempDiffSum / (float)(num_pixels);

189 float const pixelSumAvg = (float)pixelSum / (float)(num_pixels);

190 float const pixelSqSumAvg = (float)pixelSqSum / (float)(num_pixels);

191 float contrast = pixelSqSumAvg - (pixelSumAvg * pixelSumAvg);

192

193 if (contrast > 0.0) {

194 contrast = sqrt(contrast);

195 motion_magnitude_ = tempDiffAvg/contrast;

196 }

197 return VPM_OK;

198 }

199

200 // Compute spatial metrics:

201 // To reduce complexity, we compute the metric for a reduced set of points.

202 // The spatial metrics are rough estimates of the prediction error cost for

203 // each QM spatial mode: 2x2,1x2,2x1

204 // The metrics are a simple estimate of the up-sampling prediction error,

205 // estimated assuming sub-sampling for decimation (no filtering),

206 // and up-sampling back up with simple bilinear interpolation.

207 int32_t VPMContentAnalysis::ComputeSpatialMetrics_C() {

208 const int sizei = height_;

209 const int sizej = width_;

210

211 // Pixel mean square average: used to normalize the spatial metrics.

212 uint32_t pixelMSA = 0;

213

214 uint32_t spatialErrSum = 0;

215 uint32_t spatialErrVSum = 0;

216 uint32_t spatialErrHSum = 0;

217

218 // make sure work section is a multiple of 16

219 const int width_end = ((sizej - 2*border_) & -16) + border_;

220

221 for (int i = border_; i < sizei - border_; i += skip_num_) {

222 for (int j = border_; j < width_end; j++) {

223 int ssn1= i * sizej + j;

224 int ssn2 = (i + 1) * sizej + j; // bottom

225 int ssn3 = (i - 1) * sizej + j; // top

226 int ssn4 = i * sizej + j + 1; // right

227 int ssn5 = i * sizej + j - 1; // left

228

229 uint16_t refPixel1 = orig_frame_[ssn1] << 1;

230 uint16_t refPixel2 = orig_frame_[ssn1] << 2;

231

232 uint8_t bottPixel = orig_frame_[ssn2];

233 uint8_t topPixel = orig_frame_[ssn3];

234 uint8_t rightPixel = orig_frame_[ssn4];

235 uint8_t leftPixel = orig_frame_[ssn5];

236

237 spatialErrSum += (uint32_t) abs((int16_t)(refPixel2

238 - (uint16_t)(bottPixel + topPixel + leftPixel + rightPixel)));

239 spatialErrVSum += (uint32_t) abs((int16_t)(refPixel1

240 - (uint16_t)(bottPixel + topPixel)));

241 spatialErrHSum += (uint32_t) abs((int16_t)(refPixel1

242 - (uint16_t)(leftPixel + rightPixel)));

243 pixelMSA += orig_frame_[ssn1];

244 }

245 }

246

247 // Normalize over all pixels.

248 const float spatialErr = (float)(spatialErrSum >> 2);

249 const float spatialErrH = (float)(spatialErrHSum >> 1);

250 const float spatialErrV = (float)(spatialErrVSum >> 1);

251 const float norm = (float)pixelMSA;

252

253 // 2X2:

254 spatial_pred_err_ = spatialErr / norm;

255 // 1X2:

256 spatial_pred_err_h_ = spatialErrH / norm;

257 // 2X1:

258 spatial_pred_err_v_ = spatialErrV / norm;

259 return VPM_OK;

260 }

261

262 VideoContentMetrics* VPMContentAnalysis::ContentMetrics() {

263 if (ca_Init_ == false) return NULL;

264

265 content_metrics_->spatial_pred_err = spatial_pred_err_;

266 content_metrics_->spatial_pred_err_h = spatial_pred_err_h_;

267 content_metrics_->spatial_pred_err_v = spatial_pred_err_v_;

268 // Motion metric: normalized temporal difference (MAD).

269 content_metrics_->motion_magnitude = motion_magnitude_;

270

271 return content_metrics_;

272 }

273

274 } // namespace webrtc

OLD	NEW