Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(4)

Side by Side Diff: webrtc/modules/audio_processing/audio_buffer.cc

Issue 1226093007: Allow more than 2 input channels in AudioProcessing. (Closed) Base URL: https://chromium.googlesource.com/external/webrtc.git@master
Patch Set: Fix docs Created 5 years, 5 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
1 /* 1 /*
2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. 2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
3 * 3 *
4 * Use of this source code is governed by a BSD-style license 4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source 5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found 6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may 7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree. 8 * be found in the AUTHORS file in the root of the source tree.
9 */ 9 */
10 10
11 #include "webrtc/modules/audio_processing/audio_buffer.h" 11 #include "webrtc/modules/audio_processing/audio_buffer.h"
12 12
13 #include "webrtc/common_audio/include/audio_util.h" 13 #include "webrtc/common_audio/include/audio_util.h"
14 #include "webrtc/common_audio/resampler/push_sinc_resampler.h" 14 #include "webrtc/common_audio/resampler/push_sinc_resampler.h"
15 #include "webrtc/common_audio/signal_processing/include/signal_processing_librar y.h" 15 #include "webrtc/common_audio/signal_processing/include/signal_processing_librar y.h"
16 #include "webrtc/common_audio/channel_buffer.h" 16 #include "webrtc/common_audio/channel_buffer.h"
17 #include "webrtc/modules/audio_processing/common.h" 17 #include "webrtc/modules/audio_processing/common.h"
18 18
19 namespace webrtc { 19 namespace webrtc {
20 namespace { 20 namespace {
21 21
22 const int kSamplesPer16kHzChannel = 160; 22 const int kSamplesPer16kHzChannel = 160;
23 const int kSamplesPer32kHzChannel = 320; 23 const int kSamplesPer32kHzChannel = 320;
24 const int kSamplesPer48kHzChannel = 480; 24 const int kSamplesPer48kHzChannel = 480;
25 25
26 bool HasKeyboardChannel(AudioProcessing::ChannelLayout layout) { 26 int KeyboardChannelIndex(const StreamConfig& stream_config) {
27 switch (layout) { 27 if (!stream_config.has_keyboard()) {
28 case AudioProcessing::kMono: 28 assert(false);
29 case AudioProcessing::kStereo: 29 return -1;
30 return false;
31 case AudioProcessing::kMonoAndKeyboard:
32 case AudioProcessing::kStereoAndKeyboard:
33 return true;
34 } 30 }
35 assert(false);
36 return false;
37 }
38 31
39 int KeyboardChannelIndex(AudioProcessing::ChannelLayout layout) { 32 return stream_config.num_channels();
40 switch (layout) {
41 case AudioProcessing::kMono:
42 case AudioProcessing::kStereo:
43 assert(false);
44 return -1;
45 case AudioProcessing::kMonoAndKeyboard:
46 return 1;
47 case AudioProcessing::kStereoAndKeyboard:
48 return 2;
49 }
50 assert(false);
51 return -1;
52 }
53
54 template <typename T>
55 void StereoToMono(const T* left, const T* right, T* out,
56 int num_frames) {
57 for (int i = 0; i < num_frames; ++i)
58 out[i] = (left[i] + right[i]) / 2;
59 } 33 }
60 34
61 int NumBandsFromSamplesPerChannel(int num_frames) { 35 int NumBandsFromSamplesPerChannel(int num_frames) {
62 int num_bands = 1; 36 int num_bands = 1;
63 if (num_frames == kSamplesPer32kHzChannel || 37 if (num_frames == kSamplesPer32kHzChannel ||
64 num_frames == kSamplesPer48kHzChannel) { 38 num_frames == kSamplesPer48kHzChannel) {
65 num_bands = rtc::CheckedDivExact(num_frames, 39 num_bands = rtc::CheckedDivExact(num_frames,
66 static_cast<int>(kSamplesPer16kHzChannel)); 40 static_cast<int>(kSamplesPer16kHzChannel));
67 } 41 }
68 return num_bands; 42 return num_bands;
(...skipping 15 matching lines...) Expand all
84 num_bands_(NumBandsFromSamplesPerChannel(proc_num_frames_)), 58 num_bands_(NumBandsFromSamplesPerChannel(proc_num_frames_)),
85 num_split_frames_(rtc::CheckedDivExact(proc_num_frames_, num_bands_)), 59 num_split_frames_(rtc::CheckedDivExact(proc_num_frames_, num_bands_)),
86 mixed_low_pass_valid_(false), 60 mixed_low_pass_valid_(false),
87 reference_copied_(false), 61 reference_copied_(false),
88 activity_(AudioFrame::kVadUnknown), 62 activity_(AudioFrame::kVadUnknown),
89 keyboard_data_(NULL), 63 keyboard_data_(NULL),
90 data_(new IFChannelBuffer(proc_num_frames_, num_proc_channels_)) { 64 data_(new IFChannelBuffer(proc_num_frames_, num_proc_channels_)) {
91 assert(input_num_frames_ > 0); 65 assert(input_num_frames_ > 0);
92 assert(proc_num_frames_ > 0); 66 assert(proc_num_frames_ > 0);
93 assert(output_num_frames_ > 0); 67 assert(output_num_frames_ > 0);
94 assert(num_input_channels_ > 0 && num_input_channels_ <= 2); 68 assert(num_input_channels_ > 0);
95 assert(num_proc_channels_ > 0 && num_proc_channels_ <= num_input_channels_); 69 assert(num_proc_channels_ > 0 && num_proc_channels_ <= num_input_channels_);
96 70
97 if (input_num_frames_ != proc_num_frames_ || 71 if (input_num_frames_ != proc_num_frames_ ||
98 output_num_frames_ != proc_num_frames_) { 72 output_num_frames_ != proc_num_frames_) {
99 // Create an intermediate buffer for resampling. 73 // Create an intermediate buffer for resampling.
100 process_buffer_.reset(new ChannelBuffer<float>(proc_num_frames_, 74 process_buffer_.reset(new ChannelBuffer<float>(proc_num_frames_,
101 num_proc_channels_)); 75 num_proc_channels_));
102 76
103 if (input_num_frames_ != proc_num_frames_) { 77 if (input_num_frames_ != proc_num_frames_) {
104 for (int i = 0; i < num_proc_channels_; ++i) { 78 for (int i = 0; i < num_proc_channels_; ++i) {
(...skipping 18 matching lines...) Expand all
123 num_bands_)); 97 num_bands_));
124 splitting_filter_.reset(new SplittingFilter(num_proc_channels_, 98 splitting_filter_.reset(new SplittingFilter(num_proc_channels_,
125 num_bands_, 99 num_bands_,
126 proc_num_frames_)); 100 proc_num_frames_));
127 } 101 }
128 } 102 }
129 103
130 AudioBuffer::~AudioBuffer() {} 104 AudioBuffer::~AudioBuffer() {}
131 105
132 void AudioBuffer::CopyFrom(const float* const* data, 106 void AudioBuffer::CopyFrom(const float* const* data,
133 int num_frames, 107 const StreamConfig& stream_config) {
134 AudioProcessing::ChannelLayout layout) { 108 assert(stream_config.num_frames() == input_num_frames_);
135 assert(num_frames == input_num_frames_); 109 assert(stream_config.num_channels() == num_input_channels_);
136 assert(ChannelsFromLayout(layout) == num_input_channels_);
137 InitForNewData(); 110 InitForNewData();
138 // Initialized lazily because there's a different condition in 111 // Initialized lazily because there's a different condition in
139 // DeinterleaveFrom. 112 // DeinterleaveFrom.
140 if ((num_input_channels_ == 2 && num_proc_channels_ == 1) && !input_buffer_) { 113 const bool need_to_downmix =
114 num_input_channels_ > 1 && num_proc_channels_ == 1;
115 if (need_to_downmix && !input_buffer_) {
141 input_buffer_.reset( 116 input_buffer_.reset(
142 new IFChannelBuffer(input_num_frames_, num_proc_channels_)); 117 new IFChannelBuffer(input_num_frames_, num_proc_channels_));
143 } 118 }
144 119
145 if (HasKeyboardChannel(layout)) { 120 if (stream_config.has_keyboard()) {
146 keyboard_data_ = data[KeyboardChannelIndex(layout)]; 121 keyboard_data_ = data[KeyboardChannelIndex(stream_config)];
147 } 122 }
148 123
149 // Downmix. 124 // Downmix.
150 const float* const* data_ptr = data; 125 const float* const* data_ptr = data;
151 if (num_input_channels_ == 2 && num_proc_channels_ == 1) { 126 if (need_to_downmix) {
152 StereoToMono(data[0], 127 DownmixToMono<float, float>(data, input_num_frames_, num_input_channels_,
153 data[1], 128 input_buffer_->fbuf()->channels()[0]);
154 input_buffer_->fbuf()->channels()[0],
155 input_num_frames_);
156 data_ptr = input_buffer_->fbuf_const()->channels(); 129 data_ptr = input_buffer_->fbuf_const()->channels();
157 } 130 }
158 131
159 // Resample. 132 // Resample.
160 if (input_num_frames_ != proc_num_frames_) { 133 if (input_num_frames_ != proc_num_frames_) {
161 for (int i = 0; i < num_proc_channels_; ++i) { 134 for (int i = 0; i < num_proc_channels_; ++i) {
162 input_resamplers_[i]->Resample(data_ptr[i], 135 input_resamplers_[i]->Resample(data_ptr[i],
163 input_num_frames_, 136 input_num_frames_,
164 process_buffer_->channels()[i], 137 process_buffer_->channels()[i],
165 proc_num_frames_); 138 proc_num_frames_);
166 } 139 }
167 data_ptr = process_buffer_->channels(); 140 data_ptr = process_buffer_->channels();
168 } 141 }
169 142
170 // Convert to the S16 range. 143 // Convert to the S16 range.
171 for (int i = 0; i < num_proc_channels_; ++i) { 144 for (int i = 0; i < num_proc_channels_; ++i) {
172 FloatToFloatS16(data_ptr[i], 145 FloatToFloatS16(data_ptr[i],
173 proc_num_frames_, 146 proc_num_frames_,
174 data_->fbuf()->channels()[i]); 147 data_->fbuf()->channels()[i]);
175 } 148 }
176 } 149 }
177 150
178 void AudioBuffer::CopyTo(int num_frames, 151 void AudioBuffer::CopyTo(const StreamConfig& stream_config,
179 AudioProcessing::ChannelLayout layout,
180 float* const* data) { 152 float* const* data) {
181 assert(num_frames == output_num_frames_); 153 assert(stream_config.num_frames() == output_num_frames_);
182 assert(ChannelsFromLayout(layout) == num_channels_); 154 assert(stream_config.num_channels() == num_channels_);
183 155
184 // Convert to the float range. 156 // Convert to the float range.
185 float* const* data_ptr = data; 157 float* const* data_ptr = data;
186 if (output_num_frames_ != proc_num_frames_) { 158 if (output_num_frames_ != proc_num_frames_) {
187 // Convert to an intermediate buffer for subsequent resampling. 159 // Convert to an intermediate buffer for subsequent resampling.
188 data_ptr = process_buffer_->channels(); 160 data_ptr = process_buffer_->channels();
189 } 161 }
190 for (int i = 0; i < num_channels_; ++i) { 162 for (int i = 0; i < num_channels_; ++i) {
191 FloatS16ToFloat(data_->fbuf()->channels()[i], 163 FloatS16ToFloat(data_->fbuf()->channels()[i],
192 proc_num_frames_, 164 proc_num_frames_,
(...skipping 127 matching lines...) Expand 10 before | Expand all | Expand 10 after
320 ChannelBuffer<float>* AudioBuffer::split_data_f() { 292 ChannelBuffer<float>* AudioBuffer::split_data_f() {
321 mixed_low_pass_valid_ = false; 293 mixed_low_pass_valid_ = false;
322 return split_data_.get() ? split_data_->fbuf() : data_->fbuf(); 294 return split_data_.get() ? split_data_->fbuf() : data_->fbuf();
323 } 295 }
324 296
325 const ChannelBuffer<float>* AudioBuffer::split_data_f() const { 297 const ChannelBuffer<float>* AudioBuffer::split_data_f() const {
326 return split_data_.get() ? split_data_->fbuf_const() : data_->fbuf_const(); 298 return split_data_.get() ? split_data_->fbuf_const() : data_->fbuf_const();
327 } 299 }
328 300
329 const int16_t* AudioBuffer::mixed_low_pass_data() { 301 const int16_t* AudioBuffer::mixed_low_pass_data() {
330 // Currently only mixing stereo to mono is supported.
331 assert(num_proc_channels_ == 1 || num_proc_channels_ == 2);
332
333 if (num_proc_channels_ == 1) { 302 if (num_proc_channels_ == 1) {
334 return split_bands_const(0)[kBand0To8kHz]; 303 return split_bands_const(0)[kBand0To8kHz];
335 } 304 }
336 305
337 if (!mixed_low_pass_valid_) { 306 if (!mixed_low_pass_valid_) {
338 if (!mixed_low_pass_channels_.get()) { 307 if (!mixed_low_pass_channels_.get()) {
339 mixed_low_pass_channels_.reset( 308 mixed_low_pass_channels_.reset(
340 new ChannelBuffer<int16_t>(num_split_frames_, 1)); 309 new ChannelBuffer<int16_t>(num_split_frames_, 1));
341 } 310 }
342 StereoToMono(split_bands_const(0)[kBand0To8kHz], 311
343 split_bands_const(1)[kBand0To8kHz], 312 DownmixToMono<int16_t, int32_t>(split_channels_const(kBand0To8kHz),
344 mixed_low_pass_channels_->channels()[0], 313 num_split_frames_, num_channels_,
345 num_split_frames_); 314 mixed_low_pass_channels_->channels()[0]);
346 mixed_low_pass_valid_ = true; 315 mixed_low_pass_valid_ = true;
347 } 316 }
348 return mixed_low_pass_channels_->channels()[0]; 317 return mixed_low_pass_channels_->channels()[0];
349 } 318 }
350 319
351 const int16_t* AudioBuffer::low_pass_reference(int channel) const { 320 const int16_t* AudioBuffer::low_pass_reference(int channel) const {
352 if (!reference_copied_) { 321 if (!reference_copied_) {
353 return NULL; 322 return NULL;
354 } 323 }
355 324
(...skipping 48 matching lines...) Expand 10 before | Expand all | Expand 10 after
404 new IFChannelBuffer(input_num_frames_, num_proc_channels_)); 373 new IFChannelBuffer(input_num_frames_, num_proc_channels_));
405 } 374 }
406 activity_ = frame->vad_activity_; 375 activity_ = frame->vad_activity_;
407 376
408 int16_t* const* deinterleaved; 377 int16_t* const* deinterleaved;
409 if (input_num_frames_ == proc_num_frames_) { 378 if (input_num_frames_ == proc_num_frames_) {
410 deinterleaved = data_->ibuf()->channels(); 379 deinterleaved = data_->ibuf()->channels();
411 } else { 380 } else {
412 deinterleaved = input_buffer_->ibuf()->channels(); 381 deinterleaved = input_buffer_->ibuf()->channels();
413 } 382 }
414 if (num_input_channels_ == 2 && num_proc_channels_ == 1) { 383 if (num_proc_channels_ == 1) {
415 // Downmix directly; no explicit deinterleaving needed. 384 // Downmix and deinterleave simultaneously.
416 for (int i = 0; i < input_num_frames_; ++i) { 385 DownmixInterleavedToMono(frame->data_, input_num_frames_,
417 deinterleaved[0][i] = (frame->data_[i * 2] + frame->data_[i * 2 + 1]) / 2; 386 num_input_channels_, deinterleaved[0]);
418 }
419 } else { 387 } else {
420 assert(num_proc_channels_ == num_input_channels_); 388 assert(num_proc_channels_ == num_input_channels_);
421 Deinterleave(frame->data_, 389 Deinterleave(frame->data_,
422 input_num_frames_, 390 input_num_frames_,
423 num_proc_channels_, 391 num_proc_channels_,
424 deinterleaved); 392 deinterleaved);
425 } 393 }
426 394
427 // Resample. 395 // Resample.
428 if (input_num_frames_ != proc_num_frames_) { 396 if (input_num_frames_ != proc_num_frames_) {
(...skipping 41 matching lines...) Expand 10 before | Expand all | Expand 10 after
470 438
471 void AudioBuffer::SplitIntoFrequencyBands() { 439 void AudioBuffer::SplitIntoFrequencyBands() {
472 splitting_filter_->Analysis(data_.get(), split_data_.get()); 440 splitting_filter_->Analysis(data_.get(), split_data_.get());
473 } 441 }
474 442
475 void AudioBuffer::MergeFrequencyBands() { 443 void AudioBuffer::MergeFrequencyBands() {
476 splitting_filter_->Synthesis(split_data_.get(), data_.get()); 444 splitting_filter_->Synthesis(split_data_.get(), data_.get());
477 } 445 }
478 446
479 } // namespace webrtc 447 } // namespace webrtc
OLDNEW
« no previous file with comments | « webrtc/modules/audio_processing/audio_buffer.h ('k') | webrtc/modules/audio_processing/audio_processing_impl.h » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698