webrtc/modules/audio_processing/aec3/echo_canceller3.cc - Issue 2584493002: Added first layer of the echo canceller 3 functionality

Side by Side Diff: webrtc/modules/audio_processing/aec3/echo_canceller3.cc

Issue 2584493002: Added first layer of the echo canceller 3 functionality (Closed)

Patch Set: Restricted the AnalyzeRender access, added ability to add external reporting of echo failure, and o… Created 4 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

« webrtc/modules/audio_processing/aec3/echo_canceller3.h ('K') | « webrtc/modules/audio_processing/aec3/echo_canceller3.h ('k') | webrtc/modules/audio_processing/aec3/frame_blocker.h » ('j') | webrtc/modules/audio_processing/aec3/frame_blocker.h » ('J')
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

OLD	NEW
1 /*	1 /*

2 * Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.	2 * Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.

3 *	3 *

4 * Use of this source code is governed by a BSD-style license	4 * Use of this source code is governed by a BSD-style license

5 * that can be found in the LICENSE file in the root of the source	5 * that can be found in the LICENSE file in the root of the source

6 * tree. An additional intellectual property rights grant can be found	6 * tree. An additional intellectual property rights grant can be found

7 * in the file PATENTS. All contributing project authors may	7 * in the file PATENTS. All contributing project authors may

8 * be found in the AUTHORS file in the root of the source tree.	8 * be found in the AUTHORS file in the root of the source tree.

9 */	9 */

10 #include "webrtc/modules/audio_processing/aec3/echo_canceller3.h"	10 #include "webrtc/modules/audio_processing/aec3/echo_canceller3.h"

11	11

12 #include "webrtc/base/atomicops.h"	12 #include "webrtc/base/atomicops.h"

13 #include "webrtc/system_wrappers/include/logging.h"	13 #include "webrtc/modules/audio_processing/logging/apm_data_dumper.h"

14	14

15 namespace webrtc {	15 namespace webrtc {

16	16

17 int EchoCanceller3::instance_count_ = 0;	17 namespace {

18	18

19 EchoCanceller3::EchoCanceller3(int sample_rate_hz, bool use_anti_hum_filter) {	19 bool DetectSaturation(rtc::ArrayView<const float> y) {

20 int band_sample_rate_hz = (sample_rate_hz == 8000 ? sample_rate_hz : 16000);	20 for (auto y_k : y) {

21 frame_length_ = rtc::CheckedDivExact(band_sample_rate_hz, 100);	21 if (y_k > 32767.0f \|\| y_k < -32768.0f) {
	ivoc 2016/12/19 11:30:22 How about if the signals are equal to the limits? How about if the signals are equal to the limits? peah-webrtc 2016/12/20 10:10:25 Good find! Done. Show quoted text On 2016/12/19 11:30:22, ivoc wrote: > How about if the signals are equal to the limits? Good find! Done.
22	22 return true;

23 LOG(LS_INFO) << "AEC3 created : "	23 }

24 << "{ instance_count: " << instance_count_ << "}";	24 }

25 instance_count_ = rtc::AtomicOps::Increment(&instance_count_);	25 return false;

26 }	26 }

27	27

28 EchoCanceller3::~EchoCanceller3() = default;	28 void ProcessCaptureFrameContent(AudioBuffer* capture,

29	29 bool known_echo_path_change,

30 bool EchoCanceller3::AnalyzeRender(AudioBuffer* render) {	30 bool saturated_microphone_signal,

	31 size_t subframe_index,

	32 FrameBlocker* capture_blocker,

	33 BlockFramer* output_framer,

	34 BlockProcessor* block_processor) {

	35 float capture_block[kMaxNumBands * kBlockSize];

	36 capture_blocker->InsertFrameAndExtractBlock(

	37 subframe_index, capture->split_bands_f(0), capture_block);

	38 block_processor->ProcessCapture(known_echo_path_change,

	39 saturated_microphone_signal, capture_block);

	40 output_framer->InsertBlock(capture_block);

	41 output_framer->ExtractFrame(subframe_index, capture->split_bands_f(0));

	42 }

	43

	44 void ProcessRemainingCaptureFrameContent(bool known_echo_path_change,

	45 bool saturated_microphone_signal,

	46 FrameBlocker* capture_blocker,

	47 BlockFramer* output_framer,

	48 BlockProcessor* block_processor) {

	49 if (capture_blocker->IsBlockAvailable()) {
	hlundin-webrtc 2016/12/16 10:04:47 Nit: I prefer early return. if (!capture_blocker-> Nit: I prefer early return. if (!capture_blocker->IsBlockAvailable()) { return; } ... peah-webrtc 2016/12/20 10:10:25 Done. Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > Nit: I prefer early return. > if (!capture_blocker->IsBlockAvailable()) { > return; > } > ... Done.
	50 float capture_block[kMaxNumBands * kBlockSize];

	51 capture_blocker->ExtractBlockIfAvailable(capture_block);
	hlundin-webrtc 2016/12/16 10:04:47 ...IfAvailable? I thought we established that it w ...IfAvailable? I thought we established that it was available. peah-webrtc 2016/12/20 10:10:25 True, I changed the implementation of FrameBlocker Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > ...IfAvailable? I thought we established that it was available. True, I changed the implementation of FrameBlocker accordingly. Done.
	52 block_processor->ProcessCapture(known_echo_path_change,

	53 saturated_microphone_signal, capture_block);

	54 output_framer->InsertBlock(capture_block);

	55 }

	56 }

	57

	58 bool BufferRenderFrameContent(rtc::ArrayView<const float> render_frame,

	59 size_t subframe_index,

	60 FrameBlocker* render_blocker,

	61 BlockProcessor* block_processor) {

	62 return block_processor->BufferRender(

	63 [render_blocker, render_frame,

	64 subframe_index](rtc::ArrayView<float> block) mutable {

	65 render_blocker->InsertFrameAndExtractBlock(subframe_index, render_frame,

	66 block);

	67 });
	ivoc 2016/12/19 11:30:22 Can you explain what this is supposed to do? The w Can you explain what this is supposed to do? The way the code looks now doesn't make much sense to me. For example, this lambda is passed to the block processor (why?), and is never executed there. I guess some steps will be added later? peah-webrtc 2016/12/20 10:10:25 Yes, the reason for this construct is to provide a Show quoted text On 2016/12/19 11:30:22, ivoc wrote: > Can you explain what this is supposed to do? The way the code looks now doesn't > make much sense to me. For example, this lambda is passed to the block processor > (why?), and is never executed there. I guess some steps will be added later? Yes, the reason for this construct is to provide a cheap way of producing a render block from a frame and passing it to the BufferRender method. The reason for why it is not used in the block_processor is that that functionality is to be added in the next CL. However, with the code changes in the new patch, this lambda is no longer used and I instead use the vector-swap functionality for efficiently passing the blocks. PTAL ivoc 2016/12/21 13:04:04 It looks easier to understand now. Show quoted text On 2016/12/20 10:10:25, peah-webrtc wrote: > On 2016/12/19 11:30:22, ivoc wrote: > > Can you explain what this is supposed to do? The way the code looks now > doesn't > > make much sense to me. For example, this lambda is passed to the block > processor > > (why?), and is never executed there. I guess some steps will be added later? > > Yes, the reason for this construct is to provide a cheap way of producing a > render block from a frame and passing it to the BufferRender method. The reason > for why it is not used in the block_processor is that that functionality is to > be added in the next CL. > > However, with the code changes in the new patch, this lambda is no longer used > and I instead use the vector-swap functionality for efficiently passing the > blocks. > > PTAL It looks easier to understand now. peah-webrtc 2016/12/21 23:13:48 Acknowledged. Show quoted text On 2016/12/21 13:04:04, ivoc wrote: > On 2016/12/20 10:10:25, peah-webrtc wrote: > > On 2016/12/19 11:30:22, ivoc wrote: > > > Can you explain what this is supposed to do? The way the code looks now > > doesn't > > > make much sense to me. For example, this lambda is passed to the block > > processor > > > (why?), and is never executed there. I guess some steps will be added later? > > > > Yes, the reason for this construct is to provide a cheap way of producing a > > render block from a frame and passing it to the BufferRender method. The > reason > > for why it is not used in the block_processor is that that functionality is to > > be added in the next CL. > > > > However, with the code changes in the new patch, this lambda is no longer used > > and I instead use the vector-swap functionality for efficiently passing the > > blocks. > > > > PTAL > > It looks easier to understand now. Acknowledged.
	68 }

	69

	70 bool BufferRemainingRenderFrameContent(FrameBlocker* render_blocker,

	71 BlockProcessor* block_processor) {

	72 if (render_blocker->IsBlockAvailable()) {

	73 return block_processor->BufferRender(

	74 [render_blocker](rtc::ArrayView<float> block) mutable {

	75 render_blocker->ExtractBlockIfAvailable(block);

	76 });

	77 }

	78 return false;

	79 }

	80

	81 void CopyAudioBufferIntoFrame(AudioBuffer* buffer,
	hlundin-webrtc 2016/12/16 10:04:47 I assume this cannot be made a const argument beca I assume this cannot be made a const argument because of magic happening inside the buffer. peah-webrtc 2016/12/20 10:10:25 Afaics, that is the case. Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > I assume this cannot be made a const argument because of magic happening inside > the buffer. Afaics, that is the case.
	82 size_t num_bands,

	83 size_t frame_length,

	84 rtc::ArrayView<float> frame) {

	85 RTC_DCHECK_EQ(num_bands * frame_length, frame.size());

	86 for (size_t i = 0; i < num_bands; ++i) {

	87 rtc::ArrayView<float> buffer_view(&buffer->split_bands_f(0)[i][0],

	88 frame_length);

	89 std::copy(buffer_view.begin(), buffer_view.end(),

	90 frame.begin() + i * frame_length);

	91 }

	92 }

	93

	94 // [B,A] = butter(2,100/4000,'high')

	95 const CascadedBiQuadFilter::BiQuadCoefficients

	96 kHighPassFilterCoefficients_8kHz = {

	97 {0.945976856002790, -1.891953712005580, 0.945976856002790},

	98 {-1.889033079394525, 0.894874344616636}};

	99 const int kNumberOfHighPassBiQuads_8kHz = 1;

	100

	101 // [B,A] = butter(2,100/8000,'high')

	102 const CascadedBiQuadFilter::BiQuadCoefficients

	103 kHighPassFilterCoefficients_16kHz = {

	104 {0.972613898499844, -1.945227796999688, 0.972613898499844},

	105 {-1.944477657767094, 0.945977936232282}};

	106 const int kNumberOfHighPassBiQuads_16kHz = 1;

	107

	108 } // namespace

	109

	110 EchoCanceller3::RenderWriterState::RenderWriterState(

	111 ApmDataDumper* data_dumper,

	112 RenderTransferBufferWriter* transfer_buffer_writer,

	113 std::unique_ptr<CascadedBiQuadFilter> render_highpass_filter,

	114 int sample_rate_hz,

	115 int frame_length,

	116 int num_bands)

	117 : data_dumper_(data_dumper),
	hlundin-webrtc 2016/12/16 10:04:47 Is nullptr valid? Otherwise, add a DCHECK. Is nullptr valid? Otherwise, add a DCHECK. peah-webrtc 2016/12/20 10:10:25 Done. Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > Is nullptr valid? Otherwise, add a DCHECK. Done.
	118 sample_rate_hz_(sample_rate_hz),

	119 frame_length_(frame_length),

	120 num_bands_(num_bands),

	121 transfer_buffer_writer_(transfer_buffer_writer),

	122 render_highpass_filter_(std::move(render_highpass_filter)),

	123 render_queue_input_frame_(num_bands_ * frame_length_, 0.f) {}

	124

	125 EchoCanceller3::RenderWriterState::~RenderWriterState() = default;

	126

	127 bool EchoCanceller3::RenderWriterState::Insert(AudioBuffer* render) {
	hlundin-webrtc 2016/12/16 10:04:46 "render" is a dubious name here. I think "input" w "render" is a dubious name here. I think "input" would me more descriptive. peah-webrtc 2016/12/20 10:10:25 Done. Show quoted text On 2016/12/16 10:04:46, hlundin-webrtc wrote: > "render" is a dubious name here. I think "input" would me more descriptive. Done.
31 RTC_DCHECK_EQ(1u, render->num_channels());	128 RTC_DCHECK_EQ(1u, render->num_channels());
	hlundin-webrtc 2016/12/16 10:04:47 Nit: I think you no longer need the 'u' suffix, as Nit: I think you no longer need the 'u' suffix, as a result of https://codereview.webrtc.org/2535593002. peah-webrtc 2016/12/20 10:10:25 Done. Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > Nit: I think you no longer need the 'u' suffix, as a result of > https://codereview.webrtc.org/2535593002. Done.
32 RTC_DCHECK_EQ(frame_length_, render->num_frames_per_band());	129 RTC_DCHECK_EQ(frame_length_, render->num_frames_per_band());

33 return true;	130 data_dumper_->DumpWav("aec3_render_input", frame_length_,

34 }	131 &render->split_bands_f(0)[0][0],

35	132 LowestBandRate(sample_rate_hz_), 1);

36 void EchoCanceller3::AnalyzeCapture(AudioBuffer* capture) {}	133

	134 CopyAudioBufferIntoFrame(render, num_bands_, frame_length_,

	135 render_queue_input_frame_);

	136

	137 if (render_highpass_filter_) {

	138 render_highpass_filter_->Process(

	139 rtc::ArrayView<float>(&render_queue_input_frame_[0], frame_length_));

	140 }

	141

	142 return transfer_buffer_writer_->Insert(&render_queue_input_frame_);

	143 }

	144

	145 int EchoCanceller3::instance_count_ = 0;

	146

	147 EchoCanceller3::EchoCanceller3(int sample_rate_hz, bool use_highpass_filter)

	148 : data_dumper_(new ApmDataDumper(instance_count_)),

	149 sample_rate_hz_(sample_rate_hz),

	150 num_bands_(sample_rate_hz_ == 8000 ? 1 : sample_rate_hz / 16000),
	hlundin-webrtc 2016/12/16 10:04:47 You have this expression defined as NumBandsForRat You have this expression defined as NumBandsForRate(sample_rate_hz) in aec3_constants.h. peah-webrtc 2016/12/20 10:10:25 Done. Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > You have this expression defined as NumBandsForRate(sample_rate_hz) in > aec3_constants.h. Done.
	151 frame_length_(rtc::CheckedDivExact(LowestBandRate(sample_rate_hz_), 100)),

	152 output_framer_(num_bands_, frame_length_),

	153 capture_blocker_(num_bands_, frame_length_),

	154 render_blocker_(num_bands_, frame_length_),

	155 render_transfer_buffer_(num_bands_, frame_length_),

	156 block_processor_(data_dumper_.get(), sample_rate_hz, num_bands_),

	157 render_queue_output_frame_(num_bands_ * frame_length_, 0.f) {

	158 std::unique_ptr<CascadedBiQuadFilter> render_highpass_filter;

	159 if (use_highpass_filter) {

	160 render_highpass_filter.reset(new CascadedBiQuadFilter(

	161 sample_rate_hz_ == 8000 ? kHighPassFilterCoefficients_8kHz

	162 : kHighPassFilterCoefficients_16kHz,

	163 sample_rate_hz_ == 8000 ? kNumberOfHighPassBiQuads_8kHz

	164 : kNumberOfHighPassBiQuads_16kHz));

	165 capture_highpass_filter_.reset(new CascadedBiQuadFilter(

	166 sample_rate_hz_ == 8000 ? kHighPassFilterCoefficients_8kHz

	167 : kHighPassFilterCoefficients_16kHz,

	168 sample_rate_hz_ == 8000 ? kNumberOfHighPassBiQuads_8kHz

	169 : kNumberOfHighPassBiQuads_16kHz));

	170 }

	171

	172 render_writer_.reset(

	173 new RenderWriterState(data_dumper_.get(), &render_transfer_buffer_,

	174 std::move(render_highpass_filter), sample_rate_hz_,
	hlundin-webrtc 2016/12/16 10:04:47 What happens when you move from an (explicitly) un What happens when you move from an (explicitly) uninitialized unique_ptr? Are you sure you get a nullptr as expected? From http://en.cppreference.com/w/cpp/memory/unique_ptr/unique_ptr, it seems that the default ctor value-initializes the pointer, which I assume sets it to nullptr. peah-webrtc 2016/12/20 10:10:25 Good point! I cannot find whether it actually init Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > What happens when you move from an (explicitly) uninitialized unique_ptr? Are > you sure you get a nullptr as expected? From > http://en.cppreference.com/w/cpp/memory/unique_ptr/unique_ptr, it seems that the > default ctor value-initializes the pointer, which I assume sets it to nullptr. Good point! I cannot find whether it actually initializes it to null though. I added that specifically. PTAL
	175 frame_length_, num_bands_));

	176

	177 RTC_DCHECK_EQ(num_bands_, std::max(sample_rate_hz_, 16000) / 16000);

	178 RTC_DCHECK_GE(kMaxNumBands, num_bands_);

	179 instance_count_ = rtc::AtomicOps::Increment(&instance_count_);

	180 }

	181

	182 EchoCanceller3::~EchoCanceller3() = default;

	183

	184 bool EchoCanceller3::AnalyzeRender(AudioBuffer* render) {

	185 return render_writer_->Insert(render);

	186 }

	187

	188 bool EchoCanceller3::EmptyRenderQueue() {
	hlundin-webrtc 2016/12/16 10:04:47 Check the order of the methods in this file, and m Check the order of the methods in this file, and make sure it is the same as in the h-file. peah-webrtc 2016/12/20 10:10:25 Done. Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > Check the order of the methods in this file, and make sure it is the same as in > the h-file. Done.
	189 bool render_buffer_overrun = false;

	190 bool frame_to_buffer =

	191 render_transfer_buffer_.Remove(&render_queue_output_frame_);

	192 while (frame_to_buffer) {

	193 render_buffer_overrun \|= BufferRenderFrameContent(

	194 render_queue_output_frame_, 0, &render_blocker_, &block_processor_);

	195

	196 if (sample_rate_hz_ != 8000) {

	197 render_buffer_overrun \|= BufferRenderFrameContent(

	198 render_queue_output_frame_, 1, &render_blocker_, &block_processor_);

	199 }

	200

	201 render_buffer_overrun \|=

	202 BufferRemainingRenderFrameContent(&render_blocker_, &block_processor_);

	203

	204 frame_to_buffer =

	205 render_transfer_buffer_.Remove(&render_queue_output_frame_);

	206 }

	207 return render_buffer_overrun;

	208 }

	209

	210 void EchoCanceller3::AnalyzeCapture(AudioBuffer* capture) {

	211 data_dumper_->DumpWav("aec3_capture_analyze_input", frame_length_,

	212 capture->channels_f()[0], sample_rate_hz_, 1);

	213

	214 saturated_microphone_signal_ = false;
	hlundin-webrtc 2016/12/16 10:04:47 You reset saturated_microphone_signal_ both here a You reset saturated_microphone_signal_ both here and at the end of ProcessCapture. Is this intentional? peah-webrtc 2016/12/20 10:10:25 Done. Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > You reset saturated_microphone_signal_ both here and at the end of > ProcessCapture. Is this intentional? Done.
	215 for (size_t k = 0; k < capture->num_channels(); ++k) {

	216 saturated_microphone_signal_ \|=
	hlundin-webrtc 2016/12/16 10:04:47 I assume you will expand the work of this for loop I assume you will expand the work of this for loop later one. Otherwise, you can do early return on finding the first saturation. for () { if (DetectSaturation(blah) { saturated_microphone_signal_ = true; return; } } peah-webrtc 2016/12/20 10:10:25 There will be no more work on this loop. I added e Show quoted text On 2016/12/16 10:04:47, hlundin-webrtc wrote: > I assume you will expand the work of this for loop later one. Otherwise, you can > do early return on finding the first saturation. > for () { > if (DetectSaturation(blah) { > saturated_microphone_signal_ = true; > return; > } > } There will be no more work on this loop. I added early return. Done.
	217 DetectSaturation(rtc::ArrayView<const float>(capture->channels_f()[k],

	218 capture->num_frames()));

	219 }

	220 }

37	221

38 void EchoCanceller3::ProcessCapture(AudioBuffer* capture,	222 void EchoCanceller3::ProcessCapture(AudioBuffer* capture,

39 bool known_echo_path_change) {	223 bool known_echo_path_change) {

40 RTC_DCHECK_EQ(1u, capture->num_channels());	224 RTC_DCHECK_EQ(1u, capture->num_channels());

41 RTC_DCHECK_EQ(frame_length_, capture->num_frames_per_band());	225 RTC_DCHECK_EQ(frame_length_, capture->num_frames_per_band());

	226

	227 rtc::ArrayView<float> capture_lower_band =

	228 rtc::ArrayView<float>(&capture->split_bands_f(0)[0][0], frame_length_);

	229

	230 data_dumper_->DumpWav("aec3_capture_input", capture_lower_band,

	231 LowestBandRate(sample_rate_hz_), 1);

	232

	233 bool render_buffer_overrun = EmptyRenderQueue();

	234 RTC_DCHECK(!render_buffer_overrun);

	235

	236 if (capture_highpass_filter_) {

	237 capture_highpass_filter_->Process(capture_lower_band);

	238 }

	239

	240 ProcessCaptureFrameContent(capture, known_echo_path_change,

	241 saturated_microphone_signal_, 0, &capture_blocker_,

	242 &output_framer_, &block_processor_);

	243

	244 if (sample_rate_hz_ != 8000) {

	245 ProcessCaptureFrameContent(

	246 capture, known_echo_path_change, saturated_microphone_signal_, 1,

	247 &capture_blocker_, &output_framer_, &block_processor_);

	248 }

	249

	250 ProcessRemainingCaptureFrameContent(

	251 known_echo_path_change, saturated_microphone_signal_, &capture_blocker_,

	252 &output_framer_, &block_processor_);

	253

	254 data_dumper_->DumpWav("aec3_capture_output", frame_length_,

	255 &capture->split_bands_f(0)[0][0],

	256 LowestBandRate(sample_rate_hz_), 1);

	257

	258 saturated_microphone_signal_ = false;

42 }	259 }

43	260

44 std::string EchoCanceller3::ToString(	261 std::string EchoCanceller3::ToString(

45 const AudioProcessing::Config::EchoCanceller3& config) {	262 const AudioProcessing::Config::EchoCanceller3& config) {

46 std::stringstream ss;	263 std::stringstream ss;

47 ss << "{"	264 ss << "{"

48 << "enabled: " << (config.enabled ? "true" : "false") << "}";	265 << "enabled: " << (config.enabled ? "true" : "false") << "}";

49 return ss.str();	266 return ss.str();

50 }	267 }

51	268

52 bool EchoCanceller3::Validate(	269 bool EchoCanceller3::Validate(

53 const AudioProcessing::Config::EchoCanceller3& config) {	270 const AudioProcessing::Config::EchoCanceller3& config) {

54 return true;	271 return true;

55 }	272 }

56	273

57 } // namespace webrtc	274 } // namespace webrtc

OLD	NEW