webrtc/modules/audio_processing/include/audio_processing.h - Issue 1234463003: Integrate Intelligibility with APM

Unified Diff: webrtc/modules/audio_processing/include/audio_processing.h

Issue 1234463003: Integrate Intelligibility with APM (Closed) Base URL: https://chromium.googlesource.com/external/webrtc.git@master

Patch Set: Added support for distinct reverse input/output streams. Created 5 years, 5 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« webrtc/modules/audio_processing/audio_processing_impl.h ('K') | « webrtc/modules/audio_processing/audio_processing_impl.cc ('k') | webrtc/modules/audio_processing/include/mock_audio_processing.h » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: webrtc/modules/audio_processing/include/audio_processing.h

diff --git a/webrtc/modules/audio_processing/include/audio_processing.h b/webrtc/modules/audio_processing/include/audio_processing.h

index 085484466c3e3d1e1730b7d9c678224410ca44c5..74a9ff18853bc4ffb79952ab07e28816071663a9 100644

--- a/webrtc/modules/audio_processing/include/audio_processing.h

+++ b/webrtc/modules/audio_processing/include/audio_processing.h

@@ -116,6 +116,18 @@ struct Beamforming {

const std::vector<Point> array_geometry;

};

+// Use to enable intelligibility enhancer in audio processing. Must be provided

+// though the constructor. It will have no impact if used with

+// AudioProcessing::SetExtraOptions().

+//

+// Note: If enabled and the reverse stream has more than one output channel,

+// the reverse stream will become an upmixed mono signal.

+struct Intelligibility {

+ Intelligibility() : enabled(false) {}

+ explicit Intelligibility(bool enabled) : enabled(enabled) {}

+ bool enabled;

+};

static const int kAudioProcMaxNativeSampleRateHz = 32000;

// The Audio Processing Module (APM) provides a collection of voice processing

@@ -333,21 +345,28 @@ class AudioProcessing {

// |input_sample_rate_hz()|

// TODO(ajm): add const to input; requires an implementation fix.

+ // DEPRECATED: Use |ProcessReverseStream| instead.

+ // TODO(ekm): Remove once all users have updated to |ProcessReverseStream|.

virtual int AnalyzeReverseStream(AudioFrame* frame) = 0;

+ // Same as |AnalyzeReverseStream|, but may modify |data| if intelligibility

Andrew MacDonald 2015/07/30 18:48:53 modify |frame|

ekm 2015/07/30 22:38:44 Done.

+ // is enabled.

+ virtual int ProcessReverseStream(AudioFrame* frame) = 0;

// Accepts deinterleaved float audio with the range [-1, 1]. Each element

// of |data| points to a channel buffer, arranged according to |layout|.

- //

// TODO(mgraczyk): Remove once clients are updated to use the new interface.

virtual int AnalyzeReverseStream(const float* const* data,

int samples_per_channel,

- int sample_rate_hz,

+ int rev_sample_rate_hz,

ChannelLayout layout) = 0;

// Accepts deinterleaved float audio with the range [-1, 1]. Each element of

// |data| points to a channel buffer, arranged according to |reverse_config|.

- virtual int AnalyzeReverseStream(const float* const* data,

- const StreamConfig& reverse_config) = 0;

+ virtual int ProcessReverseStream(const float* const* src,

+ const StreamConfig& reverse_input_config,

+ const StreamConfig& reverse_output_config,

Andrew MacDonald 2015/07/30 18:48:53 I'm not sure we want to do this. The way you have

aluebs-webrtc 2015/07/30 18:56:34 You bring a good point here. I think it makes sens

ekm 2015/07/30 21:23:50 Are we talking about converting reverse to capture

aluebs-webrtc 2015/07/30 23:09:51 I would prefer to avoid adding yet another interfa

ekm 2015/07/30 23:20:17 Ok. Why are the two configs in the ProcessStream i

aluebs-webrtc 2015/07/30 23:23:38 So that the APM knows what the user expects as out

+ float* const* dest) = 0;

// This must be called if and only if echo processing is enabled.

@@ -469,8 +488,8 @@ class StreamConfig {

// has_keyboard: True if the stream has a keyboard channel. When has_keyboard

// is true, the last channel in any corresponding list of

// channels is the keyboard channel.

- StreamConfig(int sample_rate_hz = 0,

- int num_channels = 0,

+ StreamConfig(int sample_rate_hz = 16000,

+ int num_channels = 1,

aluebs-webrtc 2015/07/30 15:28:07 I think this zero-initialization here is on purpos

Andrew MacDonald 2015/07/30 18:48:53 Agreed.

ekm 2015/07/30 22:38:44 That makes sense. I thought it'd be a nice way to

bool has_keyboard = false)

: sample_rate_hz_(sample_rate_hz),

num_channels_(num_channels),

@@ -517,7 +536,8 @@ class ProcessingConfig {

enum StreamName {

kInputStream,

kOutputStream,

- kReverseStream,

+ kReverseInputStream,

+ kReverseOutputStream,

kNumStreamNames,

};

@@ -527,13 +547,21 @@ class ProcessingConfig {

const StreamConfig& output_stream() const {

return streams[StreamName::kOutputStream];

}

- const StreamConfig& reverse_stream() const {

- return streams[StreamName::kReverseStream];

+ const StreamConfig& reverse_input_stream() const {

+ return streams[StreamName::kReverseInputStream];

+ }

+ const StreamConfig& reverse_output_stream() const {

+ return streams[StreamName::kReverseOutputStream];

}

StreamConfig& input_stream() { return streams[StreamName::kInputStream]; }

StreamConfig& output_stream() { return streams[StreamName::kOutputStream]; }

- StreamConfig& reverse_stream() { return streams[StreamName::kReverseStream]; }

+ StreamConfig& reverse_input_stream() {

+ return streams[StreamName::kReverseInputStream];

+ }

+ StreamConfig& reverse_output_stream() {

+ return streams[StreamName::kReverseOutputStream];

+ }

bool operator==(const ProcessingConfig& other) const {

for (int i = 0; i < StreamName::kNumStreamNames; ++i) {