OLD | NEW |
---|---|
1 /* | 1 /* |
2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. | 2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
(...skipping 104 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
115 | 115 |
116 // Use to enable 48kHz support in audio processing. Must be provided through the | 116 // Use to enable 48kHz support in audio processing. Must be provided through the |
117 // constructor. It will have no impact if used with | 117 // constructor. It will have no impact if used with |
118 // AudioProcessing::SetExtraOptions(). | 118 // AudioProcessing::SetExtraOptions(). |
119 struct AudioProcessing48kHzSupport { | 119 struct AudioProcessing48kHzSupport { |
120 AudioProcessing48kHzSupport() : enabled(true) {} | 120 AudioProcessing48kHzSupport() : enabled(true) {} |
121 explicit AudioProcessing48kHzSupport(bool enabled) : enabled(enabled) {} | 121 explicit AudioProcessing48kHzSupport(bool enabled) : enabled(enabled) {} |
122 bool enabled; | 122 bool enabled; |
123 }; | 123 }; |
124 | 124 |
125 // Use to enable intelligibility enhancer in audio processing. Must be provided | |
126 // through the constructor. It will have no impact if used with | |
127 // AudioProcessing::SetExtraOptions(). | |
128 // | |
129 // Note: If enabled and the reverse stream has more than one output channel, | |
130 // the reverse stream will become an upmixed mono signal. | |
131 struct Intelligibility { | |
132 Intelligibility() : enabled(false) {} | |
133 explicit Intelligibility(bool enabled) : enabled(enabled) {} | |
134 bool enabled; | |
135 }; | |
136 | |
125 static const int kAudioProcMaxNativeSampleRateHz = 32000; | 137 static const int kAudioProcMaxNativeSampleRateHz = 32000; |
126 | 138 |
127 // The Audio Processing Module (APM) provides a collection of voice processing | 139 // The Audio Processing Module (APM) provides a collection of voice processing |
128 // components designed for real-time communications software. | 140 // components designed for real-time communications software. |
129 // | 141 // |
130 // APM operates on two audio streams on a frame-by-frame basis. Frames of the | 142 // APM operates on two audio streams on a frame-by-frame basis. Frames of the |
131 // primary stream, on which all processing is applied, are passed to | 143 // primary stream, on which all processing is applied, are passed to |
132 // |ProcessStream()|. Frames of the reverse direction stream, which are used for | 144 // |ProcessStream()|. Frames of the reverse direction stream, which are used for |
133 // analysis by some components, are passed to |AnalyzeReverseStream()|. On the | 145 // analysis by some components, are passed to |AnalyzeReverseStream()|. On the |
134 // client-side, this will typically be the near-end (capture) and far-end | 146 // client-side, this will typically be the near-end (capture) and far-end |
(...skipping 175 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
310 // reverse stream forms the echo reference signal. It is recommended, but not | 322 // reverse stream forms the echo reference signal. It is recommended, but not |
311 // necessary, to provide if gain control is enabled. On the server-side this | 323 // necessary, to provide if gain control is enabled. On the server-side this |
312 // typically will not be used. If you're not sure what to pass in here, | 324 // typically will not be used. If you're not sure what to pass in here, |
313 // chances are you don't need to use it. | 325 // chances are you don't need to use it. |
314 // | 326 // |
315 // The |sample_rate_hz_|, |num_channels_|, and |samples_per_channel_| | 327 // The |sample_rate_hz_|, |num_channels_|, and |samples_per_channel_| |
316 // members of |frame| must be valid. |sample_rate_hz_| must correspond to | 328 // members of |frame| must be valid. |sample_rate_hz_| must correspond to |
317 // |input_sample_rate_hz()| | 329 // |input_sample_rate_hz()| |
318 // | 330 // |
319 // TODO(ajm): add const to input; requires an implementation fix. | 331 // TODO(ajm): add const to input; requires an implementation fix. |
320 virtual int AnalyzeReverseStream(AudioFrame* frame) = 0; | 332 virtual int AnalyzeReverseStream(AudioFrame* frame) = 0; |
Andrew MacDonald
2015/07/29 03:52:27
Since we're now supporting this interface fully, y
ekm
2015/07/29 23:35:06
Done. Also added to the StreamConfig interface.
| |
321 | 333 |
322 // Accepts deinterleaved float audio with the range [-1, 1]. Each element | 334 // Accepts deinterleaved float audio with the range [-1, 1]. Each element |
323 // of |data| points to a channel buffer, arranged according to |layout|. | 335 // of |data| points to a channel buffer, arranged according to |layout|. |
336 // | |
337 // DEPRECATED: Use |ProcessReverseStream| instead. | |
338 // TODO(ekm): Remove once all users have updated to |ProcessReverseStream|. | |
324 virtual int AnalyzeReverseStream(const float* const* data, | 339 virtual int AnalyzeReverseStream(const float* const* data, |
325 int samples_per_channel, | 340 int samples_per_channel, |
326 int sample_rate_hz, | 341 int rev_sample_rate_hz, |
342 ChannelLayout layout) = 0; | |
343 | |
344 // Same as |AnalyzeReverseStream|, but may modify |data| if intelligibility | |
345 // is enabled. | |
346 virtual int ProcessReverseStream(float* const* data, | |
347 int samples_per_channel, | |
348 int rev_sample_rate_hz, | |
327 ChannelLayout layout) = 0; | 349 ChannelLayout layout) = 0; |
328 | 350 |
329 // This must be called if and only if echo processing is enabled. | 351 // This must be called if and only if echo processing is enabled. |
330 // | 352 // |
331 // Sets the |delay| in ms between AnalyzeReverseStream() receiving a far-end | 353 // Sets the |delay| in ms between AnalyzeReverseStream() receiving a far-end |
332 // frame and ProcessStream() receiving a near-end frame containing the | 354 // frame and ProcessStream() receiving a near-end frame containing the |
333 // corresponding echo. On the client-side this can be expressed as | 355 // corresponding echo. On the client-side this can be expressed as |
334 // delay = (t_render - t_analyze) + (t_process - t_capture) | 356 // delay = (t_render - t_analyze) + (t_process - t_capture) |
335 // where, | 357 // where, |
336 // - t_analyze is the time a frame is passed to AnalyzeReverseStream() and | 358 // - t_analyze is the time a frame is passed to AnalyzeReverseStream() and |
(...skipping 450 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
787 // This does not impact the size of frames passed to |ProcessStream()|. | 809 // This does not impact the size of frames passed to |ProcessStream()|. |
788 virtual int set_frame_size_ms(int size) = 0; | 810 virtual int set_frame_size_ms(int size) = 0; |
789 virtual int frame_size_ms() const = 0; | 811 virtual int frame_size_ms() const = 0; |
790 | 812 |
791 protected: | 813 protected: |
792 virtual ~VoiceDetection() {} | 814 virtual ~VoiceDetection() {} |
793 }; | 815 }; |
794 } // namespace webrtc | 816 } // namespace webrtc |
795 | 817 |
796 #endif // WEBRTC_MODULES_AUDIO_PROCESSING_INCLUDE_AUDIO_PROCESSING_H_ | 818 #endif // WEBRTC_MODULES_AUDIO_PROCESSING_INCLUDE_AUDIO_PROCESSING_H_ |
OLD | NEW |