OLD | NEW |
---|---|
1 /* | 1 /* |
2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. | 2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
11 #include "webrtc/modules/audio_coding/neteq/normal.h" | 11 #include "webrtc/modules/audio_coding/neteq/normal.h" |
12 | 12 |
13 #include <string.h> // memset, memcpy | 13 #include <string.h> // memset, memcpy |
14 | 14 |
15 #include <algorithm> // min | 15 #include <algorithm> // min |
16 | 16 |
17 #include "webrtc/base/checks.h" | |
17 #include "webrtc/common_audio/signal_processing/include/signal_processing_librar y.h" | 18 #include "webrtc/common_audio/signal_processing/include/signal_processing_librar y.h" |
18 #include "webrtc/modules/audio_coding/codecs/audio_decoder.h" | 19 #include "webrtc/modules/audio_coding/codecs/audio_decoder.h" |
19 #include "webrtc/modules/audio_coding/neteq/audio_multi_vector.h" | 20 #include "webrtc/modules/audio_coding/neteq/audio_multi_vector.h" |
20 #include "webrtc/modules/audio_coding/neteq/background_noise.h" | 21 #include "webrtc/modules/audio_coding/neteq/background_noise.h" |
21 #include "webrtc/modules/audio_coding/neteq/decoder_database.h" | 22 #include "webrtc/modules/audio_coding/neteq/decoder_database.h" |
22 #include "webrtc/modules/audio_coding/neteq/expand.h" | 23 #include "webrtc/modules/audio_coding/neteq/expand.h" |
23 | 24 |
24 namespace webrtc { | 25 namespace webrtc { |
25 | 26 |
26 int Normal::Process(const int16_t* input, | 27 int Normal::Process(const int16_t* input, |
27 size_t length, | 28 size_t length, |
28 Modes last_mode, | 29 Modes last_mode, |
29 int16_t* external_mute_factor_array, | 30 int16_t* external_mute_factor_array, |
30 AudioMultiVector* output) { | 31 AudioMultiVector* output) { |
31 if (length == 0) { | 32 if (length == 0) { |
32 // Nothing to process. | 33 // Nothing to process. |
33 output->Clear(); | 34 output->Clear(); |
34 return static_cast<int>(length); | 35 return static_cast<int>(length); |
35 } | 36 } |
36 | 37 |
37 assert(output->Empty()); | 38 RTC_DCHECK(output->Empty()); |
38 // Output should be empty at this point. | 39 // Output should be empty at this point. |
39 if (length % output->Channels() != 0) { | 40 if (length % output->Channels() != 0) { |
40 // The length does not match the number of channels. | 41 // The length does not match the number of channels. |
41 output->Clear(); | 42 output->Clear(); |
42 return 0; | 43 return 0; |
43 } | 44 } |
44 output->PushBackInterleaved(input, length); | 45 output->PushBackInterleaved(input, length); |
45 | 46 |
46 const int fs_mult = fs_hz_ / 8000; | 47 const int fs_mult = fs_hz_ / 8000; |
47 assert(fs_mult > 0); | 48 RTC_DCHECK_GT(fs_mult, 0); |
48 // fs_shift = log2(fs_mult), rounded down. | 49 // fs_shift = log2(fs_mult), rounded down. |
49 // Note that |fs_shift| is not "exact" for 48 kHz. | 50 // Note that |fs_shift| is not "exact" for 48 kHz. |
50 // TODO(hlundin): Investigate this further. | 51 // TODO(hlundin): Investigate this further. |
51 const int fs_shift = 30 - WebRtcSpl_NormW32(fs_mult); | 52 const int fs_shift = 30 - WebRtcSpl_NormW32(fs_mult); |
52 | 53 |
53 // Check if last RecOut call resulted in an Expand. If so, we have to take | 54 // Check if last RecOut call resulted in an Expand. If so, we have to take |
54 // care of some cross-fading and unmuting. | 55 // care of some cross-fading and unmuting. |
55 if (last_mode == kModeExpand) { | 56 if (last_mode == kModeExpand) { |
56 // Generate interpolation data using Expand. | 57 // Generate interpolation data using Expand. |
57 // First, set Expand parameters to appropriate values. | 58 // First, set Expand parameters to appropriate values. |
(...skipping 50 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
108 } | 109 } |
109 if (mute_factor > external_mute_factor_array[channel_ix]) { | 110 if (mute_factor > external_mute_factor_array[channel_ix]) { |
110 external_mute_factor_array[channel_ix] = | 111 external_mute_factor_array[channel_ix] = |
111 static_cast<int16_t>(std::min(mute_factor, 16384)); | 112 static_cast<int16_t>(std::min(mute_factor, 16384)); |
112 } | 113 } |
113 | 114 |
114 // If muted increase by 0.64 for every 20 ms (NB/WB 0.0040/0.0020 in Q14). | 115 // If muted increase by 0.64 for every 20 ms (NB/WB 0.0040/0.0020 in Q14). |
115 int increment = 64 / fs_mult; | 116 int increment = 64 / fs_mult; |
116 for (size_t i = 0; i < length_per_channel; i++) { | 117 for (size_t i = 0; i < length_per_channel; i++) { |
117 // Scale with mute factor. | 118 // Scale with mute factor. |
118 assert(channel_ix < output->Channels()); | 119 RTC_DCHECK_LT(channel_ix, output->Channels()); |
119 assert(i < output->Size()); | 120 RTC_DCHECK_LT(i, output->Size()); |
120 int32_t scaled_signal = (*output)[channel_ix][i] * | 121 int32_t scaled_signal = (*output)[channel_ix][i] * |
121 external_mute_factor_array[channel_ix]; | 122 external_mute_factor_array[channel_ix]; |
122 // Shift 14 with proper rounding. | 123 // Shift 14 with proper rounding. |
123 (*output)[channel_ix][i] = | 124 (*output)[channel_ix][i] = |
124 static_cast<int16_t>((scaled_signal + 8192) >> 14); | 125 static_cast<int16_t>((scaled_signal + 8192) >> 14); |
125 // Increase mute_factor towards 16384. | 126 // Increase mute_factor towards 16384. |
126 external_mute_factor_array[channel_ix] = static_cast<int16_t>(std::min( | 127 external_mute_factor_array[channel_ix] = static_cast<int16_t>(std::min( |
127 external_mute_factor_array[channel_ix] + increment, 16384)); | 128 external_mute_factor_array[channel_ix] + increment, 16384)); |
128 } | 129 } |
129 | 130 |
130 // Interpolate the expanded data into the new vector. | 131 // Interpolate the expanded data into the new vector. |
131 // (NB/WB/SWB32/SWB48 8/16/32/48 samples.) | 132 // (NB/WB/SWB32/SWB48 8/16/32/48 samples.) |
132 assert(fs_shift < 3); // Will always be 0, 1, or, 2. | 133 RTC_DCHECK_LT(fs_shift, 3); // Will always be 0, 1, or, 2. |
133 increment = 4 >> fs_shift; | 134 increment = 4 >> fs_shift; |
134 int fraction = increment; | 135 int fraction = increment; |
135 for (size_t i = 0; i < static_cast<size_t>(8 * fs_mult); i++) { | 136 // Don't interpolate over more samples than what is in output. When this |
137 // cap strikes, the interpolation will likely sound worse, but this is an | |
138 // emergency operation in response to unexpected input. | |
139 const size_t interp_len_samples = | |
140 std::min(static_cast<size_t>(8 * fs_mult), output->Size()); | |
kwiberg-webrtc
2016/11/14 14:36:33
Oooh, I just realized that it's possible to define
| |
141 for (size_t i = 0; i < interp_len_samples; ++i) { | |
136 // TODO(hlundin): Add 16 instead of 8 for correct rounding. Keeping 8 | 142 // TODO(hlundin): Add 16 instead of 8 for correct rounding. Keeping 8 |
137 // now for legacy bit-exactness. | 143 // now for legacy bit-exactness. |
138 assert(channel_ix < output->Channels()); | 144 RTC_DCHECK_LT(channel_ix, output->Channels()); |
139 assert(i < output->Size()); | 145 RTC_DCHECK_LT(i, output->Size()); |
140 (*output)[channel_ix][i] = | 146 (*output)[channel_ix][i] = |
141 static_cast<int16_t>((fraction * (*output)[channel_ix][i] + | 147 static_cast<int16_t>((fraction * (*output)[channel_ix][i] + |
142 (32 - fraction) * expanded[channel_ix][i] + 8) >> 5); | 148 (32 - fraction) * expanded[channel_ix][i] + 8) >> 5); |
143 fraction += increment; | 149 fraction += increment; |
144 } | 150 } |
145 } | 151 } |
146 } else if (last_mode == kModeRfc3389Cng) { | 152 } else if (last_mode == kModeRfc3389Cng) { |
147 assert(output->Channels() == 1); // Not adapted for multi-channel yet. | 153 RTC_DCHECK_EQ(output->Channels(), 1); // Not adapted for multi-channel yet. |
148 static const size_t kCngLength = 48; | 154 static const size_t kCngLength = 48; |
149 RTC_DCHECK_LE(static_cast<size_t>(8 * fs_mult), kCngLength); | 155 RTC_DCHECK_LE(static_cast<size_t>(8 * fs_mult), kCngLength); |
150 int16_t cng_output[kCngLength]; | 156 int16_t cng_output[kCngLength]; |
151 // Reset mute factor and start up fresh. | 157 // Reset mute factor and start up fresh. |
152 external_mute_factor_array[0] = 16384; | 158 external_mute_factor_array[0] = 16384; |
153 ComfortNoiseDecoder* cng_decoder = decoder_database_->GetActiveCngDecoder(); | 159 ComfortNoiseDecoder* cng_decoder = decoder_database_->GetActiveCngDecoder(); |
154 | 160 |
155 if (cng_decoder) { | 161 if (cng_decoder) { |
156 // Generate long enough for 48kHz. | 162 // Generate long enough for 48kHz. |
157 if (!cng_decoder->Generate(cng_output, 0)) { | 163 if (!cng_decoder->Generate(cng_output, 0)) { |
158 // Error returned; set return vector to all zeros. | 164 // Error returned; set return vector to all zeros. |
159 memset(cng_output, 0, sizeof(cng_output)); | 165 memset(cng_output, 0, sizeof(cng_output)); |
160 } | 166 } |
161 } else { | 167 } else { |
162 // If no CNG instance is defined, just copy from the decoded data. | 168 // If no CNG instance is defined, just copy from the decoded data. |
163 // (This will result in interpolating the decoded with itself.) | 169 // (This will result in interpolating the decoded with itself.) |
164 (*output)[0].CopyTo(fs_mult * 8, 0, cng_output); | 170 (*output)[0].CopyTo(fs_mult * 8, 0, cng_output); |
165 } | 171 } |
166 // Interpolate the CNG into the new vector. | 172 // Interpolate the CNG into the new vector. |
167 // (NB/WB/SWB32/SWB48 8/16/32/48 samples.) | 173 // (NB/WB/SWB32/SWB48 8/16/32/48 samples.) |
168 assert(fs_shift < 3); // Will always be 0, 1, or, 2. | 174 RTC_DCHECK_LT(fs_shift, 3); // Will always be 0, 1, or, 2. |
169 int16_t increment = 4 >> fs_shift; | 175 int16_t increment = 4 >> fs_shift; |
170 int16_t fraction = increment; | 176 int16_t fraction = increment; |
171 for (size_t i = 0; i < static_cast<size_t>(8 * fs_mult); i++) { | 177 for (size_t i = 0; i < static_cast<size_t>(8 * fs_mult); i++) { |
172 // TODO(hlundin): Add 16 instead of 8 for correct rounding. Keeping 8 now | 178 // TODO(hlundin): Add 16 instead of 8 for correct rounding. Keeping 8 now |
173 // for legacy bit-exactness. | 179 // for legacy bit-exactness. |
174 (*output)[0][i] = (fraction * (*output)[0][i] + | 180 (*output)[0][i] = (fraction * (*output)[0][i] + |
175 (32 - fraction) * cng_output[i] + 8) >> 5; | 181 (32 - fraction) * cng_output[i] + 8) >> 5; |
176 fraction += increment; | 182 fraction += increment; |
177 } | 183 } |
178 } else if (external_mute_factor_array[0] < 16384) { | 184 } else if (external_mute_factor_array[0] < 16384) { |
179 // Previous was neither of Expand, FadeToBGN or RFC3389_CNG, but we are | 185 // Previous was neither of Expand, FadeToBGN or RFC3389_CNG, but we are |
180 // still ramping up from previous muting. | 186 // still ramping up from previous muting. |
181 // If muted increase by 0.64 for every 20 ms (NB/WB 0.0040/0.0020 in Q14). | 187 // If muted increase by 0.64 for every 20 ms (NB/WB 0.0040/0.0020 in Q14). |
182 int increment = 64 / fs_mult; | 188 int increment = 64 / fs_mult; |
183 size_t length_per_channel = length / output->Channels(); | 189 size_t length_per_channel = length / output->Channels(); |
184 for (size_t i = 0; i < length_per_channel; i++) { | 190 for (size_t i = 0; i < length_per_channel; i++) { |
185 for (size_t channel_ix = 0; channel_ix < output->Channels(); | 191 for (size_t channel_ix = 0; channel_ix < output->Channels(); |
186 ++channel_ix) { | 192 ++channel_ix) { |
187 // Scale with mute factor. | 193 // Scale with mute factor. |
188 assert(channel_ix < output->Channels()); | 194 RTC_DCHECK_LT(channel_ix, output->Channels()); |
189 assert(i < output->Size()); | 195 RTC_DCHECK_LT(i, output->Size()); |
190 int32_t scaled_signal = (*output)[channel_ix][i] * | 196 int32_t scaled_signal = (*output)[channel_ix][i] * |
191 external_mute_factor_array[channel_ix]; | 197 external_mute_factor_array[channel_ix]; |
192 // Shift 14 with proper rounding. | 198 // Shift 14 with proper rounding. |
193 (*output)[channel_ix][i] = | 199 (*output)[channel_ix][i] = |
194 static_cast<int16_t>((scaled_signal + 8192) >> 14); | 200 static_cast<int16_t>((scaled_signal + 8192) >> 14); |
195 // Increase mute_factor towards 16384. | 201 // Increase mute_factor towards 16384. |
196 external_mute_factor_array[channel_ix] = static_cast<int16_t>(std::min( | 202 external_mute_factor_array[channel_ix] = static_cast<int16_t>(std::min( |
197 16384, external_mute_factor_array[channel_ix] + increment)); | 203 16384, external_mute_factor_array[channel_ix] + increment)); |
198 } | 204 } |
199 } | 205 } |
200 } | 206 } |
201 | 207 |
202 return static_cast<int>(length); | 208 return static_cast<int>(length); |
203 } | 209 } |
204 | 210 |
205 } // namespace webrtc | 211 } // namespace webrtc |
OLD | NEW |