| OLD | NEW | 
|---|
| 1 /* | 1 /* | 
| 2  *  Copyright (c) 2015 The WebRTC project authors. All Rights Reserved. | 2  *  Copyright (c) 2015 The WebRTC project authors. All Rights Reserved. | 
| 3  * | 3  * | 
| 4  *  Use of this source code is governed by a BSD-style license | 4  *  Use of this source code is governed by a BSD-style license | 
| 5  *  that can be found in the LICENSE file in the root of the source | 5  *  that can be found in the LICENSE file in the root of the source | 
| 6  *  tree. An additional intellectual property rights grant can be found | 6  *  tree. An additional intellectual property rights grant can be found | 
| 7  *  in the file PATENTS.  All contributing project authors may | 7  *  in the file PATENTS.  All contributing project authors may | 
| 8  *  be found in the AUTHORS file in the root of the source tree. | 8  *  be found in the AUTHORS file in the root of the source tree. | 
| 9  */ | 9  */ | 
| 10 | 10 | 
| 11 // |  | 
| 12 //  Unit tests for intelligibility enhancer. |  | 
| 13 // |  | 
| 14 |  | 
| 15 #include <math.h> | 11 #include <math.h> | 
| 16 #include <stdlib.h> | 12 #include <stdlib.h> | 
| 17 #include <algorithm> | 13 #include <algorithm> | 
| 18 #include <vector> | 14 #include <vector> | 
| 19 | 15 | 
| 20 #include "testing/gtest/include/gtest/gtest.h" | 16 #include "testing/gtest/include/gtest/gtest.h" | 
| 21 #include "webrtc/base/arraysize.h" | 17 #include "webrtc/base/arraysize.h" | 
| 22 #include "webrtc/base/scoped_ptr.h" | 18 #include "webrtc/base/scoped_ptr.h" | 
| 23 #include "webrtc/common_audio/signal_processing/include/signal_processing_librar
     y.h" | 19 #include "webrtc/common_audio/signal_processing/include/signal_processing_librar
     y.h" | 
| 24 #include "webrtc/modules/audio_processing/intelligibility/intelligibility_enhanc
     er.h" | 20 #include "webrtc/modules/audio_processing/intelligibility/intelligibility_enhanc
     er.h" | 
| 25 | 21 | 
| 26 namespace webrtc { | 22 namespace webrtc { | 
| 27 | 23 | 
| 28 namespace { | 24 namespace { | 
| 29 | 25 | 
| 30 // Target output for ERB create test. Generated with matlab. | 26 // Target output for ERB create test. Generated with matlab. | 
| 31 const float kTestCenterFreqs[] = { | 27 const float kTestCenterFreqs[] = { | 
| 32     13.169f, 26.965f, 41.423f, 56.577f, 72.461f, 89.113f, 106.57f, 124.88f, | 28     13.169f, 26.965f, 41.423f, 56.577f, 72.461f, 89.113f, 106.57f, 124.88f, | 
| 33     144.08f, 164.21f, 185.34f, 207.5f,  230.75f, 255.16f, 280.77f, 307.66f, | 29     144.08f, 164.21f, 185.34f, 207.5f,  230.75f, 255.16f, 280.77f, 307.66f, | 
| 34     335.9f,  365.56f, 396.71f, 429.44f, 463.84f, 500.f}; | 30     335.9f,  365.56f, 396.71f, 429.44f, 463.84f, 500.f}; | 
| 35 const float kTestFilterBank[][2] = {{0.055556f, 0.f}, | 31 const float kTestFilterBank[][9] = { | 
| 36                                     {0.055556f, 0.f}, | 32     {0.2f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 37                                     {0.055556f, 0.f}, | 33     {0.2f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 38                                     {0.055556f, 0.f}, | 34     {0.2f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 39                                     {0.055556f, 0.f}, | 35     {0.2f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 40                                     {0.055556f, 0.f}, | 36     {0.2f, 0.25f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 41                                     {0.055556f, 0.f}, | 37     {0.f, 0.25f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 42                                     {0.055556f, 0.f}, | 38     {0.f, 0.25f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 43                                     {0.055556f, 0.f}, | 39     {0.f, 0.25f, 0.25f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 44                                     {0.055556f, 0.f}, | 40     {0.f, 0.f, 0.25f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 45                                     {0.055556f, 0.f}, | 41     {0.f, 0.f, 0.25f, 0.142857f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 46                                     {0.055556f, 0.f}, | 42     {0.f, 0.f, 0.25f, 0.285714f, 0.f, 0.f, 0.f, 0.f, 0.f}, | 
| 47                                     {0.055556f, 0.f}, | 43     {0.f, 0.f, 0.f, 0.285714f, 0.142857f, 0.f, 0.f, 0.f, 0.f}, | 
| 48                                     {0.055556f, 0.f}, | 44     {0.f, 0.f, 0.f, 0.285714f, 0.285714f, 0.f, 0.f, 0.f, 0.f}, | 
| 49                                     {0.055556f, 0.f}, | 45     {0.f, 0.f, 0.f, 0.f, 0.285714f, 0.142857f, 0.f, 0.f, 0.f}, | 
| 50                                     {0.055556f, 0.f}, | 46     {0.f, 0.f, 0.f, 0.f, 0.285714f, 0.285714f, 0.f, 0.f, 0.f}, | 
| 51                                     {0.055556f, 0.f}, | 47     {0.f, 0.f, 0.f, 0.f, 0.f, 0.285714f, 0.142857f, 0.f, 0.f}, | 
| 52                                     {0.055556f, 0.2f}, | 48     {0.f, 0.f, 0.f, 0.f, 0.f, 0.285714f, 0.285714f, 0.f, 0.f}, | 
| 53                                     {0, 0.2f}, | 49     {0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.285714f, 0.142857f, 0.f}, | 
| 54                                     {0, 0.2f}, | 50     {0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.285714f, 0.285714f, 0.f}, | 
| 55                                     {0, 0.2f}, | 51     {0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.285714f, 0.f}, | 
| 56                                     {0, 0.2f}}; | 52     {0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.285714f, 0.5f}, | 
|  | 53     {0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.f, 0.5f}}; | 
| 57 static_assert(arraysize(kTestCenterFreqs) == arraysize(kTestFilterBank), | 54 static_assert(arraysize(kTestCenterFreqs) == arraysize(kTestFilterBank), | 
| 58               "Test filterbank badly initialized."); | 55               "Test filterbank badly initialized."); | 
| 59 | 56 | 
| 60 // Target output for gain solving test. Generated with matlab. | 57 // Target output for gain solving test. Generated with matlab. | 
| 61 const size_t kTestStartFreq = 12;  // Lowest integral frequency for ERBs. | 58 const size_t kTestStartFreq = 12;  // Lowest integral frequency for ERBs. | 
| 62 const float kTestZeroVar[] = {1.f, 1.f, 1.f, 1.f, 1.f, 1.f, 1.f, 1.f, | 59 const float kTestZeroVar[] = {1.f, 1.f, 1.f, 1.f, 1.f, 1.f, 1.f, 1.f, | 
| 63                               1.f, 1.f, 1.f, 0.f, 0.f, 0.f, 0.f, 0.f, | 60                               1.f, 1.f, 1.f, 0.f, 0.f, 0.f, 0.f, 0.f, | 
| 64                               0.f, 0.f, 0.f, 0.f, 0.f, 0.f}; | 61                               0.f, 0.f, 0.f, 0.f, 0.f, 0.f}; | 
| 65 static_assert(arraysize(kTestCenterFreqs) == arraysize(kTestZeroVar), | 62 static_assert(arraysize(kTestCenterFreqs) == arraysize(kTestZeroVar), | 
| 66               "Variance test data badly initialized."); | 63               "Power test data badly initialized."); | 
| 67 const float kTestNonZeroVarLambdaTop[] = { | 64 const float kTestNonZeroVarLambdaTop[] = { | 
| 68     1.f,     1.f,     1.f,     1.f,     1.f,     1.f,     1.f,     1.f, | 65     1.f,     1.f,     1.f,     1.f,     1.f,     1.f,     1.f,     1.f, | 
| 69     1.f,     1.f,     1.f,     0.f,     0.f,     0.0351f, 0.0636f, 0.0863f, | 66     1.f,     1.f,     1.f,     0.f,     0.f,     0.0351f, 0.0636f, 0.0863f, | 
| 70     0.1037f, 0.1162f, 0.1236f, 0.1251f, 0.1189f, 0.0993f}; | 67     0.1037f, 0.1162f, 0.1236f, 0.1251f, 0.1189f, 0.0993f}; | 
| 71 static_assert(arraysize(kTestCenterFreqs) == | 68 static_assert(arraysize(kTestCenterFreqs) == | 
| 72                   arraysize(kTestNonZeroVarLambdaTop), | 69                   arraysize(kTestNonZeroVarLambdaTop), | 
| 73               "Variance test data badly initialized."); | 70               "Power test data badly initialized."); | 
| 74 const float kMaxTestError = 0.005f; | 71 const float kMaxTestError = 0.005f; | 
| 75 | 72 | 
| 76 // Enhancer initialization parameters. | 73 // Enhancer initialization parameters. | 
| 77 const int kSamples = 2000; | 74 const int kSamples = 2000; | 
| 78 const int kSampleRate = 1000; | 75 const int kSampleRate = 1000; | 
| 79 const int kNumChannels = 1; | 76 const int kNumChannels = 1; | 
| 80 const int kFragmentSize = kSampleRate / 100; | 77 const int kFragmentSize = kSampleRate / 100; | 
| 81 | 78 | 
| 82 }  // namespace | 79 }  // namespace | 
| 83 | 80 | 
| 84 using std::vector; |  | 
| 85 using intelligibility::VarianceArray; |  | 
| 86 |  | 
| 87 class IntelligibilityEnhancerTest : public ::testing::Test { | 81 class IntelligibilityEnhancerTest : public ::testing::Test { | 
| 88  protected: | 82  protected: | 
| 89   IntelligibilityEnhancerTest() | 83   IntelligibilityEnhancerTest() | 
| 90       : clear_data_(kSamples), noise_data_(kSamples), orig_data_(kSamples) { | 84       : clear_data_(kSamples), noise_data_(kSamples), orig_data_(kSamples) { | 
| 91     config_.sample_rate_hz = kSampleRate; | 85     config_.sample_rate_hz = kSampleRate; | 
| 92     enh_.reset(new IntelligibilityEnhancer(config_)); | 86     enh_.reset(new IntelligibilityEnhancer(config_)); | 
| 93   } | 87   } | 
| 94 | 88 | 
| 95   bool CheckUpdate(VarianceArray::StepType step_type) { | 89   bool CheckUpdate() { | 
| 96     config_.sample_rate_hz = kSampleRate; | 90     config_.sample_rate_hz = kSampleRate; | 
| 97     config_.var_type = step_type; |  | 
| 98     enh_.reset(new IntelligibilityEnhancer(config_)); | 91     enh_.reset(new IntelligibilityEnhancer(config_)); | 
| 99     float* clear_cursor = &clear_data_[0]; | 92     float* clear_cursor = &clear_data_[0]; | 
| 100     float* noise_cursor = &noise_data_[0]; | 93     float* noise_cursor = &noise_data_[0]; | 
| 101     for (int i = 0; i < kSamples; i += kFragmentSize) { | 94     for (int i = 0; i < kSamples; i += kFragmentSize) { | 
| 102       enh_->ProcessRenderAudio(&clear_cursor, kSampleRate, kNumChannels); | 95       enh_->ProcessRenderAudio(&clear_cursor, kSampleRate, kNumChannels); | 
| 103       clear_cursor += kFragmentSize; | 96       clear_cursor += kFragmentSize; | 
| 104       noise_cursor += kFragmentSize; | 97       noise_cursor += kFragmentSize; | 
| 105     } | 98     } | 
| 106     for (int i = 0; i < kSamples; i++) { | 99     for (int i = 0; i < kSamples; i++) { | 
| 107       if (std::fabs(clear_data_[i] - orig_data_[i]) > kMaxTestError) { | 100       if (std::fabs(clear_data_[i] - orig_data_[i]) > kMaxTestError) { | 
| 108         return true; | 101         return true; | 
| 109       } | 102       } | 
| 110     } | 103     } | 
| 111     return false; | 104     return false; | 
| 112   } | 105   } | 
| 113 | 106 | 
| 114   IntelligibilityEnhancer::Config config_; | 107   IntelligibilityEnhancer::Config config_; | 
| 115   rtc::scoped_ptr<IntelligibilityEnhancer> enh_; | 108   rtc::scoped_ptr<IntelligibilityEnhancer> enh_; | 
| 116   vector<float> clear_data_; | 109   std::vector<float> clear_data_; | 
| 117   vector<float> noise_data_; | 110   std::vector<float> noise_data_; | 
| 118   vector<float> orig_data_; | 111   std::vector<float> orig_data_; | 
| 119 }; | 112 }; | 
| 120 | 113 | 
| 121 // For each class of generated data, tests that render stream is | 114 // For each class of generated data, tests that render stream is updated when | 
| 122 // updated when it should be for each variance update method. | 115 // it should be. | 
| 123 TEST_F(IntelligibilityEnhancerTest, TestRenderUpdate) { | 116 TEST_F(IntelligibilityEnhancerTest, TestRenderUpdate) { | 
| 124   vector<VarianceArray::StepType> step_types; |  | 
| 125   step_types.push_back(VarianceArray::kStepInfinite); |  | 
| 126   step_types.push_back(VarianceArray::kStepDecaying); |  | 
| 127   step_types.push_back(VarianceArray::kStepWindowed); |  | 
| 128   step_types.push_back(VarianceArray::kStepBlocked); |  | 
| 129   step_types.push_back(VarianceArray::kStepBlockBasedMovingAverage); |  | 
| 130   std::fill(noise_data_.begin(), noise_data_.end(), 0.0f); | 117   std::fill(noise_data_.begin(), noise_data_.end(), 0.0f); | 
| 131   std::fill(orig_data_.begin(), orig_data_.end(), 0.0f); | 118   std::fill(orig_data_.begin(), orig_data_.end(), 0.0f); | 
| 132   for (auto step_type : step_types) { | 119   std::fill(clear_data_.begin(), clear_data_.end(), 0.0f); | 
| 133     std::fill(clear_data_.begin(), clear_data_.end(), 0.0f); | 120   EXPECT_FALSE(CheckUpdate()); | 
| 134     EXPECT_FALSE(CheckUpdate(step_type)); |  | 
| 135   } |  | 
| 136   std::srand(1); | 121   std::srand(1); | 
| 137   auto float_rand = []() { return std::rand() * 2.f / RAND_MAX - 1; }; | 122   auto float_rand = []() { return std::rand() * 2.f / RAND_MAX - 1; }; | 
| 138   std::generate(noise_data_.begin(), noise_data_.end(), float_rand); | 123   std::generate(noise_data_.begin(), noise_data_.end(), float_rand); | 
| 139   for (auto step_type : step_types) { | 124   EXPECT_FALSE(CheckUpdate()); | 
| 140     EXPECT_FALSE(CheckUpdate(step_type)); | 125   std::generate(clear_data_.begin(), clear_data_.end(), float_rand); | 
| 141   } | 126   orig_data_ = clear_data_; | 
| 142   for (auto step_type : step_types) { | 127   EXPECT_TRUE(CheckUpdate()); | 
| 143     std::generate(clear_data_.begin(), clear_data_.end(), float_rand); |  | 
| 144     orig_data_ = clear_data_; |  | 
| 145     EXPECT_TRUE(CheckUpdate(step_type)); |  | 
| 146   } |  | 
| 147 } | 128 } | 
| 148 | 129 | 
| 149 // Tests ERB bank creation, comparing against matlab output. | 130 // Tests ERB bank creation, comparing against matlab output. | 
| 150 TEST_F(IntelligibilityEnhancerTest, TestErbCreation) { | 131 TEST_F(IntelligibilityEnhancerTest, TestErbCreation) { | 
| 151   ASSERT_EQ(arraysize(kTestCenterFreqs), enh_->bank_size_); | 132   ASSERT_EQ(arraysize(kTestCenterFreqs), enh_->bank_size_); | 
| 152   for (size_t i = 0; i < enh_->bank_size_; ++i) { | 133   for (size_t i = 0; i < enh_->bank_size_; ++i) { | 
| 153     EXPECT_NEAR(kTestCenterFreqs[i], enh_->center_freqs_[i], kMaxTestError); | 134     EXPECT_NEAR(kTestCenterFreqs[i], enh_->center_freqs_[i], kMaxTestError); | 
| 154     ASSERT_EQ(arraysize(kTestFilterBank[0]), enh_->freqs_); | 135     ASSERT_EQ(arraysize(kTestFilterBank[0]), enh_->freqs_); | 
| 155     for (size_t j = 0; j < enh_->freqs_; ++j) { | 136     for (size_t j = 0; j < enh_->freqs_; ++j) { | 
| 156       EXPECT_NEAR(kTestFilterBank[i][j], enh_->render_filter_bank_[i][j], | 137       EXPECT_NEAR(kTestFilterBank[i][j], enh_->render_filter_bank_[i][j], | 
| 157                   kMaxTestError); | 138                   kMaxTestError); | 
| 158     } | 139     } | 
| 159   } | 140   } | 
| 160 } | 141 } | 
| 161 | 142 | 
| 162 // Tests analytic solution for optimal gains, comparing | 143 // Tests analytic solution for optimal gains, comparing | 
| 163 // against matlab output. | 144 // against matlab output. | 
| 164 TEST_F(IntelligibilityEnhancerTest, TestSolveForGains) { | 145 TEST_F(IntelligibilityEnhancerTest, TestSolveForGains) { | 
| 165   ASSERT_EQ(kTestStartFreq, enh_->start_freq_); | 146   ASSERT_EQ(kTestStartFreq, enh_->start_freq_); | 
| 166   vector<float> sols(enh_->bank_size_); | 147   std::vector<float> sols(enh_->bank_size_); | 
| 167   float lambda = -0.001f; | 148   float lambda = -0.001f; | 
| 168   for (size_t i = 0; i < enh_->bank_size_; i++) { | 149   for (size_t i = 0; i < enh_->bank_size_; i++) { | 
| 169     enh_->filtered_clear_var_[i] = 0.0f; | 150     enh_->filtered_clear_pow_[i] = 0.0f; | 
| 170     enh_->filtered_noise_var_[i] = 0.0f; | 151     enh_->filtered_noise_pow_[i] = 0.0f; | 
| 171     enh_->rho_[i] = 0.02f; | 152     enh_->rho_[i] = 0.02f; | 
| 172   } | 153   } | 
| 173   enh_->SolveForGainsGivenLambda(lambda, enh_->start_freq_, &sols[0]); | 154   enh_->SolveForGainsGivenLambda(lambda, enh_->start_freq_, &sols[0]); | 
| 174   for (size_t i = 0; i < enh_->bank_size_; i++) { | 155   for (size_t i = 0; i < enh_->bank_size_; i++) { | 
| 175     EXPECT_NEAR(kTestZeroVar[i], sols[i], kMaxTestError); | 156     EXPECT_NEAR(kTestZeroVar[i], sols[i], kMaxTestError); | 
| 176   } | 157   } | 
| 177   for (size_t i = 0; i < enh_->bank_size_; i++) { | 158   for (size_t i = 0; i < enh_->bank_size_; i++) { | 
| 178     enh_->filtered_clear_var_[i] = static_cast<float>(i + 1); | 159     enh_->filtered_clear_pow_[i] = static_cast<float>(i + 1); | 
| 179     enh_->filtered_noise_var_[i] = static_cast<float>(enh_->bank_size_ - i); | 160     enh_->filtered_noise_pow_[i] = static_cast<float>(enh_->bank_size_ - i); | 
| 180   } | 161   } | 
| 181   enh_->SolveForGainsGivenLambda(lambda, enh_->start_freq_, &sols[0]); | 162   enh_->SolveForGainsGivenLambda(lambda, enh_->start_freq_, &sols[0]); | 
| 182   for (size_t i = 0; i < enh_->bank_size_; i++) { | 163   for (size_t i = 0; i < enh_->bank_size_; i++) { | 
| 183     EXPECT_NEAR(kTestNonZeroVarLambdaTop[i], sols[i], kMaxTestError); | 164     EXPECT_NEAR(kTestNonZeroVarLambdaTop[i], sols[i], kMaxTestError); | 
| 184   } | 165   } | 
| 185   lambda = -1.0; | 166   lambda = -1.0; | 
| 186   enh_->SolveForGainsGivenLambda(lambda, enh_->start_freq_, &sols[0]); | 167   enh_->SolveForGainsGivenLambda(lambda, enh_->start_freq_, &sols[0]); | 
| 187   for (size_t i = 0; i < enh_->bank_size_; i++) { | 168   for (size_t i = 0; i < enh_->bank_size_; i++) { | 
| 188     EXPECT_NEAR(kTestZeroVar[i], sols[i], kMaxTestError); | 169     EXPECT_NEAR(kTestZeroVar[i], sols[i], kMaxTestError); | 
| 189   } | 170   } | 
| 190 } | 171 } | 
| 191 | 172 | 
| 192 }  // namespace webrtc | 173 }  // namespace webrtc | 
| OLD | NEW | 
|---|