/* * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include "modules/audio_processing/aec3/subtractor.h" #include #include #include #include #include "modules/audio_processing/aec3/aec_state.h" #include "modules/audio_processing/aec3/render_delay_buffer.h" #include "modules/audio_processing/test/echo_canceller_test_tools.h" #include "modules/audio_processing/utility/cascaded_biquad_filter.h" #include "rtc_base/random.h" #include "rtc_base/strings/string_builder.h" #include "test/gtest.h" namespace webrtc { namespace { std::vector RunSubtractorTest( size_t num_render_channels, size_t num_capture_channels, int num_blocks_to_process, int delay_samples, int refined_filter_length_blocks, int coarse_filter_length_blocks, bool uncorrelated_inputs, const std::vector& blocks_with_echo_path_changes) { ApmDataDumper data_dumper(42); constexpr int kSampleRateHz = 48000; constexpr size_t kNumBands = NumBandsForRate(kSampleRateHz); EchoCanceller3Config config; config.filter.refined.length_blocks = refined_filter_length_blocks; config.filter.coarse.length_blocks = coarse_filter_length_blocks; Subtractor subtractor(config, num_render_channels, num_capture_channels, &data_dumper, DetectOptimization()); absl::optional delay_estimate; Block x(kNumBands, num_render_channels); Block y(/*num_bands=*/1, num_capture_channels); std::array x_old; std::vector output(num_capture_channels); config.delay.default_delay = 1; std::unique_ptr render_delay_buffer( RenderDelayBuffer::Create(config, kSampleRateHz, num_render_channels)); RenderSignalAnalyzer render_signal_analyzer(config); Random random_generator(42U); Aec3Fft fft; std::vector> Y2(num_capture_channels); std::vector> E2_refined( num_capture_channels); std::array E2_coarse; AecState aec_state(config, num_capture_channels); x_old.fill(0.f); for (auto& Y2_ch : Y2) { Y2_ch.fill(0.f); } for (auto& E2_refined_ch : E2_refined) { E2_refined_ch.fill(0.f); } E2_coarse.fill(0.f); std::vector>>> delay_buffer( num_capture_channels); for (size_t capture_ch = 0; capture_ch < num_capture_channels; ++capture_ch) { delay_buffer[capture_ch].resize(num_render_channels); for (size_t render_ch = 0; render_ch < num_render_channels; ++render_ch) { delay_buffer[capture_ch][render_ch] = std::make_unique>(delay_samples); } } // [B,A] = butter(2,100/8000,'high') constexpr CascadedBiQuadFilter::BiQuadCoefficients kHighPassFilterCoefficients = {{0.97261f, -1.94523f, 0.97261f}, {-1.94448f, 0.94598f}}; std::vector> x_hp_filter( num_render_channels); for (size_t ch = 0; ch < num_render_channels; ++ch) { x_hp_filter[ch] = std::make_unique(kHighPassFilterCoefficients, 1); } std::vector> y_hp_filter( num_capture_channels); for (size_t ch = 0; ch < num_capture_channels; ++ch) { y_hp_filter[ch] = std::make_unique(kHighPassFilterCoefficients, 1); } for (int k = 0; k < num_blocks_to_process; ++k) { for (size_t render_ch = 0; render_ch < num_render_channels; ++render_ch) { RandomizeSampleVector(&random_generator, x.View(/*band=*/0, render_ch)); } if (uncorrelated_inputs) { for (size_t capture_ch = 0; capture_ch < num_capture_channels; ++capture_ch) { RandomizeSampleVector(&random_generator, y.View(/*band=*/0, capture_ch)); } } else { for (size_t capture_ch = 0; capture_ch < num_capture_channels; ++capture_ch) { rtc::ArrayView y_view = y.View(/*band=*/0, capture_ch); for (size_t render_ch = 0; render_ch < num_render_channels; ++render_ch) { std::array y_channel; delay_buffer[capture_ch][render_ch]->Delay( x.View(/*band=*/0, render_ch), y_channel); for (size_t k = 0; k < kBlockSize; ++k) { y_view[k] += y_channel[k] / num_render_channels; } } } } for (size_t ch = 0; ch < num_render_channels; ++ch) { x_hp_filter[ch]->Process(x.View(/*band=*/0, ch)); } for (size_t ch = 0; ch < num_capture_channels; ++ch) { y_hp_filter[ch]->Process(y.View(/*band=*/0, ch)); } render_delay_buffer->Insert(x); if (k == 0) { render_delay_buffer->Reset(); } render_delay_buffer->PrepareCaptureProcessing(); render_signal_analyzer.Update(*render_delay_buffer->GetRenderBuffer(), aec_state.MinDirectPathFilterDelay()); // Handle echo path changes. if (std::find(blocks_with_echo_path_changes.begin(), blocks_with_echo_path_changes.end(), k) != blocks_with_echo_path_changes.end()) { subtractor.HandleEchoPathChange(EchoPathVariability( true, EchoPathVariability::DelayAdjustment::kNewDetectedDelay, false)); } subtractor.Process(*render_delay_buffer->GetRenderBuffer(), y, render_signal_analyzer, aec_state, output); aec_state.HandleEchoPathChange(EchoPathVariability( false, EchoPathVariability::DelayAdjustment::kNone, false)); aec_state.Update(delay_estimate, subtractor.FilterFrequencyResponses(), subtractor.FilterImpulseResponses(), *render_delay_buffer->GetRenderBuffer(), E2_refined, Y2, output); } std::vector results(num_capture_channels); for (size_t ch = 0; ch < num_capture_channels; ++ch) { const float output_power = std::inner_product( output[ch].e_refined.begin(), output[ch].e_refined.end(), output[ch].e_refined.begin(), 0.f); const float y_power = std::inner_product(y.begin(/*band=*/0, ch), y.end(/*band=*/0, ch), y.begin(/*band=*/0, ch), 0.f); if (y_power == 0.f) { ADD_FAILURE(); results[ch] = -1.f; } results[ch] = output_power / y_power; } return results; } std::string ProduceDebugText(size_t num_render_channels, size_t num_capture_channels, size_t delay, int filter_length_blocks) { rtc::StringBuilder ss; ss << "delay: " << delay << ", "; ss << "filter_length_blocks:" << filter_length_blocks << ", "; ss << "num_render_channels:" << num_render_channels << ", "; ss << "num_capture_channels:" << num_capture_channels; return ss.Release(); } } // namespace #if RTC_DCHECK_IS_ON && GTEST_HAS_DEATH_TEST && !defined(WEBRTC_ANDROID) // Verifies that the check for non data dumper works. TEST(SubtractorDeathTest, NullDataDumper) { EXPECT_DEATH( Subtractor(EchoCanceller3Config(), 1, 1, nullptr, DetectOptimization()), ""); } #endif // Verifies that the subtractor is able to converge on correlated data. TEST(Subtractor, Convergence) { std::vector blocks_with_echo_path_changes; for (size_t filter_length_blocks : {12, 20, 30}) { for (size_t delay_samples : {0, 64, 150, 200, 301}) { SCOPED_TRACE(ProduceDebugText(1, 1, delay_samples, filter_length_blocks)); std::vector echo_to_nearend_powers = RunSubtractorTest( 1, 1, 2500, delay_samples, filter_length_blocks, filter_length_blocks, false, blocks_with_echo_path_changes); for (float echo_to_nearend_power : echo_to_nearend_powers) { EXPECT_GT(0.1f, echo_to_nearend_power); } } } } // Verifies that the subtractor is able to handle the case when the refined // filter is longer than the coarse filter. TEST(Subtractor, RefinedFilterLongerThanCoarseFilter) { std::vector blocks_with_echo_path_changes; std::vector echo_to_nearend_powers = RunSubtractorTest( 1, 1, 400, 64, 20, 15, false, blocks_with_echo_path_changes); for (float echo_to_nearend_power : echo_to_nearend_powers) { EXPECT_GT(0.5f, echo_to_nearend_power); } } // Verifies that the subtractor is able to handle the case when the coarse // filter is longer than the refined filter. TEST(Subtractor, CoarseFilterLongerThanRefinedFilter) { std::vector blocks_with_echo_path_changes; std::vector echo_to_nearend_powers = RunSubtractorTest( 1, 1, 400, 64, 15, 20, false, blocks_with_echo_path_changes); for (float echo_to_nearend_power : echo_to_nearend_powers) { EXPECT_GT(0.5f, echo_to_nearend_power); } } // Verifies that the subtractor does not converge on uncorrelated signals. TEST(Subtractor, NonConvergenceOnUncorrelatedSignals) { std::vector blocks_with_echo_path_changes; for (size_t filter_length_blocks : {12, 20, 30}) { for (size_t delay_samples : {0, 64, 150, 200, 301}) { SCOPED_TRACE(ProduceDebugText(1, 1, delay_samples, filter_length_blocks)); std::vector echo_to_nearend_powers = RunSubtractorTest( 1, 1, 3000, delay_samples, filter_length_blocks, filter_length_blocks, true, blocks_with_echo_path_changes); for (float echo_to_nearend_power : echo_to_nearend_powers) { EXPECT_NEAR(1.f, echo_to_nearend_power, 0.1); } } } } class SubtractorMultiChannelUpToEightRender : public ::testing::Test, public ::testing::WithParamInterface> {}; #if defined(NDEBUG) INSTANTIATE_TEST_SUITE_P(NonDebugMultiChannel, SubtractorMultiChannelUpToEightRender, ::testing::Combine(::testing::Values(1, 2, 8), ::testing::Values(1, 2, 4))); #else INSTANTIATE_TEST_SUITE_P(DebugMultiChannel, SubtractorMultiChannelUpToEightRender, ::testing::Combine(::testing::Values(1, 2), ::testing::Values(1, 2))); #endif // Verifies that the subtractor is able to converge on correlated data. TEST_P(SubtractorMultiChannelUpToEightRender, Convergence) { const size_t num_render_channels = std::get<0>(GetParam()); const size_t num_capture_channels = std::get<1>(GetParam()); std::vector blocks_with_echo_path_changes; size_t num_blocks_to_process = 2500 * num_render_channels; std::vector echo_to_nearend_powers = RunSubtractorTest( num_render_channels, num_capture_channels, num_blocks_to_process, 64, 20, 20, false, blocks_with_echo_path_changes); for (float echo_to_nearend_power : echo_to_nearend_powers) { EXPECT_GT(0.1f, echo_to_nearend_power); } } class SubtractorMultiChannelUpToFourRender : public ::testing::Test, public ::testing::WithParamInterface> {}; #if defined(NDEBUG) INSTANTIATE_TEST_SUITE_P(NonDebugMultiChannel, SubtractorMultiChannelUpToFourRender, ::testing::Combine(::testing::Values(1, 2, 4), ::testing::Values(1, 2, 4))); #else INSTANTIATE_TEST_SUITE_P(DebugMultiChannel, SubtractorMultiChannelUpToFourRender, ::testing::Combine(::testing::Values(1, 2), ::testing::Values(1, 2))); #endif // Verifies that the subtractor does not converge on uncorrelated signals. TEST_P(SubtractorMultiChannelUpToFourRender, NonConvergenceOnUncorrelatedSignals) { const size_t num_render_channels = std::get<0>(GetParam()); const size_t num_capture_channels = std::get<1>(GetParam()); std::vector blocks_with_echo_path_changes; size_t num_blocks_to_process = 5000 * num_render_channels; std::vector echo_to_nearend_powers = RunSubtractorTest( num_render_channels, num_capture_channels, num_blocks_to_process, 64, 20, 20, true, blocks_with_echo_path_changes); for (float echo_to_nearend_power : echo_to_nearend_powers) { EXPECT_LT(.8f, echo_to_nearend_power); EXPECT_NEAR(1.f, echo_to_nearend_power, 0.25f); } } } // namespace webrtc