/*
 *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#ifndef MODULES_AUDIO_PROCESSING_AGC2_RNN_VAD_FEATURES_EXTRACTION_H_
#define MODULES_AUDIO_PROCESSING_AGC2_RNN_VAD_FEATURES_EXTRACTION_H_

// NOTE(review): the header name of the following #include is missing in this
// copy of the file. `std::vector` is used below, so it is presumably
// <vector> - confirm against the upstream file.
#include

#include "api/array_view.h"
#include "modules/audio_processing/agc2/biquad_filter.h"
#include "modules/audio_processing/agc2/rnn_vad/common.h"
#include "modules/audio_processing/agc2/rnn_vad/pitch_search.h"
#include "modules/audio_processing/agc2/rnn_vad/sequence_buffer.h"
#include "modules/audio_processing/agc2/rnn_vad/spectral_features.h"

namespace webrtc {
namespace rnn_vad {

// Feature extractor to feed the VAD RNN.
//
// Instances cannot be copied: the copy constructor and the copy assignment
// operator are deleted.
//
// NOTE(review): in this copy of the file the template argument lists of
// `rtc::ArrayView`, `SequenceBuffer` and `std::vector` are absent (e.g.
// `std::vector lp_residual_;`), which is not valid for non-static data
// members. They appear to have been stripped together with the `#include`
// header name above; restore them from the upstream file before compiling.
class FeaturesExtractor {
 public:
  // `explicit` prevents implicit conversions from `AvailableCpuFeatures`.
  // How `cpu_features` is used is defined in the implementation file.
  explicit FeaturesExtractor(const AvailableCpuFeatures& cpu_features);
  FeaturesExtractor(const FeaturesExtractor&) = delete;
  FeaturesExtractor& operator=(const FeaturesExtractor&) = delete;
  ~FeaturesExtractor();
  // Presumably restores the internal state to its initial condition; see the
  // implementation file for which members are affected.
  void Reset();
  // Analyzes the samples, computes the feature vector and returns true if
  // silence is detected (false if not). When silence is detected,
  // `feature_vector` is partially written and therefore must not be used to
  // feed the VAD RNN.
  bool CheckSilenceComputeFeatures(
      rtc::ArrayView samples,
      rtc::ArrayView feature_vector);

 private:
  // Data members are initialized in declaration order. Several members below
  // are views, presumably onto the buffers declared just before them (confirm
  // in the constructor), so do not reorder the declarations without checking
  // the constructor's initializer list.

  // Fixed at construction time (const member).
  const bool use_high_pass_filter_;
  // TODO(bugs.webrtc.org/7494): Remove HPF depending on how AGC2 is used in APM
  // and on whether an HPF is already used as pre-processing step in APM.
  BiQuadFilter hpf_;
  SequenceBuffer pitch_buf_24kHz_;
  // Presumably a view onto `pitch_buf_24kHz_` - confirm in the constructor.
  rtc::ArrayView pitch_buf_24kHz_view_;
  std::vector lp_residual_;
  // Presumably a view onto `lp_residual_` - confirm in the constructor.
  rtc::ArrayView lp_residual_view_;
  PitchEstimator pitch_estimator_;
  rtc::ArrayView reference_frame_view_;
  SpectralFeaturesExtractor spectral_features_extractor_;
  int pitch_period_48kHz_;
};

}  // namespace rnn_vad
}  // namespace webrtc

#endif  // MODULES_AUDIO_PROCESSING_AGC2_RNN_VAD_FEATURES_EXTRACTION_H_