/* * Copyright (c) 2018 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #ifndef MODULES_AUDIO_PROCESSING_AGC2_VAD_WITH_LEVEL_H_ #define MODULES_AUDIO_PROCESSING_AGC2_VAD_WITH_LEVEL_H_ #include "common_audio/resampler/include/push_resampler.h" #include "modules/audio_processing/agc2/rnn_vad/features_extraction.h" #include "modules/audio_processing/agc2/rnn_vad/rnn.h" #include "modules/audio_processing/include/audio_frame_view.h" namespace webrtc { class VadWithLevel { public: struct LevelAndProbability { constexpr LevelAndProbability(float prob, float rms, float peak) : speech_probability(prob), speech_rms_dbfs(rms), speech_peak_dbfs(peak) {} LevelAndProbability() = default; float speech_probability = 0; float speech_rms_dbfs = 0; // Root mean square in decibels to full-scale. float speech_peak_dbfs = 0; }; VadWithLevel(); ~VadWithLevel(); LevelAndProbability AnalyzeFrame(AudioFrameView frame); private: void SetSampleRate(int sample_rate_hz); rnn_vad::RnnBasedVad rnn_vad_; rnn_vad::FeaturesExtractor features_extractor_; PushResampler resampler_; }; } // namespace webrtc #endif // MODULES_AUDIO_PROCESSING_AGC2_VAD_WITH_LEVEL_H_