mirror of
https://github.com/danog/libtgvoip.git
synced 2025-01-09 14:18:24 +01:00
49 lines
1.5 KiB
C
49 lines
1.5 KiB
C
|
/*
|
||
|
* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
|
||
|
*
|
||
|
* Use of this source code is governed by a BSD-style license
|
||
|
* that can be found in the LICENSE file in the root of the source
|
||
|
* tree. An additional intellectual property rights grant can be found
|
||
|
* in the file PATENTS. All contributing project authors may
|
||
|
* be found in the AUTHORS file in the root of the source tree.
|
||
|
*/
|
||
|
|
||
|
#ifndef MODULES_AUDIO_PROCESSING_AGC2_VAD_WITH_LEVEL_H_
|
||
|
#define MODULES_AUDIO_PROCESSING_AGC2_VAD_WITH_LEVEL_H_
|
||
|
|
||
|
#include "common_audio/resampler/include/push_resampler.h"
|
||
|
#include "modules/audio_processing/agc2/rnn_vad/features_extraction.h"
|
||
|
#include "modules/audio_processing/agc2/rnn_vad/rnn.h"
|
||
|
#include "modules/audio_processing/include/audio_frame_view.h"
|
||
|
|
||
|
namespace webrtc {
|
||
|
class VadWithLevel {
|
||
|
public:
|
||
|
struct LevelAndProbability {
|
||
|
constexpr LevelAndProbability(float prob, float rms, float peak)
|
||
|
: speech_probability(prob),
|
||
|
speech_rms_dbfs(rms),
|
||
|
speech_peak_dbfs(peak) {}
|
||
|
LevelAndProbability() = default;
|
||
|
float speech_probability = 0;
|
||
|
float speech_rms_dbfs = 0; // Root mean square in decibels to full-scale.
|
||
|
float speech_peak_dbfs = 0;
|
||
|
};
|
||
|
|
||
|
VadWithLevel();
|
||
|
~VadWithLevel();
|
||
|
|
||
|
LevelAndProbability AnalyzeFrame(AudioFrameView<const float> frame);
|
||
|
|
||
|
private:
|
||
|
void SetSampleRate(int sample_rate_hz);
|
||
|
|
||
|
rnn_vad::RnnBasedVad rnn_vad_;
|
||
|
rnn_vad::FeaturesExtractor features_extractor_;
|
||
|
PushResampler<float> resampler_;
|
||
|
};
|
||
|
|
||
|
} // namespace webrtc
|
||
|
|
||
|
#endif // MODULES_AUDIO_PROCESSING_AGC2_VAD_WITH_LEVEL_H_
|