mirror of
https://github.com/danog/libtgvoip.git
synced 2025-01-08 13:48:41 +01:00
5caaaafa42
I'm now using the entire audio processing module from WebRTC as opposed to individual DSP algorithms pulled from there before. Seems to work better this way.
184 lines
6.6 KiB
C++
184 lines
6.6 KiB
C++
/*
|
|
* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#ifndef MODULES_AUDIO_PROCESSING_ECHO_CANCELLATION_IMPL_H_
|
|
#define MODULES_AUDIO_PROCESSING_ECHO_CANCELLATION_IMPL_H_
|
|
|
|
#include <stddef.h>
|
|
#include <memory>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
#include "api/array_view.h"
|
|
#include "modules/audio_processing/include/audio_processing.h"
|
|
#include "rtc_base/constructormagic.h"
|
|
#include "rtc_base/criticalsection.h"
|
|
#include "rtc_base/thread_annotations.h"
|
|
|
|
namespace webrtc {
|
|
|
|
class AudioBuffer;
|
|
|
|
// The acoustic echo cancellation (AEC) component provides better performance
|
|
// than AECM but also requires more processing power and is dependent on delay
|
|
// stability and reporting accuracy. As such it is well-suited and recommended
|
|
// for PC and IP phone applications.
|
|
class EchoCancellationImpl {
|
|
public:
|
|
explicit EchoCancellationImpl();
|
|
~EchoCancellationImpl();
|
|
|
|
void ProcessRenderAudio(rtc::ArrayView<const float> packed_render_audio);
|
|
int ProcessCaptureAudio(AudioBuffer* audio, int stream_delay_ms);
|
|
|
|
int Enable(bool enable);
|
|
bool is_enabled() const;
|
|
|
|
// Differences in clock speed on the primary and reverse streams can impact
|
|
// the AEC performance. On the client-side, this could be seen when different
|
|
// render and capture devices are used, particularly with webcams.
|
|
//
|
|
// This enables a compensation mechanism, and requires that
|
|
// set_stream_drift_samples() be called.
|
|
int enable_drift_compensation(bool enable);
|
|
bool is_drift_compensation_enabled() const;
|
|
|
|
// Sets the difference between the number of samples rendered and captured by
|
|
// the audio devices since the last call to |ProcessStream()|. Must be called
|
|
// if drift compensation is enabled, prior to |ProcessStream()|.
|
|
void set_stream_drift_samples(int drift);
|
|
int stream_drift_samples() const;
|
|
|
|
enum SuppressionLevel {
|
|
kLowSuppression,
|
|
kModerateSuppression,
|
|
kHighSuppression
|
|
};
|
|
|
|
// Sets the aggressiveness of the suppressor. A higher level trades off
|
|
// double-talk performance for increased echo suppression.
|
|
int set_suppression_level(SuppressionLevel level);
|
|
SuppressionLevel suppression_level() const;
|
|
|
|
// Returns false if the current frame almost certainly contains no echo
|
|
// and true if it _might_ contain echo.
|
|
bool stream_has_echo() const;
|
|
|
|
// Enables the computation of various echo metrics. These are obtained
|
|
// through |GetMetrics()|.
|
|
int enable_metrics(bool enable);
|
|
bool are_metrics_enabled() const;
|
|
|
|
// Each statistic is reported in dB.
|
|
// P_far: Far-end (render) signal power.
|
|
// P_echo: Near-end (capture) echo signal power.
|
|
// P_out: Signal power at the output of the AEC.
|
|
// P_a: Internal signal power at the point before the AEC's non-linear
|
|
// processor.
|
|
struct Metrics {
|
|
struct Statistic {
|
|
int instant = 0; // Instantaneous value.
|
|
int average = 0; // Long-term average.
|
|
int maximum = 0; // Long-term maximum.
|
|
int minimum = 0; // Long-term minimum.
|
|
};
|
|
// RERL = ERL + ERLE
|
|
Statistic residual_echo_return_loss;
|
|
|
|
// ERL = 10log_10(P_far / P_echo)
|
|
Statistic echo_return_loss;
|
|
|
|
// ERLE = 10log_10(P_echo / P_out)
|
|
Statistic echo_return_loss_enhancement;
|
|
|
|
// (Pre non-linear processing suppression) A_NLP = 10log_10(P_echo / P_a)
|
|
Statistic a_nlp;
|
|
|
|
// Fraction of time that the AEC linear filter is divergent, in a 1-second
|
|
// non-overlapped aggregation window.
|
|
float divergent_filter_fraction;
|
|
};
|
|
|
|
// Provides various statistics about the AEC.
|
|
int GetMetrics(Metrics* metrics);
|
|
|
|
// Enables computation and logging of delay values. Statistics are obtained
|
|
// through |GetDelayMetrics()|.
|
|
int enable_delay_logging(bool enable);
|
|
bool is_delay_logging_enabled() const;
|
|
|
|
// Provides delay metrics.
|
|
// The delay metrics consists of the delay |median| and the delay standard
|
|
// deviation |std|. It also consists of the fraction of delay estimates
|
|
// |fraction_poor_delays| that can make the echo cancellation perform poorly.
|
|
// The values are aggregated until the first call to |GetDelayMetrics()| and
|
|
// afterwards aggregated and updated every second.
|
|
// Note that if there are several clients pulling metrics from
|
|
// |GetDelayMetrics()| during a session the first call from any of them will
|
|
// change to one second aggregation window for all.
|
|
int GetDelayMetrics(int* median, int* std);
|
|
int GetDelayMetrics(int* median, int* std, float* fraction_poor_delays);
|
|
|
|
// Returns a pointer to the low level AEC component. In case of multiple
|
|
// channels, the pointer to the first one is returned. A NULL pointer is
|
|
// returned when the AEC component is disabled or has not been initialized
|
|
// successfully.
|
|
struct AecCore* aec_core() const;
|
|
|
|
void Initialize(int sample_rate_hz,
|
|
size_t num_reverse_channels_,
|
|
size_t num_output_channels_,
|
|
size_t num_proc_channels_);
|
|
void SetExtraOptions(const webrtc::Config& config);
|
|
bool is_delay_agnostic_enabled() const;
|
|
bool is_extended_filter_enabled() const;
|
|
std::string GetExperimentsDescription();
|
|
bool is_refined_adaptive_filter_enabled() const;
|
|
|
|
// Returns the system delay of the first AEC component.
|
|
int GetSystemDelayInSamples() const;
|
|
|
|
static void PackRenderAudioBuffer(const AudioBuffer* audio,
|
|
size_t num_output_channels,
|
|
size_t num_channels,
|
|
std::vector<float>* packed_buffer);
|
|
static size_t NumCancellersRequired(size_t num_output_channels,
|
|
size_t num_reverse_channels);
|
|
|
|
private:
|
|
class Canceller;
|
|
struct StreamProperties;
|
|
|
|
void AllocateRenderQueue();
|
|
int Configure();
|
|
|
|
bool enabled_ = false;
|
|
bool drift_compensation_enabled_;
|
|
bool metrics_enabled_;
|
|
SuppressionLevel suppression_level_;
|
|
int stream_drift_samples_;
|
|
bool was_stream_drift_set_;
|
|
bool stream_has_echo_;
|
|
bool delay_logging_enabled_;
|
|
bool extended_filter_enabled_;
|
|
bool delay_agnostic_enabled_;
|
|
bool refined_adaptive_filter_enabled_ = false;
|
|
|
|
// Only active on Chrome OS devices.
|
|
const bool enforce_zero_stream_delay_;
|
|
|
|
std::vector<std::unique_ptr<Canceller>> cancellers_;
|
|
std::unique_ptr<StreamProperties> stream_properties_;
|
|
};
|
|
|
|
} // namespace webrtc
|
|
|
|
#endif // MODULES_AUDIO_PROCESSING_ECHO_CANCELLATION_IMPL_H_
|