AGC2 component that computes and applies the digital gain. The gain is computed from an estimated speech and noise level. This component decides how fast the gain can change and what it should be. Bug: webrtc:7494 Change-Id: If55b6e5c765f958e433730cd9e3b2b93c14a7910 Reviewed-on: https://webrtc-review.googlesource.com/64985 Commit-Queue: Alex Loiko <aleloi@webrtc.org> Reviewed-by: Alessio Bazzica <alessiob@webrtc.org> Cr-Commit-Position: refs/heads/master@{#22741}
65 lines
2.3 KiB
C++
65 lines
2.3 KiB
C++
/*
|
|
* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include "modules/audio_processing/agc2/adaptive_agc.h"
|
|
|
|
#include <algorithm>
|
|
#include <numeric>
|
|
|
|
#include "common_audio/include/audio_util.h"
|
|
#include "modules/audio_processing/logging/apm_data_dumper.h"
|
|
#include "modules/audio_processing/vad/voice_activity_detector.h"
|
|
|
|
namespace webrtc {
|
|
|
|
AdaptiveAgc::AdaptiveAgc(ApmDataDumper* apm_data_dumper)
|
|
: speech_level_estimator_(apm_data_dumper),
|
|
gain_applier_(apm_data_dumper),
|
|
apm_data_dumper_(apm_data_dumper),
|
|
noise_level_estimator_(apm_data_dumper) {
|
|
RTC_DCHECK(apm_data_dumper);
|
|
}
|
|
|
|
AdaptiveAgc::~AdaptiveAgc() = default;
|
|
|
|
void AdaptiveAgc::Process(AudioFrameView<float> float_frame) {
|
|
// TODO(webrtc:7494): Remove this loop. Remove the vectors from
|
|
// VadWithData after we move to a VAD that outputs an estimate every
|
|
// kFrameDurationMs ms.
|
|
//
|
|
// Some VADs are 'bursty'. They return several estimates for some
|
|
// frames, and no estimates for other frames. We want to feed all to
|
|
// the level estimator, but only care about the last level it
|
|
// produces.
|
|
rtc::ArrayView<const VadWithLevel::LevelAndProbability> vad_results =
|
|
vad_.AnalyzeFrame(float_frame);
|
|
for (const auto& vad_result : vad_results) {
|
|
apm_data_dumper_->DumpRaw("agc2_vad_probability",
|
|
vad_result.speech_probability);
|
|
apm_data_dumper_->DumpRaw("agc2_vad_rms_dbfs", vad_result.speech_rms_dbfs);
|
|
|
|
apm_data_dumper_->DumpRaw("agc2_vad_peak_dbfs",
|
|
vad_result.speech_peak_dbfs);
|
|
speech_level_estimator_.UpdateEstimation(vad_result);
|
|
}
|
|
|
|
const float speech_level_dbfs = speech_level_estimator_.LatestLevelEstimate();
|
|
|
|
const float noise_level_dbfs = noise_level_estimator_.Analyze(float_frame);
|
|
|
|
apm_data_dumper_->DumpRaw("agc2_noise_estimate_dbfs", noise_level_dbfs);
|
|
|
|
// The gain applier applies the gain.
|
|
gain_applier_.Process(speech_level_dbfs, noise_level_dbfs, vad_results,
|
|
float_frame);
|
|
}
|
|
|
|
} // namespace webrtc
|