- Code clean: exploiting the recently added ArrayView ctor for std::array - Pitch search internal unit test: long const arrays moved to a resource file - Minor changes Bug: webrtc:9076 Change-Id: Iaf30753f2498b4568860d72e0b81f5351235692f TBR: aleloi@webrtc.org Reviewed-on: https://webrtc-review.googlesource.com/76920 Commit-Queue: Alessio Bazzica <alessiob@webrtc.org> Reviewed-by: Alessio Bazzica <alessiob@webrtc.org> Cr-Commit-Position: refs/heads/master@{#23248}
57 lines
2.3 KiB
C++
57 lines
2.3 KiB
C++
/*
|
|
* Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include "modules/audio_processing/agc2/rnn_vad/pitch_search.h"
|
|
|
|
namespace webrtc {
|
|
namespace rnn_vad {
|
|
|
|
PitchEstimator::PitchEstimator()
|
|
: fft_(RealFourier::Create(kAutoCorrelationFftOrder)),
|
|
pitch_buf_decimated_(kBufSize12kHz),
|
|
pitch_buf_decimated_view_(pitch_buf_decimated_.data(), kBufSize12kHz),
|
|
auto_corr_(kNumInvertedLags12kHz),
|
|
auto_corr_view_(auto_corr_.data(), kNumInvertedLags12kHz) {
|
|
RTC_DCHECK_EQ(kBufSize12kHz, pitch_buf_decimated_.size());
|
|
RTC_DCHECK_EQ(kNumInvertedLags12kHz, auto_corr_view_.size());
|
|
}
|
|
|
|
PitchEstimator::~PitchEstimator() = default;
|
|
|
|
PitchInfo PitchEstimator::Estimate(
|
|
rtc::ArrayView<const float, kBufSize24kHz> pitch_buf) {
|
|
// Perform the initial pitch search at 12 kHz.
|
|
Decimate2x(pitch_buf, pitch_buf_decimated_view_);
|
|
// Compute auto-correlation terms.
|
|
ComputePitchAutoCorrelation(pitch_buf_decimated_view_, kMaxPitch12kHz,
|
|
auto_corr_view_, fft_.get());
|
|
|
|
// Search for pitch at 12 kHz.
|
|
std::array<size_t, 2> pitch_candidates_inv_lags = FindBestPitchPeriods(
|
|
auto_corr_view_, pitch_buf_decimated_view_, kMaxPitch12kHz);
|
|
|
|
// Refine the pitch period estimation.
|
|
// The refinement is done using the pitch buffer that contains 24 kHz samples.
|
|
// Therefore, adapt the inverted lags in |pitch_candidates_inv_lags| from 12
|
|
// to 24 kHz.
|
|
for (size_t i = 0; i < pitch_candidates_inv_lags.size(); ++i)
|
|
pitch_candidates_inv_lags[i] *= 2;
|
|
size_t pitch_inv_lag_48kHz =
|
|
RefinePitchPeriod48kHz(pitch_buf, pitch_candidates_inv_lags);
|
|
// Look for stronger harmonics to find the final pitch period and its gain.
|
|
RTC_DCHECK_LT(pitch_inv_lag_48kHz, kMaxPitch48kHz);
|
|
last_pitch_48kHz_ = CheckLowerPitchPeriodsAndComputePitchGain(
|
|
pitch_buf, kMaxPitch48kHz - pitch_inv_lag_48kHz, last_pitch_48kHz_);
|
|
return last_pitch_48kHz_;
|
|
}
|
|
|
|
} // namespace rnn_vad
|
|
} // namespace webrtc
|