[ tor-browser ].git.dasho

noise_suppressor.cc (22353B)
      1 /*
      2 *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
      3 *
      4 *  Use of this source code is governed by a BSD-style license
      5 *  that can be found in the LICENSE file in the root of the source
      6 *  tree. An additional intellectual property rights grant can be found
      7 *  in the file PATENTS.  All contributing project authors may
      8 *  be found in the AUTHORS file in the root of the source tree.
      9 */
     10 
     11 #include "modules/audio_processing/ns/noise_suppressor.h"
     12 
     13 #include <algorithm>
     14 #include <array>
     15 #include <cmath>
     16 #include <cstdlib>
     17 #include <cstring>
     18 #include <memory>
     19 
     20 #include "api/array_view.h"
     21 #include "modules/audio_processing/audio_buffer.h"
     22 #include "modules/audio_processing/ns/fast_math.h"
     23 #include "modules/audio_processing/ns/ns_common.h"
     24 #include "modules/audio_processing/ns/ns_config.h"
     25 #include "modules/audio_processing/ns/suppression_params.h"
     26 #include "rtc_base/checks.h"
     27 
     28 namespace webrtc {
     29 
     30 namespace {
     31 
     32 // Maps sample rate to number of bands.
     33 size_t NumBandsForRate(size_t sample_rate_hz) {
     34  RTC_DCHECK(sample_rate_hz == 16000 || sample_rate_hz == 32000 ||
     35             sample_rate_hz == 48000);
     36  return sample_rate_hz / 16000;
     37 }
     38 
     39 // Maximum number of channels for which the channel data is stored on
     40 // the stack. If the number of channels are larger than this, they are stored
     41 // using scratch memory that is pre-allocated on the heap. The reason for this
     42 // partitioning is not to waste heap space for handling the more common numbers
     43 // of channels, while at the same time not limiting the support for higher
     44 // numbers of channels by enforcing the channel data to be stored on the
     45 // stack using a fixed maximum value.
     46 constexpr size_t kMaxNumChannelsOnStack = 2;
     47 
     48 // Chooses the number of channels to store on the heap when that is required due
     49 // to the number of channels being larger than the pre-defined number
     50 // of channels to store on the stack.
     51 size_t NumChannelsOnHeap(size_t num_channels) {
     52  return num_channels > kMaxNumChannelsOnStack ? num_channels : 0;
     53 }
     54 
     55 // Hybrib Hanning and flat window for the filterbank.
     56 constexpr std::array<float, 96> kBlocks160w256FirstHalf = {
     57    0.00000000f, 0.01636173f, 0.03271908f, 0.04906767f, 0.06540313f,
     58    0.08172107f, 0.09801714f, 0.11428696f, 0.13052619f, 0.14673047f,
     59    0.16289547f, 0.17901686f, 0.19509032f, 0.21111155f, 0.22707626f,
     60    0.24298018f, 0.25881905f, 0.27458862f, 0.29028468f, 0.30590302f,
     61    0.32143947f, 0.33688985f, 0.35225005f, 0.36751594f, 0.38268343f,
     62    0.39774847f, 0.41270703f, 0.42755509f, 0.44228869f, 0.45690388f,
     63    0.47139674f, 0.48576339f, 0.50000000f, 0.51410274f, 0.52806785f,
     64    0.54189158f, 0.55557023f, 0.56910015f, 0.58247770f, 0.59569930f,
     65    0.60876143f, 0.62166057f, 0.63439328f, 0.64695615f, 0.65934582f,
     66    0.67155895f, 0.68359230f, 0.69544264f, 0.70710678f, 0.71858162f,
     67    0.72986407f, 0.74095113f, 0.75183981f, 0.76252720f, 0.77301045f,
     68    0.78328675f, 0.79335334f, 0.80320753f, 0.81284668f, 0.82226822f,
     69    0.83146961f, 0.84044840f, 0.84920218f, 0.85772861f, 0.86602540f,
     70    0.87409034f, 0.88192126f, 0.88951608f, 0.89687274f, 0.90398929f,
     71    0.91086382f, 0.91749450f, 0.92387953f, 0.93001722f, 0.93590593f,
     72    0.94154407f, 0.94693013f, 0.95206268f, 0.95694034f, 0.96156180f,
     73    0.96592583f, 0.97003125f, 0.97387698f, 0.97746197f, 0.98078528f,
     74    0.98384601f, 0.98664333f, 0.98917651f, 0.99144486f, 0.99344778f,
     75    0.99518473f, 0.99665524f, 0.99785892f, 0.99879546f, 0.99946459f,
     76    0.99986614f};
     77 
     78 // Applies the filterbank window to a buffer.
     79 void ApplyFilterBankWindow(ArrayView<float, kFftSize> x) {
     80  for (size_t i = 0; i < 96; ++i) {
     81    x[i] = kBlocks160w256FirstHalf[i] * x[i];
     82  }
     83 
     84  for (size_t i = 161, k = 95; i < kFftSize; ++i, --k) {
     85    RTC_DCHECK_NE(0, k);
     86    x[i] = kBlocks160w256FirstHalf[k] * x[i];
     87  }
     88 }
     89 
     90 // Extends a frame with previous data.
     91 void FormExtendedFrame(ArrayView<const float, kNsFrameSize> frame,
     92                       ArrayView<float, kFftSize - kNsFrameSize> old_data,
     93                       ArrayView<float, kFftSize> extended_frame) {
     94  std::copy(old_data.begin(), old_data.end(), extended_frame.begin());
     95  std::copy(frame.begin(), frame.end(),
     96            extended_frame.begin() + old_data.size());
     97  std::copy(extended_frame.end() - old_data.size(), extended_frame.end(),
     98            old_data.begin());
     99 }
    100 
    101 // Uses overlap-and-add to produce an output frame.
    102 void OverlapAndAdd(ArrayView<const float, kFftSize> extended_frame,
    103                   ArrayView<float, kOverlapSize> overlap_memory,
    104                   ArrayView<float, kNsFrameSize> output_frame) {
    105  for (size_t i = 0; i < kOverlapSize; ++i) {
    106    output_frame[i] = overlap_memory[i] + extended_frame[i];
    107  }
    108  std::copy(extended_frame.begin() + kOverlapSize,
    109            extended_frame.begin() + kNsFrameSize,
    110            output_frame.begin() + kOverlapSize);
    111  std::copy(extended_frame.begin() + kNsFrameSize, extended_frame.end(),
    112            overlap_memory.begin());
    113 }
    114 
    115 // Produces a delayed frame.
    116 void DelaySignal(ArrayView<const float, kNsFrameSize> frame,
    117                 ArrayView<float, kFftSize - kNsFrameSize> delay_buffer,
    118                 ArrayView<float, kNsFrameSize> delayed_frame) {
    119  constexpr size_t kSamplesFromFrame = kNsFrameSize - (kFftSize - kNsFrameSize);
    120  std::copy(delay_buffer.begin(), delay_buffer.end(), delayed_frame.begin());
    121  std::copy(frame.begin(), frame.begin() + kSamplesFromFrame,
    122            delayed_frame.begin() + delay_buffer.size());
    123 
    124  std::copy(frame.begin() + kSamplesFromFrame, frame.end(),
    125            delay_buffer.begin());
    126 }
    127 
    128 // Computes the energy of an extended frame.
    129 float ComputeEnergyOfExtendedFrame(ArrayView<const float, kFftSize> x) {
    130  float energy = 0.f;
    131  for (float x_k : x) {
    132    energy += x_k * x_k;
    133  }
    134 
    135  return energy;
    136 }
    137 
    138 // Computes the energy of an extended frame based on its subcomponents.
    139 float ComputeEnergyOfExtendedFrame(
    140    ArrayView<const float, kNsFrameSize> frame,
    141    ArrayView<float, kFftSize - kNsFrameSize> old_data) {
    142  float energy = 0.f;
    143  for (float v : old_data) {
    144    energy += v * v;
    145  }
    146  for (float v : frame) {
    147    energy += v * v;
    148  }
    149 
    150  return energy;
    151 }
    152 
    153 // Computes the magnitude spectrum based on an FFT output.
    154 void ComputeMagnitudeSpectrum(
    155    ArrayView<const float, kFftSize> real,
    156    ArrayView<const float, kFftSize> imag,
    157    ArrayView<float, kFftSizeBy2Plus1> signal_spectrum) {
    158  signal_spectrum[0] = fabsf(real[0]) + 1.f;
    159  signal_spectrum[kFftSizeBy2Plus1 - 1] =
    160      fabsf(real[kFftSizeBy2Plus1 - 1]) + 1.f;
    161 
    162  for (size_t i = 1; i < kFftSizeBy2Plus1 - 1; ++i) {
    163    signal_spectrum[i] =
    164        SqrtFastApproximation(real[i] * real[i] + imag[i] * imag[i]) + 1.f;
    165  }
    166 }
    167 
    168 // Compute prior and post SNR.
    169 void ComputeSnr(ArrayView<const float, kFftSizeBy2Plus1> filter,
    170                ArrayView<const float> prev_signal_spectrum,
    171                ArrayView<const float> signal_spectrum,
    172                ArrayView<const float> prev_noise_spectrum,
    173                ArrayView<const float> noise_spectrum,
    174                ArrayView<float> prior_snr,
    175                ArrayView<float> post_snr) {
    176  for (size_t i = 0; i < kFftSizeBy2Plus1; ++i) {
    177    // Previous post SNR.
    178    // Previous estimate: based on previous frame with gain filter.
    179    float prev_estimate = prev_signal_spectrum[i] /
    180                          (prev_noise_spectrum[i] + 0.0001f) * filter[i];
    181    // Post SNR.
    182    if (signal_spectrum[i] > noise_spectrum[i]) {
    183      post_snr[i] = signal_spectrum[i] / (noise_spectrum[i] + 0.0001f) - 1.f;
    184    } else {
    185      post_snr[i] = 0.f;
    186    }
    187    // The directed decision estimate of the prior SNR is a sum the current and
    188    // previous estimates.
    189    prior_snr[i] = 0.98f * prev_estimate + (1.f - 0.98f) * post_snr[i];
    190  }
    191 }
    192 
    193 // Computes the attenuating gain for the noise suppression of the upper bands.
    194 float ComputeUpperBandsGain(
    195    float minimum_attenuating_gain,
    196    ArrayView<const float, kFftSizeBy2Plus1> filter,
    197    ArrayView<const float> speech_probability,
    198    ArrayView<const float, kFftSizeBy2Plus1> prev_analysis_signal_spectrum,
    199    ArrayView<const float, kFftSizeBy2Plus1> signal_spectrum) {
    200  // Average speech prob and filter gain for the end of the lowest band.
    201  constexpr int kNumAvgBins = 32;
    202  constexpr float kOneByNumAvgBins = 1.f / kNumAvgBins;
    203 
    204  float avg_prob_speech = 0.f;
    205  float avg_filter_gain = 0.f;
    206  for (size_t i = kFftSizeBy2Plus1 - kNumAvgBins - 1; i < kFftSizeBy2Plus1 - 1;
    207       i++) {
    208    avg_prob_speech += speech_probability[i];
    209    avg_filter_gain += filter[i];
    210  }
    211  avg_prob_speech = avg_prob_speech * kOneByNumAvgBins;
    212  avg_filter_gain = avg_filter_gain * kOneByNumAvgBins;
    213 
    214  // If the speech was suppressed by a component between Analyze and Process, an
    215  // example being by an AEC, it should not be considered speech for the purpose
    216  // of high band suppression. To that end, the speech probability is scaled
    217  // accordingly.
    218  float sum_analysis_spectrum = 0.f;
    219  float sum_processing_spectrum = 0.f;
    220  for (size_t i = 0; i < kFftSizeBy2Plus1; ++i) {
    221    sum_analysis_spectrum += prev_analysis_signal_spectrum[i];
    222    sum_processing_spectrum += signal_spectrum[i];
    223  }
    224 
    225  // The magnitude spectrum computation enforces the spectrum to be strictly
    226  // positive.
    227  RTC_DCHECK_GT(sum_analysis_spectrum, 0.f);
    228  avg_prob_speech *= sum_processing_spectrum / sum_analysis_spectrum;
    229 
    230  // Compute gain based on speech probability.
    231  float gain =
    232      0.5f * (1.f + static_cast<float>(tanh(2.f * avg_prob_speech - 1.f)));
    233 
    234  // Combine gain with low band gain.
    235  if (avg_prob_speech >= 0.5f) {
    236    gain = 0.25f * gain + 0.75f * avg_filter_gain;
    237  } else {
    238    gain = 0.5f * gain + 0.5f * avg_filter_gain;
    239  }
    240 
    241  // Make sure gain is within flooring range.
    242  return std::min(std::max(gain, minimum_attenuating_gain), 1.f);
    243 }
    244 
    245 }  // namespace
    246 
    247 NoiseSuppressor::ChannelState::ChannelState(
    248    const SuppressionParams& suppression_params,
    249    size_t num_bands)
    250    : wiener_filter(suppression_params),
    251      noise_estimator(suppression_params),
    252      process_delay_memory(num_bands > 1 ? num_bands - 1 : 0) {
    253  analyze_analysis_memory.fill(0.f);
    254  prev_analysis_signal_spectrum.fill(1.f);
    255  process_analysis_memory.fill(0.f);
    256  process_synthesis_memory.fill(0.f);
    257  for (auto& d : process_delay_memory) {
    258    d.fill(0.f);
    259  }
    260 }
    261 
    262 NoiseSuppressor::NoiseSuppressor(const NsConfig& config,
    263                                 size_t sample_rate_hz,
    264                                 size_t num_channels)
    265    : num_bands_(NumBandsForRate(sample_rate_hz)),
    266      num_channels_(num_channels),
    267      suppression_params_(config.target_level),
    268      filter_bank_states_heap_(NumChannelsOnHeap(num_channels_)),
    269      upper_band_gains_heap_(NumChannelsOnHeap(num_channels_)),
    270      energies_before_filtering_heap_(NumChannelsOnHeap(num_channels_)),
    271      gain_adjustments_heap_(NumChannelsOnHeap(num_channels_)),
    272      channels_(num_channels_) {
    273  for (size_t ch = 0; ch < num_channels_; ++ch) {
    274    channels_[ch] =
    275        std::make_unique<ChannelState>(suppression_params_, num_bands_);
    276  }
    277 }
    278 
    279 void NoiseSuppressor::AggregateWienerFilters(
    280    ArrayView<float, kFftSizeBy2Plus1> filter) const {
    281  ArrayView<const float, kFftSizeBy2Plus1> filter0 =
    282      channels_[0]->wiener_filter.get_filter();
    283  std::copy(filter0.begin(), filter0.end(), filter.begin());
    284 
    285  for (size_t ch = 1; ch < num_channels_; ++ch) {
    286    ArrayView<const float, kFftSizeBy2Plus1> filter_ch =
    287        channels_[ch]->wiener_filter.get_filter();
    288 
    289    for (size_t k = 0; k < kFftSizeBy2Plus1; ++k) {
    290      filter[k] = std::min(filter[k], filter_ch[k]);
    291    }
    292  }
    293 }
    294 
    295 void NoiseSuppressor::Analyze(const AudioBuffer& audio) {
    296  // Prepare the noise estimator for the analysis stage.
    297  for (size_t ch = 0; ch < num_channels_; ++ch) {
    298    channels_[ch]->noise_estimator.PrepareAnalysis();
    299  }
    300 
    301  // Check for zero frames.
    302  bool zero_frame = true;
    303  for (size_t ch = 0; ch < num_channels_; ++ch) {
    304    ArrayView<const float, kNsFrameSize> y_band0(
    305        &audio.split_bands_const(ch)[0][0], kNsFrameSize);
    306    float energy = ComputeEnergyOfExtendedFrame(
    307        y_band0, channels_[ch]->analyze_analysis_memory);
    308    if (energy > 0.f) {
    309      zero_frame = false;
    310      break;
    311    }
    312  }
    313 
    314  if (zero_frame) {
    315    // We want to avoid updating statistics in this case:
    316    // Updating feature statistics when we have zeros only will cause
    317    // thresholds to move towards zero signal situations. This in turn has the
    318    // effect that once the signal is "turned on" (non-zero values) everything
    319    // will be treated as speech and there is no noise suppression effect.
    320    // Depending on the duration of the inactive signal it takes a
    321    // considerable amount of time for the system to learn what is noise and
    322    // what is speech.
    323    return;
    324  }
    325 
    326  // Only update analysis counter for frames that are properly analyzed.
    327  if (++num_analyzed_frames_ < 0) {
    328    num_analyzed_frames_ = 0;
    329  }
    330 
    331  // Analyze all channels.
    332  for (size_t ch = 0; ch < num_channels_; ++ch) {
    333    std::unique_ptr<ChannelState>& ch_p = channels_[ch];
    334    ArrayView<const float, kNsFrameSize> y_band0(
    335        &audio.split_bands_const(ch)[0][0], kNsFrameSize);
    336 
    337    // Form an extended frame and apply analysis filter bank windowing.
    338    std::array<float, kFftSize> extended_frame;
    339    FormExtendedFrame(y_band0, ch_p->analyze_analysis_memory, extended_frame);
    340    ApplyFilterBankWindow(extended_frame);
    341 
    342    // Compute the magnitude spectrum.
    343    std::array<float, kFftSize> real;
    344    std::array<float, kFftSize> imag;
    345    fft_.Fft(extended_frame, real, imag);
    346 
    347    std::array<float, kFftSizeBy2Plus1> signal_spectrum;
    348    ComputeMagnitudeSpectrum(real, imag, signal_spectrum);
    349 
    350    // Compute energies.
    351    float signal_energy = 0.f;
    352    for (size_t i = 0; i < kFftSizeBy2Plus1; ++i) {
    353      signal_energy += real[i] * real[i] + imag[i] * imag[i];
    354    }
    355    signal_energy /= kFftSizeBy2Plus1;
    356 
    357    float signal_spectral_sum = 0.f;
    358    for (size_t i = 0; i < kFftSizeBy2Plus1; ++i) {
    359      signal_spectral_sum += signal_spectrum[i];
    360    }
    361 
    362    // Estimate the noise spectra and the probability estimates of speech
    363    // presence.
    364    ch_p->noise_estimator.PreUpdate(num_analyzed_frames_, signal_spectrum,
    365                                    signal_spectral_sum);
    366 
    367    std::array<float, kFftSizeBy2Plus1> post_snr;
    368    std::array<float, kFftSizeBy2Plus1> prior_snr;
    369    ComputeSnr(ch_p->wiener_filter.get_filter(),
    370               ch_p->prev_analysis_signal_spectrum, signal_spectrum,
    371               ch_p->noise_estimator.get_prev_noise_spectrum(),
    372               ch_p->noise_estimator.get_noise_spectrum(), prior_snr, post_snr);
    373 
    374    ch_p->speech_probability_estimator.Update(
    375        num_analyzed_frames_, prior_snr, post_snr,
    376        ch_p->noise_estimator.get_conservative_noise_spectrum(),
    377        signal_spectrum, signal_spectral_sum, signal_energy);
    378 
    379    ch_p->noise_estimator.PostUpdate(
    380        ch_p->speech_probability_estimator.get_probability(), signal_spectrum);
    381 
    382    // Store the magnitude spectrum to make it avalilable for the process
    383    // method.
    384    std::copy(signal_spectrum.begin(), signal_spectrum.end(),
    385              ch_p->prev_analysis_signal_spectrum.begin());
    386  }
    387 }
    388 
    389 void NoiseSuppressor::Process(AudioBuffer* audio) {
    390  // Select the space for storing data during the processing.
    391  std::array<FilterBankState, kMaxNumChannelsOnStack> filter_bank_states_stack;
    392  ArrayView<FilterBankState> filter_bank_states(filter_bank_states_stack.data(),
    393                                                num_channels_);
    394  std::array<float, kMaxNumChannelsOnStack> upper_band_gains_stack;
    395  ArrayView<float> upper_band_gains(upper_band_gains_stack.data(),
    396                                    num_channels_);
    397  std::array<float, kMaxNumChannelsOnStack> energies_before_filtering_stack;
    398  ArrayView<float> energies_before_filtering(
    399      energies_before_filtering_stack.data(), num_channels_);
    400  std::array<float, kMaxNumChannelsOnStack> gain_adjustments_stack;
    401  ArrayView<float> gain_adjustments(gain_adjustments_stack.data(),
    402                                    num_channels_);
    403  if (NumChannelsOnHeap(num_channels_) > 0) {
    404    // If the stack-allocated space is too small, use the heap for storing the
    405    // data.
    406    filter_bank_states = ArrayView<FilterBankState>(
    407        filter_bank_states_heap_.data(), num_channels_);
    408    upper_band_gains =
    409        ArrayView<float>(upper_band_gains_heap_.data(), num_channels_);
    410    energies_before_filtering =
    411        ArrayView<float>(energies_before_filtering_heap_.data(), num_channels_);
    412    gain_adjustments =
    413        ArrayView<float>(gain_adjustments_heap_.data(), num_channels_);
    414  }
    415 
    416  // Compute the suppression filters for all channels.
    417  for (size_t ch = 0; ch < num_channels_; ++ch) {
    418    // Form an extended frame and apply analysis filter bank windowing.
    419    ArrayView<float, kNsFrameSize> y_band0(&audio->split_bands(ch)[0][0],
    420                                           kNsFrameSize);
    421 
    422    FormExtendedFrame(y_band0, channels_[ch]->process_analysis_memory,
    423                      filter_bank_states[ch].extended_frame);
    424 
    425    ApplyFilterBankWindow(filter_bank_states[ch].extended_frame);
    426 
    427    energies_before_filtering[ch] =
    428        ComputeEnergyOfExtendedFrame(filter_bank_states[ch].extended_frame);
    429 
    430    // Perform filter bank analysis and compute the magnitude spectrum.
    431    fft_.Fft(filter_bank_states[ch].extended_frame, filter_bank_states[ch].real,
    432             filter_bank_states[ch].imag);
    433 
    434    std::array<float, kFftSizeBy2Plus1> signal_spectrum;
    435    ComputeMagnitudeSpectrum(filter_bank_states[ch].real,
    436                             filter_bank_states[ch].imag, signal_spectrum);
    437 
    438    // Compute the frequency domain gain filter for noise attenuation.
    439    channels_[ch]->wiener_filter.Update(
    440        num_analyzed_frames_,
    441        channels_[ch]->noise_estimator.get_noise_spectrum(),
    442        channels_[ch]->noise_estimator.get_prev_noise_spectrum(),
    443        channels_[ch]->noise_estimator.get_parametric_noise_spectrum(),
    444        signal_spectrum);
    445 
    446    if (num_bands_ > 1) {
    447      // Compute the time-domain gain for attenuating the noise in the upper
    448      // bands.
    449 
    450      upper_band_gains[ch] = ComputeUpperBandsGain(
    451          suppression_params_.minimum_attenuating_gain,
    452          channels_[ch]->wiener_filter.get_filter(),
    453          channels_[ch]->speech_probability_estimator.get_probability(),
    454          channels_[ch]->prev_analysis_signal_spectrum, signal_spectrum);
    455    }
    456  }
    457 
    458  // Only do the below processing if the output of the audio processing module
    459  // is used.
    460  if (!capture_output_used_) {
    461    return;
    462  }
    463 
    464  // Aggregate the Wiener filters for all channels.
    465  std::array<float, kFftSizeBy2Plus1> filter_data;
    466  ArrayView<const float, kFftSizeBy2Plus1> filter = filter_data;
    467  if (num_channels_ == 1) {
    468    filter = channels_[0]->wiener_filter.get_filter();
    469  } else {
    470    AggregateWienerFilters(filter_data);
    471  }
    472 
    473  for (size_t ch = 0; ch < num_channels_; ++ch) {
    474    // Apply the filter to the lower band.
    475    for (size_t i = 0; i < kFftSizeBy2Plus1; ++i) {
    476      filter_bank_states[ch].real[i] *= filter[i];
    477      filter_bank_states[ch].imag[i] *= filter[i];
    478    }
    479  }
    480 
    481  // Perform filter bank synthesis
    482  for (size_t ch = 0; ch < num_channels_; ++ch) {
    483    fft_.Ifft(filter_bank_states[ch].real, filter_bank_states[ch].imag,
    484              filter_bank_states[ch].extended_frame);
    485  }
    486 
    487  for (size_t ch = 0; ch < num_channels_; ++ch) {
    488    const float energy_after_filtering =
    489        ComputeEnergyOfExtendedFrame(filter_bank_states[ch].extended_frame);
    490 
    491    // Apply synthesis window.
    492    ApplyFilterBankWindow(filter_bank_states[ch].extended_frame);
    493 
    494    // Compute the adjustment of the noise attenuation filter based on the
    495    // effect of the attenuation.
    496    gain_adjustments[ch] =
    497        channels_[ch]->wiener_filter.ComputeOverallScalingFactor(
    498            num_analyzed_frames_,
    499            channels_[ch]->speech_probability_estimator.get_prior_probability(),
    500            energies_before_filtering[ch], energy_after_filtering);
    501  }
    502 
    503  // Select and apply adjustment of the noise attenuation filter based on the
    504  // effect of the attenuation.
    505  float gain_adjustment = gain_adjustments[0];
    506  for (size_t ch = 1; ch < num_channels_; ++ch) {
    507    gain_adjustment = std::min(gain_adjustment, gain_adjustments[ch]);
    508  }
    509  for (size_t ch = 0; ch < num_channels_; ++ch) {
    510    for (size_t i = 0; i < kFftSize; ++i) {
    511      filter_bank_states[ch].extended_frame[i] =
    512          gain_adjustment * filter_bank_states[ch].extended_frame[i];
    513    }
    514  }
    515 
    516  // Use overlap-and-add to form the output frame of the lowest band.
    517  for (size_t ch = 0; ch < num_channels_; ++ch) {
    518    ArrayView<float, kNsFrameSize> y_band0(&audio->split_bands(ch)[0][0],
    519                                           kNsFrameSize);
    520    OverlapAndAdd(filter_bank_states[ch].extended_frame,
    521                  channels_[ch]->process_synthesis_memory, y_band0);
    522  }
    523 
    524  if (num_bands_ > 1) {
    525    // Select the noise attenuating gain to apply to the upper band.
    526    float upper_band_gain = upper_band_gains[0];
    527    for (size_t ch = 1; ch < num_channels_; ++ch) {
    528      upper_band_gain = std::min(upper_band_gain, upper_band_gains[ch]);
    529    }
    530 
    531    // Process the upper bands.
    532    for (size_t ch = 0; ch < num_channels_; ++ch) {
    533      for (size_t b = 1; b < num_bands_; ++b) {
    534        // Delay the upper bands to match the delay of the filterbank applied to
    535        // the lowest band.
    536        ArrayView<float, kNsFrameSize> y_band(&audio->split_bands(ch)[b][0],
    537                                              kNsFrameSize);
    538        std::array<float, kNsFrameSize> delayed_frame;
    539        DelaySignal(y_band, channels_[ch]->process_delay_memory[b - 1],
    540                    delayed_frame);
    541 
    542        // Apply the time-domain noise-attenuating gain.
    543        for (size_t j = 0; j < kNsFrameSize; j++) {
    544          y_band[j] = upper_band_gain * delayed_frame[j];
    545        }
    546      }
    547    }
    548  }
    549 
    550  // Limit the output the allowed range.
    551  for (size_t ch = 0; ch < num_channels_; ++ch) {
    552    for (size_t b = 0; b < num_bands_; ++b) {
    553      ArrayView<float, kNsFrameSize> y_band(&audio->split_bands(ch)[b][0],
    554                                            kNsFrameSize);
    555      for (size_t j = 0; j < kNsFrameSize; j++) {
    556        y_band[j] = std::min(std::max(y_band[j], -32768.f), 32767.f);
    557      }
    558    }
    559  }
    560 }
    561 
    562 }  // namespace webrtc
	tor-browser The Tor Browser
	git clone https://git.dasho.dev/tor-browser.git
	Log \| Files \| Refs \| README \| LICENSE