modules/audio_processing/aec/echo_cancellation.cc - src.git - Git at Google

 /*
  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 /*
  * Contains the API functions for the AEC.
  */
 #include "modules/audio_processing/aec/echo_cancellation.h"

 #include <math.h>
 #include <stdlib.h>
 #include <string.h>

 extern "C" {
 #include "common_audio/ring_buffer.h"
 #include "common_audio/signal_processing/include/signal_processing_library.h"
 }
 #include "modules/audio_processing/aec/aec_core.h"
 #include "modules/audio_processing/aec/aec_resampler.h"
 #include "modules/audio_processing/logging/apm_data_dumper.h"
 #include "typedefs.h"  // NOLINT(build/include)

 namespace webrtc {

 Aec::Aec() = default;
 Aec::~Aec() = default;

 // Measured delays [ms]
 // Device                Chrome  GTP
 // MacBook Air           10
 // MacBook Retina        10      100
 // MacPro                30?
 //
 // Win7 Desktop          70      80?
 // Win7 T430s            110
 // Win8 T420s            70
 //
 // Daisy                 50
 // Pixel (w/ preproc?)           240
 // Pixel (w/o preproc?)  110     110

 // The extended filter mode gives us the flexibility to ignore the system's
 // reported delays. We do this for platforms which we believe provide results
 // which are incompatible with the AEC's expectations. Based on measurements
 // (some provided above) we set a conservative (i.e. lower than measured)
 // fixed delay.
 //
 // WEBRTC_UNTRUSTED_DELAY will only have an impact when |extended_filter_mode|
 // is enabled. See the note along with |DelayCorrection| in
 // echo_cancellation_impl.h for more details on the mode.
 //
 // Justification:
 // Chromium/Mac: Here, the true latency is so low (~10-20 ms), that it plays
 // havoc with the AEC's buffering. To avoid this, we set a fixed delay of 20 ms
 // and then compensate by rewinding by 10 ms (in wideband) through
 // kDelayDiffOffsetSamples. This trick does not seem to work for larger rewind
 // values, but fortunately this is sufficient.
 //
 // Chromium/Linux(ChromeOS): The values we get on this platform don't correspond
 // well to reality. The variance doesn't match the AEC's buffer changes, and the
 // bulk values tend to be too low. However, the range across different hardware
 // appears to be too large to choose a single value.
 //
 // GTP/Linux(ChromeOS): TBD, but for the moment we will trust the values.
 #if defined(WEBRTC_CHROMIUM_BUILD) && defined(WEBRTC_MAC)
 #define WEBRTC_UNTRUSTED_DELAY
 #endif

 #if defined(WEBRTC_UNTRUSTED_DELAY) && defined(WEBRTC_MAC)
 static const int kDelayDiffOffsetSamples = -160;
 #else
 // Not enabled for now.
 static const int kDelayDiffOffsetSamples = 0;
 #endif

 #if defined(WEBRTC_MAC)
 static const int kFixedDelayMs = 20;
 #else
 static const int kFixedDelayMs = 50;
 #endif
 #if !defined(WEBRTC_UNTRUSTED_DELAY)
 static const int kMinTrustedDelayMs = 20;
 #endif
 static const int kMaxTrustedDelayMs = 500;

 // Maximum length of resampled signal. Must be an integer multiple of frames
 // (ceil(1/(1 + MIN_SKEW)*2) + 1)*FRAME_LEN
 // The factor of 2 handles wb, and the + 1 is as a safety margin
 // TODO(bjornv): Replace with kResamplerBufferSize
 #define MAX_RESAMP_LEN (5 * FRAME_LEN)

 static const int kMaxBufSizeStart = 62;  // In partitions
 static const int sampMsNb = 8;           // samples per ms in nb
 static const int initCheck = 42;

 int Aec::instance_count = 0;

 // Estimates delay to set the position of the far-end buffer read pointer
 // (controlled by knownDelay)
 static void EstBufDelayNormal(Aec* aecInst);
 static void EstBufDelayExtended(Aec* aecInst);
 static int ProcessNormal(Aec* aecInst,
                          const float* const* nearend,
                          size_t num_bands,
                          float* const* out,
                          size_t num_samples,
                          int16_t reported_delay_ms,
                          int32_t skew);
 static void ProcessExtended(Aec* aecInst,
                             const float* const* nearend,
                             size_t num_bands,
                             float* const* out,
                             size_t num_samples,
                             int16_t reported_delay_ms,
                             int32_t skew);

 void* WebRtcAec_Create() {
   Aec* aecpc = new Aec();

   if (!aecpc) {
     return NULL;
   }
   aecpc->data_dumper.reset(new ApmDataDumper(aecpc->instance_count));

   aecpc->aec = WebRtcAec_CreateAec(aecpc->instance_count);
   if (!aecpc->aec) {
     WebRtcAec_Free(aecpc);
     return NULL;
   }
   aecpc->resampler = WebRtcAec_CreateResampler();
   if (!aecpc->resampler) {
     WebRtcAec_Free(aecpc);
     return NULL;
   }
   // Create far-end pre-buffer. The buffer size has to be large enough for
   // largest possible drift compensation (kResamplerBufferSize) + "almost" an
   // FFT buffer (PART_LEN2 - 1).
   aecpc->far_pre_buf =
       WebRtc_CreateBuffer(PART_LEN2 + kResamplerBufferSize, sizeof(float));
   if (!aecpc->far_pre_buf) {
     WebRtcAec_Free(aecpc);
     return NULL;
   }

   aecpc->initFlag = 0;

   aecpc->instance_count++;
   return aecpc;
 }

 void WebRtcAec_Free(void* aecInst) {
   Aec* aecpc = reinterpret_cast<Aec*>(aecInst);

   if (aecpc == NULL) {
     return;
   }

   WebRtc_FreeBuffer(aecpc->far_pre_buf);

   WebRtcAec_FreeAec(aecpc->aec);
   WebRtcAec_FreeResampler(aecpc->resampler);
   delete aecpc;
 }

 int32_t WebRtcAec_Init(void* aecInst, int32_t sampFreq, int32_t scSampFreq) {
   Aec* aecpc = reinterpret_cast<Aec*>(aecInst);
   aecpc->data_dumper->InitiateNewSetOfRecordings();
   AecConfig aecConfig;

   if (sampFreq != 8000 && sampFreq != 16000 && sampFreq != 32000 &&
       sampFreq != 48000) {
     return AEC_BAD_PARAMETER_ERROR;
   }
   aecpc->sampFreq = sampFreq;

   if (scSampFreq < 1 || scSampFreq > 96000) {
     return AEC_BAD_PARAMETER_ERROR;
   }
   aecpc->scSampFreq = scSampFreq;

   // Initialize echo canceller core
   if (WebRtcAec_InitAec(aecpc->aec, aecpc->sampFreq) == -1) {
     return AEC_UNSPECIFIED_ERROR;
   }

   if (WebRtcAec_InitResampler(aecpc->resampler, aecpc->scSampFreq) == -1) {
     return AEC_UNSPECIFIED_ERROR;
   }

   WebRtc_InitBuffer(aecpc->far_pre_buf);
   WebRtc_MoveReadPtr(aecpc->far_pre_buf, -PART_LEN);  // Start overlap.

   aecpc->initFlag = initCheck;  // indicates that initialization has been done

   if (aecpc->sampFreq == 32000 || aecpc->sampFreq == 48000) {
     aecpc->splitSampFreq = 16000;
   } else {
     aecpc->splitSampFreq = sampFreq;
   }

   aecpc->delayCtr = 0;
   aecpc->sampFactor = (aecpc->scSampFreq * 1.0f) / aecpc->splitSampFreq;
   // Sampling frequency multiplier (SWB is processed as 160 frame size).
   aecpc->rate_factor = aecpc->splitSampFreq / 8000;

   aecpc->sum = 0;
   aecpc->counter = 0;
   aecpc->checkBuffSize = 1;
   aecpc->firstVal = 0;

   // We skip the startup_phase completely (setting to 0) if DA-AEC is enabled,
   // but not extended_filter mode.
   aecpc->startup_phase = WebRtcAec_extended_filter_enabled(aecpc->aec) ||
                          !WebRtcAec_delay_agnostic_enabled(aecpc->aec);
   aecpc->bufSizeStart = 0;
   aecpc->checkBufSizeCtr = 0;
   aecpc->msInSndCardBuf = 0;
   aecpc->filtDelay = -1;  // -1 indicates an initialized state.
   aecpc->timeForDelayChange = 0;
   aecpc->knownDelay = 0;
   aecpc->lastDelayDiff = 0;

   aecpc->skewFrCtr = 0;
   aecpc->resample = kAecFalse;
   aecpc->highSkewCtr = 0;
   aecpc->skew = 0;

   aecpc->farend_started = 0;

   // Default settings.
   aecConfig.nlpMode = kAecNlpModerate;
   aecConfig.skewMode = kAecFalse;
   aecConfig.metricsMode = kAecFalse;
   aecConfig.delay_logging = kAecFalse;

   if (WebRtcAec_set_config(aecpc, aecConfig) == -1) {
     return AEC_UNSPECIFIED_ERROR;
   }

   return 0;
 }

 // Returns any error that is caused when buffering the
 // far-end signal.
 int32_t WebRtcAec_GetBufferFarendError(void* aecInst,
                                        const float* farend,
                                        size_t nrOfSamples) {
   Aec* aecpc = reinterpret_cast<Aec*>(aecInst);

   if (!farend)
     return AEC_NULL_POINTER_ERROR;

   if (aecpc->initFlag != initCheck)
     return AEC_UNINITIALIZED_ERROR;

   // number of samples == 160 for SWB input
   if (nrOfSamples != 80 && nrOfSamples != 160)
     return AEC_BAD_PARAMETER_ERROR;

   return 0;
 }

 // only buffer L band for farend
 int32_t WebRtcAec_BufferFarend(void* aecInst,
                                const float* farend,
                                size_t nrOfSamples) {
   Aec* aecpc = reinterpret_cast<Aec*>(aecInst);
   size_t newNrOfSamples = nrOfSamples;
   float new_farend[MAX_RESAMP_LEN];
   const float* farend_ptr = farend;

   // Get any error caused by buffering the farend signal.
   int32_t error_code =
       WebRtcAec_GetBufferFarendError(aecInst, farend, nrOfSamples);

   if (error_code != 0)
     return error_code;

   if (aecpc->skewMode == kAecTrue && aecpc->resample == kAecTrue) {
     // Resample and get a new number of samples
     WebRtcAec_ResampleLinear(aecpc->resampler, farend, nrOfSamples, aecpc->skew,
                              new_farend, &newNrOfSamples);
     farend_ptr = new_farend;
   }

   aecpc->farend_started = 1;
   WebRtcAec_SetSystemDelay(aecpc->aec, WebRtcAec_system_delay(aecpc->aec) +
                            static_cast<int>(newNrOfSamples));

   // Write the time-domain data to |far_pre_buf|.
   WebRtc_WriteBuffer(aecpc->far_pre_buf, farend_ptr, newNrOfSamples);

   // TODO(minyue): reduce to |PART_LEN| samples for each buffering.
   while (WebRtc_available_read(aecpc->far_pre_buf) >= PART_LEN2) {
     // We have enough data to pass to the FFT, hence read PART_LEN2 samples.
     {
       float* ptmp = NULL;
       float tmp[PART_LEN2];
       WebRtc_ReadBuffer(aecpc->far_pre_buf,
                         reinterpret_cast<void**>(&ptmp), tmp, PART_LEN2);
       WebRtcAec_BufferFarendBlock(aecpc->aec, &ptmp[PART_LEN]);
     }

     // Rewind |far_pre_buf| PART_LEN samples for overlap before continuing.
     WebRtc_MoveReadPtr(aecpc->far_pre_buf, -PART_LEN);
   }

   return 0;
 }

 int32_t WebRtcAec_Process(void* aecInst,
                           const float* const* nearend,
                           size_t num_bands,
                           float* const* out,
                           size_t nrOfSamples,
                           int16_t msInSndCardBuf,
                           int32_t skew) {
   Aec* aecpc = reinterpret_cast<Aec*>(aecInst);
   int32_t retVal = 0;

   if (out == NULL) {
     return AEC_NULL_POINTER_ERROR;
   }

   if (aecpc->initFlag != initCheck) {
     return AEC_UNINITIALIZED_ERROR;
   }

   // number of samples == 160 for SWB input
   if (nrOfSamples != 80 && nrOfSamples != 160) {
     return AEC_BAD_PARAMETER_ERROR;
   }

   if (msInSndCardBuf < 0) {
     msInSndCardBuf = 0;
     retVal = AEC_BAD_PARAMETER_WARNING;
   } else if (msInSndCardBuf > kMaxTrustedDelayMs) {
     // The clamping is now done in ProcessExtended/Normal().
     retVal = AEC_BAD_PARAMETER_WARNING;
   }

   // This returns the value of aec->extended_filter_enabled.
   if (WebRtcAec_extended_filter_enabled(aecpc->aec)) {
     ProcessExtended(aecpc, nearend, num_bands, out, nrOfSamples, msInSndCardBuf,
                     skew);
   } else {
     retVal = ProcessNormal(aecpc, nearend, num_bands, out, nrOfSamples,
                            msInSndCardBuf, skew);
   }

   int far_buf_size_samples = WebRtcAec_system_delay(aecpc->aec);
   aecpc->data_dumper->DumpRaw("aec_system_delay", 1, &far_buf_size_samples);
   aecpc->data_dumper->DumpRaw("aec_known_delay", 1, &aecpc->knownDelay);

   return retVal;
 }

 int WebRtcAec_set_config(void* handle, AecConfig config) {
   Aec* self = reinterpret_cast<Aec*>(handle);
   if (self->initFlag != initCheck) {
     return AEC_UNINITIALIZED_ERROR;
   }

   if (config.skewMode != kAecFalse && config.skewMode != kAecTrue) {
     return AEC_BAD_PARAMETER_ERROR;
   }
   self->skewMode = config.skewMode;

   if (config.nlpMode != kAecNlpConservative &&
       config.nlpMode != kAecNlpModerate &&
       config.nlpMode != kAecNlpAggressive) {
     return AEC_BAD_PARAMETER_ERROR;
   }

   if (config.metricsMode != kAecFalse && config.metricsMode != kAecTrue) {
     return AEC_BAD_PARAMETER_ERROR;
   }

   if (config.delay_logging != kAecFalse && config.delay_logging != kAecTrue) {
     return AEC_BAD_PARAMETER_ERROR;
   }

   WebRtcAec_SetConfigCore(self->aec, config.nlpMode, config.metricsMode,
                           config.delay_logging);
   return 0;
 }

 int WebRtcAec_get_echo_status(void* handle, int* status) {
   Aec* self = reinterpret_cast<Aec*>(handle);
   if (status == NULL) {
     return AEC_NULL_POINTER_ERROR;
   }
   if (self->initFlag != initCheck) {
     return AEC_UNINITIALIZED_ERROR;
   }

   *status = WebRtcAec_echo_state(self->aec);

   return 0;
 }

 int WebRtcAec_GetMetrics(void* handle, AecMetrics* metrics) {
   const float kUpWeight = 0.7f;
   float dtmp;
   int stmp;
   Aec* self = reinterpret_cast<Aec*>(handle);
   Stats erl;
   Stats erle;
   Stats a_nlp;

   if (handle == NULL) {
     return -1;
   }
   if (metrics == NULL) {
     return AEC_NULL_POINTER_ERROR;
   }
   if (self->initFlag != initCheck) {
     return AEC_UNINITIALIZED_ERROR;
   }

   WebRtcAec_GetEchoStats(self->aec, &erl, &erle, &a_nlp,
                          &metrics->divergent_filter_fraction);

   // ERL
   metrics->erl.instant = static_cast<int>(erl.instant);

   if ((erl.himean > kOffsetLevel) && (erl.average > kOffsetLevel)) {
     // Use a mix between regular average and upper part average.
     dtmp = kUpWeight * erl.himean + (1 - kUpWeight) * erl.average;
     metrics->erl.average = static_cast<int>(dtmp);
   } else {
     metrics->erl.average = kOffsetLevel;
   }

   metrics->erl.max = static_cast<int>(erl.max);

   if (erl.min < (kOffsetLevel * (-1))) {
     metrics->erl.min = static_cast<int>(erl.min);
   } else {
     metrics->erl.min = kOffsetLevel;
   }

   // ERLE
   metrics->erle.instant = static_cast<int>(erle.instant);

   if ((erle.himean > kOffsetLevel) && (erle.average > kOffsetLevel)) {
     // Use a mix between regular average and upper part average.
     dtmp = kUpWeight * erle.himean + (1 - kUpWeight) * erle.average;
     metrics->erle.average = static_cast<int>(dtmp);
   } else {
     metrics->erle.average = kOffsetLevel;
   }

   metrics->erle.max = static_cast<int>(erle.max);

   if (erle.min < (kOffsetLevel * (-1))) {
     metrics->erle.min = static_cast<int>(erle.min);
   } else {
     metrics->erle.min = kOffsetLevel;
   }

   // RERL
   if ((metrics->erl.average > kOffsetLevel) &&
       (metrics->erle.average > kOffsetLevel)) {
     stmp = metrics->erl.average + metrics->erle.average;
   } else {
     stmp = kOffsetLevel;
   }
   metrics->rerl.average = stmp;

   // No other statistics needed, but returned for completeness.
   metrics->rerl.instant = stmp;
   metrics->rerl.max = stmp;
   metrics->rerl.min = stmp;

   // A_NLP
   metrics->aNlp.instant = static_cast<int>(a_nlp.instant);

   if ((a_nlp.himean > kOffsetLevel) && (a_nlp.average > kOffsetLevel)) {
     // Use a mix between regular average and upper part average.
     dtmp = kUpWeight * a_nlp.himean + (1 - kUpWeight) * a_nlp.average;
     metrics->aNlp.average = static_cast<int>(dtmp);
   } else {
     metrics->aNlp.average = kOffsetLevel;
   }

   metrics->aNlp.max = static_cast<int>(a_nlp.max);

   if (a_nlp.min < (kOffsetLevel * (-1))) {
     metrics->aNlp.min = static_cast<int>(a_nlp.min);
   } else {
     metrics->aNlp.min = kOffsetLevel;
   }

   return 0;
 }

 int WebRtcAec_GetDelayMetrics(void* handle,
                               int* median,
                               int* std,
                               float* fraction_poor_delays) {
   Aec* self = reinterpret_cast<Aec*>(handle);
   if (median == NULL) {
     return AEC_NULL_POINTER_ERROR;
   }
   if (std == NULL) {
     return AEC_NULL_POINTER_ERROR;
   }
   if (self->initFlag != initCheck) {
     return AEC_UNINITIALIZED_ERROR;
   }
   if (WebRtcAec_GetDelayMetricsCore(self->aec, median, std,
                                     fraction_poor_delays) == -1) {
     // Logging disabled.
     return AEC_UNSUPPORTED_FUNCTION_ERROR;
   }

   return 0;
 }

 AecCore* WebRtcAec_aec_core(void* handle) {
   if (!handle) {
     return NULL;
   }
   return reinterpret_cast<Aec*>(handle)->aec;
 }

 static int ProcessNormal(Aec* aecInst,
                          const float* const* nearend,
                          size_t num_bands,
                          float* const* out,
                          size_t num_samples,
                          int16_t reported_delay_ms,
                          int32_t skew) {
   int retVal = 0;
   size_t i;
   size_t nBlocks10ms;
   // Limit resampling to doubling/halving of signal
   const float minSkewEst = -0.5f;
   const float maxSkewEst = 1.0f;

   reported_delay_ms =
       reported_delay_ms > kMaxTrustedDelayMs ? kMaxTrustedDelayMs :
       reported_delay_ms;
   // TODO(andrew): we need to investigate if this +10 is really wanted.
   reported_delay_ms += 10;
   aecInst->msInSndCardBuf = reported_delay_ms;

   if (aecInst->skewMode == kAecTrue) {
     if (aecInst->skewFrCtr < 25) {
       aecInst->skewFrCtr++;
     } else {
       retVal = WebRtcAec_GetSkew(aecInst->resampler, skew, &aecInst->skew);
       if (retVal == -1) {
         aecInst->skew = 0;
         retVal = AEC_BAD_PARAMETER_WARNING;
       }

       aecInst->skew /= aecInst->sampFactor * num_samples;

       if (aecInst->skew < 1.0e-3 && aecInst->skew > -1.0e-3) {
         aecInst->resample = kAecFalse;
       } else {
         aecInst->resample = kAecTrue;
       }

       if (aecInst->skew < minSkewEst) {
         aecInst->skew = minSkewEst;
       } else if (aecInst->skew > maxSkewEst) {
         aecInst->skew = maxSkewEst;
       }

       aecInst->data_dumper->DumpRaw("aec_skew", 1, &aecInst->skew);
     }
   }

   nBlocks10ms = num_samples / (FRAME_LEN * aecInst->rate_factor);

   if (aecInst->startup_phase) {
     for (i = 0; i < num_bands; ++i) {
       // Only needed if they don't already point to the same place.
       if (nearend[i] != out[i]) {
         memcpy(out[i], nearend[i], sizeof(nearend[i][0]) * num_samples);
       }
     }

     // The AEC is in the start up mode
     // AEC is disabled until the system delay is OK

     // Mechanism to ensure that the system delay is reasonably stable.
     if (aecInst->checkBuffSize) {
       aecInst->checkBufSizeCtr++;
       // Before we fill up the far-end buffer we require the system delay
       // to be stable (+/-8 ms) compared to the first value. This
       // comparison is made during the following 6 consecutive 10 ms
       // blocks. If it seems to be stable then we start to fill up the
       // far-end buffer.
       if (aecInst->counter == 0) {
         aecInst->firstVal = aecInst->msInSndCardBuf;
         aecInst->sum = 0;
       }

       if (abs(aecInst->firstVal - aecInst->msInSndCardBuf) <
           WEBRTC_SPL_MAX(0.2 * aecInst->msInSndCardBuf, sampMsNb)) {
         aecInst->sum += aecInst->msInSndCardBuf;
         aecInst->counter++;
       } else {
         aecInst->counter = 0;
       }

       if (aecInst->counter * nBlocks10ms >= 6) {
         // The far-end buffer size is determined in partitions of
         // PART_LEN samples. Use 75% of the average value of the system
         // delay as buffer size to start with.
         aecInst->bufSizeStart =
             WEBRTC_SPL_MIN((3 * aecInst->sum * aecInst->rate_factor * 8) /
                                (4 * aecInst->counter * PART_LEN),
                            kMaxBufSizeStart);
         // Buffer size has now been determined.
         aecInst->checkBuffSize = 0;
       }

       if (aecInst->checkBufSizeCtr * nBlocks10ms > 50) {
         // For really bad systems, don't disable the echo canceller for
         // more than 0.5 sec.
         aecInst->bufSizeStart = WEBRTC_SPL_MIN(
             (aecInst->msInSndCardBuf * aecInst->rate_factor * 3) / 40,
             kMaxBufSizeStart);
         aecInst->checkBuffSize = 0;
       }
     }

     // If |checkBuffSize| changed in the if-statement above.
     if (!aecInst->checkBuffSize) {
       // The system delay is now reasonably stable (or has been unstable
       // for too long). When the far-end buffer is filled with
       // approximately the same amount of data as reported by the system
       // we end the startup phase.
       int overhead_elements =
           WebRtcAec_system_delay(aecInst->aec) / PART_LEN -
           aecInst->bufSizeStart;
       if (overhead_elements == 0) {
         // Enable the AEC
         aecInst->startup_phase = 0;
       } else if (overhead_elements > 0) {
         // TODO(bjornv): Do we need a check on how much we actually
         // moved the read pointer? It should always be possible to move
         // the pointer |overhead_elements| since we have only added data
         // to the buffer and no delay compensation nor AEC processing
         // has been done.
         WebRtcAec_AdjustFarendBufferSizeAndSystemDelay(aecInst->aec,
                                                        overhead_elements);

         // Enable the AEC
         aecInst->startup_phase = 0;
       }
     }
   } else {
     // AEC is enabled.
     EstBufDelayNormal(aecInst);

     // Call the AEC.
     // TODO(bjornv): Re-structure such that we don't have to pass
     // |aecInst->knownDelay| as input. Change name to something like
     // |system_buffer_diff|.
     WebRtcAec_ProcessFrames(aecInst->aec, nearend, num_bands, num_samples,
                             aecInst->knownDelay, out);
   }

   return retVal;
 }

 static void ProcessExtended(Aec* self,
                             const float* const* near,
                             size_t num_bands,
                             float* const* out,
                             size_t num_samples,
                             int16_t reported_delay_ms,
                             int32_t skew) {
   size_t i;
   const int delay_diff_offset = kDelayDiffOffsetSamples;
   RTC_DCHECK(num_samples == 80 || num_samples == 160);
 #if defined(WEBRTC_UNTRUSTED_DELAY)
   reported_delay_ms = kFixedDelayMs;
 #else
   // This is the usual mode where we trust the reported system delay values.
   // Due to the longer filter, we no longer add 10 ms to the reported delay
   // to reduce chance of non-causality. Instead we apply a minimum here to avoid
   // issues with the read pointer jumping around needlessly.
   reported_delay_ms = reported_delay_ms < kMinTrustedDelayMs
                           ? kMinTrustedDelayMs
                           : reported_delay_ms;
   // If the reported delay appears to be bogus, we attempt to recover by using
   // the measured fixed delay values. We use >= here because higher layers
   // may already clamp to this maximum value, and we would otherwise not
   // detect it here.
   reported_delay_ms = reported_delay_ms >= kMaxTrustedDelayMs
                           ? kFixedDelayMs
                           : reported_delay_ms;
 #endif
   self->msInSndCardBuf = reported_delay_ms;

   if (!self->farend_started) {
     for (i = 0; i < num_bands; ++i) {
       // Only needed if they don't already point to the same place.
       if (near[i] != out[i]) {
         memcpy(out[i], near[i], sizeof(near[i][0]) * num_samples);
       }
     }
     return;
   }
   if (self->startup_phase) {
     // In the extended mode, there isn't a startup "phase", just a special
     // action on the first frame. In the trusted delay case, we'll take the
     // current reported delay, unless it's less then our conservative
     // measurement.
     int startup_size_ms =
         reported_delay_ms < kFixedDelayMs ? kFixedDelayMs : reported_delay_ms;
 #if defined(WEBRTC_ANDROID)
     int target_delay = startup_size_ms * self->rate_factor * 8;
 #else
     // To avoid putting the AEC in a non-causal state we're being slightly
     // conservative and scale by 2. On Android we use a fixed delay and
     // therefore there is no need to scale the target_delay.
     int target_delay = startup_size_ms * self->rate_factor * 8 / 2;
 #endif
     int overhead_elements =
         (WebRtcAec_system_delay(self->aec) - target_delay) / PART_LEN;
     WebRtcAec_AdjustFarendBufferSizeAndSystemDelay(self->aec,
                                                    overhead_elements);
     self->startup_phase = 0;
   }

   EstBufDelayExtended(self);

   {
     // |delay_diff_offset| gives us the option to manually rewind the delay on
     // very low delay platforms which can't be expressed purely through
     // |reported_delay_ms|.
     const int adjusted_known_delay =
         WEBRTC_SPL_MAX(0, self->knownDelay + delay_diff_offset);

     WebRtcAec_ProcessFrames(self->aec, near, num_bands, num_samples,
                             adjusted_known_delay, out);
   }
 }

 static void EstBufDelayNormal(Aec* aecInst) {
   int nSampSndCard = aecInst->msInSndCardBuf * sampMsNb * aecInst->rate_factor;
   int current_delay = nSampSndCard - WebRtcAec_system_delay(aecInst->aec);
   int delay_difference = 0;

   // Before we proceed with the delay estimate filtering we:
   // 1) Compensate for the frame that will be read.
   // 2) Compensate for drift resampling.
   // 3) Compensate for non-causality if needed, since the estimated delay can't
   //    be negative.

   // 1) Compensating for the frame(s) that will be read/processed.
   current_delay += FRAME_LEN * aecInst->rate_factor;

   // 2) Account for resampling frame delay.
   if (aecInst->skewMode == kAecTrue && aecInst->resample == kAecTrue) {
     current_delay -= kResamplingDelay;
   }

   // 3) Compensate for non-causality, if needed, by flushing one block.
   if (current_delay < PART_LEN) {
     current_delay +=
         WebRtcAec_AdjustFarendBufferSizeAndSystemDelay(aecInst->aec, 1) *
         PART_LEN;
   }

   // We use -1 to signal an initialized state in the "extended" implementation;
   // compensate for that.
   aecInst->filtDelay = aecInst->filtDelay < 0 ? 0 : aecInst->filtDelay;
   aecInst->filtDelay =
       WEBRTC_SPL_MAX(0, static_cast<int16_t>(0.8 *
                                              aecInst->filtDelay +
                                              0.2 * current_delay));

   delay_difference = aecInst->filtDelay - aecInst->knownDelay;
   if (delay_difference > 224) {
     if (aecInst->lastDelayDiff < 96) {
       aecInst->timeForDelayChange = 0;
     } else {
       aecInst->timeForDelayChange++;
     }
   } else if (delay_difference < 96 && aecInst->knownDelay > 0) {
     if (aecInst->lastDelayDiff > 224) {
       aecInst->timeForDelayChange = 0;
     } else {
       aecInst->timeForDelayChange++;
     }
   } else {
     aecInst->timeForDelayChange = 0;
   }
   aecInst->lastDelayDiff = delay_difference;

   if (aecInst->timeForDelayChange > 25) {
     aecInst->knownDelay = WEBRTC_SPL_MAX((int)aecInst->filtDelay - 160, 0);
   }
 }

 static void EstBufDelayExtended(Aec* aecInst) {
   int reported_delay = aecInst->msInSndCardBuf * sampMsNb *
       aecInst->rate_factor;
   int current_delay = reported_delay - WebRtcAec_system_delay(aecInst->aec);
   int delay_difference = 0;

   // Before we proceed with the delay estimate filtering we:
   // 1) Compensate for the frame that will be read.
   // 2) Compensate for drift resampling.
   // 3) Compensate for non-causality if needed, since the estimated delay can't
   //    be negative.

   // 1) Compensating for the frame(s) that will be read/processed.
   current_delay += FRAME_LEN * aecInst->rate_factor;

   // 2) Account for resampling frame delay.
   if (aecInst->skewMode == kAecTrue && aecInst->resample == kAecTrue) {
     current_delay -= kResamplingDelay;
   }

   // 3) Compensate for non-causality, if needed, by flushing two blocks.
   if (current_delay < PART_LEN) {
     current_delay +=
         WebRtcAec_AdjustFarendBufferSizeAndSystemDelay(aecInst->aec, 2) *
         PART_LEN;
   }

   if (aecInst->filtDelay == -1) {
     aecInst->filtDelay = WEBRTC_SPL_MAX(0, 0.5 * current_delay);
   } else {
     aecInst->filtDelay = WEBRTC_SPL_MAX(
         0, static_cast<int16_t>(0.95 * aecInst->filtDelay + 0.05 *
                                 current_delay));
   }

   delay_difference = aecInst->filtDelay - aecInst->knownDelay;
   if (delay_difference > 384) {
     if (aecInst->lastDelayDiff < 128) {
       aecInst->timeForDelayChange = 0;
     } else {
       aecInst->timeForDelayChange++;
     }
   } else if (delay_difference < 128 && aecInst->knownDelay > 0) {
     if (aecInst->lastDelayDiff > 384) {
       aecInst->timeForDelayChange = 0;
     } else {
       aecInst->timeForDelayChange++;
     }
   } else {
     aecInst->timeForDelayChange = 0;
   }
   aecInst->lastDelayDiff = delay_difference;

   if (aecInst->timeForDelayChange > 25) {
     aecInst->knownDelay = WEBRTC_SPL_MAX((int)aecInst->filtDelay - 256, 0);
   }
 }
 }  // namespace webrtc