// Extracted from: arduino-audio-tools/_m_d_f_echo_cancellation_8h_source.html

/* Copyright (C) 2003-2008 Jean-Marc Valin

 * Copyright (C) 2024 Phil Schatzmann (Header-only adaptation)

 *

 * Echo canceller based on the MDF algorithm

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright

 * notice, this list of conditions and the following disclaimer in the

 * documentation and/or other materials provided with the distribution.

 *

 * 3. The name of the author may not be used to endorse or promote products

 * derived from this software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR

 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES

 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

 * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,

 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR

 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)

 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,

 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN

 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 */


#pragma once


#include <algorithm>

#include <cmath>

#include <cstdint>

#include <cstdlib>

#include <cstring>

#include <vector>


#include "MDFEchoCancellationConfig.h"

#include "AudioTools/AudioLibs/AudioFFT.h"


// Control requests: request codes accepted by MDFEchoCancellation::control().
// The void* argument of control() is interpreted per request as noted below.

// Writes the frame size to the pointed-to int.
#define ECHO_GET_FRAME_SIZE 3

// Reads the new sampling rate from the pointed-to int and recomputes the
// rate-dependent settings (spec_average, beta0, beta_max, notch_radius).
#define ECHO_SET_SAMPLING_RATE 24

// Writes the current sampling rate to the pointed-to int.
#define ECHO_GET_SAMPLING_RATE 25

// Writes M * frame_size to the pointed-to echo_int32_t.
#define ECHO_GET_IMPULSE_RESPONSE_SIZE 27

// Writes M * frame_size echo_int32_t values to the pointed-to array.
#define ECHO_GET_IMPULSE_RESPONSE 29


// Arithmetic helper macros. Two alternative sets are provided, selected by
// FIXED_POINT: without it the macros expand to plain C++ arithmetic, with it
// the pseudo-float macros forward to the echo_float_* helper functions.

// Helper macros for floating point mode

#ifndef FIXED_POINT

// Pseudo-float operations: expand directly to built-in operators.

#define PSEUDOFLOAT(x) (x)

#define FLOAT_MULT(a, b) ((a) * (b))

#define FLOAT_AMULT(a, b) ((a) * (b))

#define FLOAT_MUL32(a, b) ((a) * (b))

#define FLOAT_DIV32(a, b) ((a) / (b))

#define FLOAT_EXTRACT16(a) (a)

#define FLOAT_EXTRACT32(a) (a)

#define FLOAT_ADD(a, b) ((a) + (b))

#define FLOAT_SUB(a, b) ((a) - (b))

#define FLOAT_DIV32_FLOAT(a, b) ((a) / (b))

#define FLOAT_MUL32U(a, b) ((a) * (b))

// The shift amount is ignored in this mode; the value is returned unchanged.

#define FLOAT_SHL(a, b) (a)

#define FLOAT_LT(a, b) ((a) < (b))

#define FLOAT_GT(a, b) ((a) > (b))

#define FLOAT_DIVU(a, b) ((a) / (b))

#define FLOAT_SQRT(a) (sqrtf(a))


// Math operation macros for floating point

#define ABS(x) (((x) < 0) ? (-(x)) : (x))

#define ABS16(x) (((x) < 0) ? (-(x)) : (x))

#define ABS32(x) (((x) < 0) ? (-(x)) : (x))

#define MIN16(a, b) ((a) < (b) ? (a) : (b))

#define MAX16(a, b) ((a) > (b) ? (a) : (b))

#define MIN32(a, b) ((a) < (b) ? (a) : (b))

#define MAX32(a, b) ((a) > (b) ? (a) : (b))


// Q-format constants, shifts and saturation are no-ops in this mode: the
// "bits", "shift" and saturation-limit arguments are ignored.

#define QCONST16(x, bits) (x)

#define QCONST32(x, bits) (x)

#define NEG16(x) (-(x))

#define NEG32(x) (-(x))

#define EXTRACT16(x) (x)

#define EXTEND32(x) (x)

#define SHR16(a, shift) (a)

#define SHL16(a, shift) (a)

#define SHR32(a, shift) (a)

#define SHL32(a, shift) (a)

#define PSHR16(a, shift) (a)

#define PSHR32(a, shift) (a)

#define VSHR32(a, shift) (a)

#define SATURATE16(x, a) (x)

#define SATURATE32(x, a) (x)

#define ADD16(a, b) ((a) + (b))

#define SUB16(a, b) ((a) - (b))

#define ADD32(a, b) ((a) + (b))

#define SUB32(a, b) ((a) - (b))

// Multiplications; the Q/P-suffixed variants apply no scaling in this mode.

#define MULT16_16(a, b) ((echo_word32_t)(a) * (echo_word32_t)(b))

#define MAC16_16(c, a, b) ((c) + (echo_word32_t)(a) * (echo_word32_t)(b))

#define MULT16_32_Q15(a, b) ((a) * (b))

#define MULT16_16_P15(a, b) ((a) * (b))

#define MULT16_32_P15(a, b) ((a) * (b))

#define MULT16_16_Q15(a, b) ((a) * (b))

#define DIV32_16(a, b) (((echo_word32_t)(a)) / (echo_word16_t)(b))

#define DIV32(a, b) (((echo_word32_t)(a)) / (echo_word32_t)(b))

// Rounds to the nearest integer and clamps the result to [-32768, 32767].

#define WORD2INT(x) \

  ((x) < -32767.5f  \

       ? -32768     \

       : ((x) > 32766.5f ? 32767 : (echo_int16_t)floorf(.5f + (x))))

#define MULT16_16_Q14(a, b) ((a) * (b))

#define MULT16_16_Q13(a, b) ((a) * (b))

#define MULT16_16_P13(a, b) ((a) * (b))

#define MULT16_16_P14(a, b) ((a) * (b))

#define MULT16_32_Q14(a, b) ((a) * (b))

#define MAC16_32_Q15(c, a, b) ((c) + (a) * (b))


#define TOP16(x) (x)

#define WEIGHT_SHIFT 0


#else

// Fixed-point mode macros: each pseudo-float operation forwards to the
// echo_float_* helper function of the same name.

#define PSEUDOFLOAT(x) (echo_float_from_double(x))

#define FLOAT_MULT(a, b) (echo_float_mult(a, b))

#define FLOAT_MUL32U(a, b) (echo_float_mul32_u(a, b))

#define FLOAT_ADD(a, b) (echo_float_add(a, b))

#define FLOAT_SUB(a, b) (echo_float_sub(a, b))

#define FLOAT_LT(a, b) (echo_float_lt(a, b))

#define FLOAT_GT(a, b) (echo_float_gt(a, b))

#define FLOAT_DIVU(a, b) (echo_float_divu(a, b))

#define FLOAT_SQRT(a) (echo_float_sqrt(a))

#define FLOAT_EXTRACT16(a) (echo_float_extract16(a))

#define FLOAT_SHL(a, b) (echo_float_shl(a, b))


// Math operation macros (same for fixed-point)

#define ABS(x) (((x) < 0) ? (-(x)) : (x))

#define ABS16(x) (((x) < 0) ? (-(x)) : (x))

#define ABS32(x) (((x) < 0) ? (-(x)) : (x))

#define MIN16(a, b) ((a) < (b) ? (a) : (b))

#define MAX16(a, b) ((a) > (b) ? (a) : (b))

#define MIN32(a, b) ((a) < (b) ? (a) : (b))

#define MAX32(a, b) ((a) > (b) ? (a) : (b))


// Rounds to the nearest integer and clamps the result to [-32768, 32767].

#define WORD2INT(x) \

  ((x) < -32767.5f  \

       ? -32768     \

       : ((x) > 32766.5f ? 32767 : (echo_int16_t)floorf(.5f + (x))))


#define TOP16(x) (x)

#define WEIGHT_SHIFT 0


#endif  // !FIXED_POINT


// Types and helpers of the echo canceller live in the audio_tools namespace

namespace audio_tools {


// Type definitions (must be before echo_float_t struct)

// Fixed-width integer aliases used for PCM samples and counters.
using echo_int16_t = int16_t;
using echo_uint16_t = uint16_t;
using echo_int32_t = int32_t;
using echo_uint32_t = uint32_t;

// "Word" types used for signals, spectra, filter weights and filter memory.
#ifdef FIXED_POINT
// Fixed-point build: words are integers.
using echo_word16_t = echo_int16_t;
using echo_word32_t = echo_int32_t;
#else
// Floating-point build: words must be real numbers. The canceller stores
// fractional quantities in them (pre-emphasis .9f, notch radius, the Hann
// window, the proportional step sizes); with integer words all of those
// truncate to zero. Both word types are the same type in this mode, which is
// also what lets a word16 buffer be passed where a word32 buffer is expected.
using echo_word16_t = float;
using echo_word32_t = float;
#endif

// Type of the DC-notch filter memory.
using echo_mem_t = echo_word32_t;


#ifdef FIXED_POINT

// Forward declarations for operators: echo_float_t::operator* calls
// echo_float_mult(), which is defined only after the struct itself.

struct echo_float_t;

inline echo_float_t echo_float_mult(echo_float_t a, echo_float_t b);

inline echo_float_t echo_float_mul32_u(float a, float b);


// Fixed-point type for pseudo-float operations: a 16-bit mantissa paired with
// a 16-bit power-of-two exponent.
typedef struct echo_float_t {
  int16_t m;  // Mantissa
  int16_t e;  // Exponent

  // Builds a value from an explicit mantissa/exponent pair (defaults: {0, 0}).
  constexpr echo_float_t(int16_t mantissa = 0, int16_t exponent = 0)
      : m(mantissa), e(exponent) {}

  // Pseudo-float * pseudo-float; delegates to echo_float_mult().
  inline echo_float_t operator*(const echo_float_t& other) const {
    return echo_float_mult(*this, other);
  }

  // Pseudo-float * 16-bit integer; the result is a regular integer.
  inline echo_word32_t operator*(int16_t scalar) const {
    return scaleToWord32(static_cast<int64_t>(m) * scalar, e);
  }

  // Pseudo-float * 32-bit integer; the result is a regular integer.
  inline echo_word32_t operator*(int32_t scalar) const {
    return scaleToWord32(static_cast<int64_t>(m) * scalar, e);
  }

  // Commuted form of the 32-bit integer product.
  friend inline echo_word32_t operator*(int32_t scalar, const echo_float_t& f) {
    return f * scalar;
  }

 private:
  // Applies the 2^(exponent - 14) scaling to an integer product and narrows it
  // to echo_word32_t. Shift counts are bounded so that very small or very
  // large exponents cannot trigger an out-of-range shift, and the left shift
  // is done on the unsigned representation so negative products are defined.
  // NOTE(review): this scales by 2^(e - 14), whereas echo_float_from_double()
  // encodes values as m * 2^e -- confirm which convention is intended here.
  static echo_word32_t scaleToWord32(int64_t product, int exponent) {
    const int shift = exponent - 14;
    if (shift >= 0) {
      if (shift >= 64) return 0;  // every bit is shifted out
      return static_cast<echo_word32_t>(static_cast<uint64_t>(product)
                                        << shift);
    }
    const int down = (-shift > 63) ? 63 : -shift;
    return static_cast<echo_word32_t>(product >> down);
  }
} echo_float_t;


// Fixed-point arithmetic helper functions

// Converts a double to a pseudo-float whose value is m * 2^e, with the
// magnitude of the mantissa normalised into [16384, 32768).
//
// Zero and NaN map to {0, 0}. Negative inputs yield a negative mantissa, and
// infinities saturate to {+/-32767, 15}; the original normalisation loops
// never terminated for any of these inputs.
inline echo_float_t echo_float_from_double(double x) {
  echo_float_t r;
  r.m = 0;
  r.e = 0;
  if (x == 0 || std::isnan(x)) {
    return r;
  }

  const bool negative = x < 0;
  double magnitude = negative ? -x : x;
  if (std::isinf(magnitude)) {
    r.m = negative ? -32767 : 32767;
    r.e = 15;
    return r;
  }

  // Scale by exact powers of two until the magnitude fits the mantissa range.
  int e = 0;
  while (magnitude >= 32768) { magnitude *= 0.5; e++; }
  while (magnitude < 16384) { magnitude *= 2.0; e--; }

  const int16_t mantissa = (int16_t)magnitude;
  r.m = negative ? (int16_t)(-mantissa) : mantissa;
  r.e = (int16_t)e;
  return r;
}


// Multiplies two pseudo-floats. The mantissa product is taken in 32 bits and
// then renormalised so that results of either sign end up with a mantissa
// magnitude of at least 16384 (the original only renormalised positive
// results, and (-32768) * (-32768) overflowed the 16-bit mantissa).
// A zero product keeps the computed exponent, as before.
inline echo_float_t echo_float_mult(echo_float_t a, echo_float_t b) {
  int32_t mant = (static_cast<int32_t>(a.m) * b.m) >> 15;
  int exp = a.e + b.e + 15;

  if (mant > 32767) {  // only reachable for (-32768) * (-32768)
    mant >>= 1;
    exp++;
  }
  if (mant != 0) {
    while (mant < 16384 && mant > -16384) { mant *= 2; exp--; }
  }

  echo_float_t r;
  r.m = static_cast<int16_t>(mant);
  r.e = static_cast<int16_t>(exp);
  return r;
}


// Multiplies two floats (in single precision) and converts the product to a
// pseudo-float.
inline echo_float_t echo_float_mul32_u(float a, float b) {
  const float product = a * b;
  return echo_float_from_double(product);
}


// Packs a 32-bit mantissa and an exponent into an echo_float_t, halving or
// doubling the mantissa (and adjusting the exponent) until its magnitude lies
// in the 16-bit normalised range. A zero mantissa is stored as is.
inline echo_float_t echo_float_pack(int32_t mant, int exp) {
  if (mant != 0) {
    while (mant > 32767 || mant < -32768) { mant /= 2; ++exp; }
    while (mant < 16384 && mant > -16384) { mant *= 2; --exp; }
  }
  return echo_float_t(static_cast<int16_t>(mant), static_cast<int16_t>(exp));
}

// Returns a + b.
// The operand with the smaller exponent is shifted down to the larger one; if
// the exponents differ by more than 15 the smaller operand is dropped.
// The sum is formed in 32 bits and renormalised, so adding two full-scale
// mantissas no longer wraps around, and a zero operand never hides the other.
inline echo_float_t echo_float_add(echo_float_t a, echo_float_t b) {
  if (a.m == 0) return b;
  if (b.m == 0) return a;

  if (a.e > b.e) {
    const int shift = a.e - b.e;
    if (shift > 15) return a;
    return echo_float_pack(static_cast<int32_t>(a.m) + (b.m >> shift), a.e);
  }

  const int shift = b.e - a.e;
  if (shift > 15) return b;
  return echo_float_pack(static_cast<int32_t>(a.m >> shift) + b.m, b.e);
}

// Returns a - b, with the same alignment and renormalisation as
// echo_float_add().
inline echo_float_t echo_float_sub(echo_float_t a, echo_float_t b) {
  if (b.m == 0) return a;
  if (a.m == 0) return echo_float_pack(-static_cast<int32_t>(b.m), b.e);

  if (a.e > b.e) {
    const int shift = a.e - b.e;
    if (shift > 15) return a;
    return echo_float_pack(static_cast<int32_t>(a.m) - (b.m >> shift), a.e);
  }

  const int shift = b.e - a.e;
  if (shift > 15) {
    // a is negligible next to b: the result is -b.
    return echo_float_pack(-static_cast<int32_t>(b.m), b.e);
  }
  return echo_float_pack(static_cast<int32_t>(a.m >> shift) - b.m, b.e);
}


inline bool echo_float_lt(echo_float_t a, echo_float_t b) {

  if (a.e != b.e) return a.e < b.e;

  return a.m < b.m;

}


inline bool echo_float_gt(echo_float_t a, echo_float_t b) {

  if (a.e != b.e) return a.e > b.e;

  return a.m > b.m;

}


// Returns a / b. Division by a zero mantissa saturates to {32767, 15}.
//
// The quotient is formed in 32 bits and brought back into the 16-bit mantissa
// range before it is stored: with normalised operands (a.m << 15) / b.m is
// 32768 or more whenever a.m >= b.m, which used to wrap to a negative
// mantissa. As before, only positive quotients are normalised upwards.
inline echo_float_t echo_float_divu(echo_float_t a, echo_float_t b) {
  echo_float_t r;
  if (b.m == 0) {
    r.m = 32767;
    r.e = 15;
    return r;
  }

  // Multiply instead of shifting so that a negative a.m is well defined.
  int32_t quotient = (static_cast<int32_t>(a.m) * 32768) / b.m;
  int exp = a.e - b.e - 15;

  while (quotient > 32767 || quotient < -32768) { quotient /= 2; exp++; }
  if (quotient > 0) {
    while (quotient < 16384) { quotient *= 2; exp--; }
  }

  r.m = static_cast<int16_t>(quotient);
  r.e = static_cast<int16_t>(exp);
  return r;
}


// Returns the square root of a pseudo-float.
//
// The input is decoded as m * 2^e, the same encoding that
// echo_float_from_double() produces for the result; the original decoded it
// as m * 2^(e - 14), so the result was off by a factor of 2^7.
// Zero and negative inputs return {0, 0} instead of feeding NaN to the
// converter.
inline echo_float_t echo_float_sqrt(echo_float_t x) {
  if (x.m <= 0) {
    return echo_float_t(0, 0);
  }
  const double val = std::ldexp(static_cast<double>(x.m), x.e);
  return echo_float_from_double(std::sqrt(val));
}


// Converts a pseudo-float to a 16-bit integer by shifting the mantissa by the
// exponent. The shift distance is capped at 15 bits in either direction.
inline int16_t echo_float_extract16(echo_float_t x) {
  const int exponent = x.e;
  if (exponent <= 0) {
    const int down = (-exponent > 15) ? 15 : -exponent;
    return x.m >> down;
  }
  const int up = (exponent > 15) ? 15 : exponent;
  return x.m << up;
}


// Multiplies a pseudo-float by 2^bits by adding `bits` to its exponent; the
// mantissa is left untouched.
inline echo_float_t echo_float_shl(echo_float_t x, int bits) {
  echo_float_t shifted = x;
  shifted.e = (int16_t)(x.e + bits);
  return shifted;
}


// Tuning constants of the fixed-point build, written as {mantissa, exponent}
// with value = mantissa * 2^exponent (the encoding produced by
// echo_float_from_double()). Each one mirrors the floating-point constant of
// the same name. Mantissas are normalised (>= 16384) because the pseudo-float
// helpers assume normalised operands.
static const echo_float_t MIN_LEAK = {20972, -22};  // 0.005

static const echo_float_t VAR1_SMOOTH = {23593, -16};  // 0.36

static const echo_float_t VAR2_SMOOTH = {23674, -15};  // 0.7225

static const echo_float_t VAR1_UPDATE = {16384, -15};  // 0.5

static const echo_float_t VAR2_UPDATE = {16384, -16};  // 0.25

// 4.0; the previous {16384, 2} encoded 65536.
static const echo_float_t VAR_BACKTRACK = {16384, -12};


#else

// Floating-point mode


// Tuning constants of the floating-point build.
static constexpr float MIN_LEAK = 0.005f;
static constexpr float VAR1_SMOOTH = 0.36f;
static constexpr float VAR2_SMOOTH = 0.7225f;
static constexpr float VAR1_UPDATE = 0.5f;
static constexpr float VAR2_UPDATE = 0.25f;
static constexpr float VAR_BACKTRACK = 4.0f;


#endif  // FIXED_POINT


// Floating point type definition (for non-FIXED_POINT mode)

#ifndef FIXED_POINT
// Without FIXED_POINT the pseudo-float type is simply a native float.
using echo_float_t = float;
#endif


// Complete working state of one echo canceller instance. It is created by
// MDFEchoCancellation::echoStateInitMc() and released by the destructor of
// MDFEchoCancellation; all pointer members are buffers allocated there.
struct EchoState_ {

  int frame_size;  // Samples per processed frame

  int window_size;  // Set to 2 * frame_size on creation

  int M;  // Number of filter blocks: filter_length / frame_size, rounded up

  int cancel_count;  // Incremented on every processed frame; cleared by reset()

  int adapted;  // When non-zero the proportional step sizes are re-estimated

  int saturated;  // While non-zero the weight gradient step is skipped

  int screwed_up;  // Cleared on creation and by reset()

  int C;  // Number of microphone channels

  int K;  // Number of speaker channels

  echo_int32_t sampling_rate;  // Defaults to 8000 on creation

  echo_word16_t spec_average;  // frame_size / sampling_rate

  echo_word16_t beta0;  // 2 * frame_size / sampling_rate

  echo_word16_t beta_max;  // .5 * frame_size / sampling_rate

  echo_word32_t sum_adapt;

  echo_word16_t leak_estimate;


  echo_word16_t* e;     /* scratch */

  echo_word16_t* x;     /* Far-end input buffer (2N) */

  echo_word16_t* X;     /* Far-end buffer (M+1 frames) in frequency domain */

  echo_word16_t* input; /* scratch */

  echo_word16_t* y;     /* scratch */

  echo_word16_t* last_y;

  echo_word16_t* Y; /* scratch */

  echo_word16_t* E;

  echo_word32_t* PHI; /* scratch */

  echo_word32_t* W;   /* (Background) filter weights */

#ifdef TWO_PATH

  echo_word16_t* foreground; /* Foreground filter weights */

  echo_word32_t

      Davg1; /* 1st recursive average of the residual power difference */

  echo_word32_t

      Davg2; /* 2nd recursive average of the residual power difference */

  echo_float_t Dvar1; /* Estimated variance of 1st estimator */

  echo_float_t Dvar2; /* Estimated variance of 2nd estimator */

#endif

  echo_word32_t* power;  /* Power of the far-end signal */

  echo_float_t* power_1; /* Inverse power of far-end */

  echo_word16_t* wtmp;   /* scratch */

  echo_word32_t* Rf;     /* scratch */

  echo_word32_t* Yf;     /* scratch */

  echo_word32_t* Xf;     /* scratch */

  echo_word32_t* Eh;

  echo_word32_t* Yh;

  echo_float_t Pey;

  echo_float_t Pyy;

  echo_word16_t* window;  // window_size entries: .5 - .5 * cos(2 * pi * i / N)

  echo_word16_t* prop;  // M entries: per-block adaptation step weights

  void* fft_table;  // Opaque handle returned by echo_fft_init()

  // Previous-sample memories: memX has K entries, memD and memE have C entries
  echo_word16_t *memX, *memD, *memE;

  echo_word16_t preemph;  // Pre-emphasis coefficient (.9f on creation)

  echo_word16_t notch_radius;  // DC-notch radius, chosen from sampling_rate

  echo_mem_t* notch_mem;  // DC-notch filter memory, two entries per microphone


  echo_int16_t* play_buf;  // Frames queued by playback() for capture()

  int play_buf_pos;  // Number of samples currently queued in play_buf

  int play_buf_started;  // Set by the first capture(); gates playback()

};


// Convenience alias for the state struct.
typedef struct EchoState_ EchoState;


// Working set for transforms of one fixed size: the FFT driver to use, the
// transform length, and two float scratch vectors of that length whose storage
// comes from the supplied allocator (rebound to float).
template <typename Allocator = std::allocator<uint8_t>>
struct fft_state {
  using FloatAllocator =
      typename std::allocator_traits<Allocator>::template rebind_alloc<float>;

  AudioFFTBase* driver;  // Not owned
  int N;                 // Transform length passed to the constructor
  std::vector<float, FloatAllocator> temp_real;
  std::vector<float, FloatAllocator> temp_img;

  // size: transform length; drv: FFT driver; alloc: allocator for the scratch
  // vectors. The initialisers are listed in declaration order (the order in
  // which they actually run), and a negative size yields empty scratch
  // vectors instead of being converted to a huge unsigned length.
  fft_state(int size, AudioFFTBase* drv, const Allocator& alloc = Allocator())
      : driver(drv),
        N(size),
        temp_real(FloatAllocator(alloc)),
        temp_img(FloatAllocator(alloc)) {
    const size_t count = size > 0 ? static_cast<size_t>(size) : 0;
    temp_real.resize(count);
    temp_img.resize(count);
  }
};


template <typename Allocator = std::allocator<uint8_t>>


class MDFEchoCancellation : public AudioStream {

 public:


  // Creates a canceller for one microphone and one speaker channel.
  // filterLength: length of the echo filter in samples; fftDriver: FFT
  // implementation to use; alloc: allocator for all internal buffers.
  // Nothing is allocated here; buffers are created on first use.
  MDFEchoCancellation(int filterLength, AudioFFTBase& fftDriver,
                      const Allocator& alloc = Allocator())
      : MDFEchoCancellation(filterLength, 1, 1, fftDriver, alloc) {}

  // Creates a canceller for nbMic microphone and nbSpeakers speaker channels.
  MDFEchoCancellation(int filterLength, int nbMic, int nbSpeakers,
                      AudioFFTBase& fftDriver,
                      const Allocator& alloc = Allocator())
      : fft_driver(&fftDriver),
        allocator(alloc),
        filter_length(filterLength),
        nb_mic(nbMic),
        nb_speakers(nbSpeakers) {}


  // Releases the FFT tables, every buffer owned by the echo state and the
  // state object itself. Does nothing if the canceller was never initialized.
  ~MDFEchoCancellation() {
    if (!state) return;

    if (state->fft_table) echo_fft_destroy<Allocator>(state->fft_table);

    // The element counts mirror the allocations in echoStateInitMc():
    // an allocator's deallocate() must receive the count that was allocated,
    // so the buffers are no longer released with a count of zero.
    const size_t frame = static_cast<size_t>(state->frame_size);
    const size_t N = static_cast<size_t>(state->window_size);
    const size_t M = static_cast<size_t>(state->M);
    const size_t C = static_cast<size_t>(state->C);
    const size_t K = static_cast<size_t>(state->K);
    const size_t bins = frame + 1;

    echoFree(state->e, C * N);
    echoFree(state->x, K * N);
    echoFree(state->input, C * frame);
    echoFree(state->y, C * N);
    echoFree(state->last_y, C * N);
    echoFree(state->Yf, bins);
    echoFree(state->Rf, bins);
    echoFree(state->Xf, bins);
    echoFree(state->Yh, bins);
    echoFree(state->Eh, bins);
    echoFree(state->X, K * (M + 1) * N);
    echoFree(state->Y, C * N);
    echoFree(state->E, C * N);
    echoFree(state->W, C * K * M * N);
#ifdef TWO_PATH
    echoFree(state->foreground, M * N * C * K);
#endif
    echoFree(state->PHI, N);
    echoFree(state->power, bins);
    echoFree(state->power_1, bins);
    echoFree(state->window, N);
    echoFree(state->prop, M);
    echoFree(state->wtmp, N);
    echoFree(state->memX, K);
    echoFree(state->memD, C);
    echoFree(state->memE, C);
    echoFree(state->notch_mem, 2 * C);
    echoFree(state->play_buf, K * (PLAYBACK_DELAY + 1) * frame);

    delete state;
    state = nullptr;
  }


  void cancel(const echo_int16_t* rec, const echo_int16_t* play,

                    echo_int16_t* out) {

    ensureInitialized();

    echoCancellationImpl(state, rec, play, out);

  }


  void capture(const echo_int16_t* rec, echo_int16_t* out) {

    ensureInitialized();

    state->play_buf_started = 1;

    if (state->play_buf_pos >= state->frame_size) {

      echoCancellationImpl(state, rec, state->play_buf, out);

      state->play_buf_pos -= state->frame_size;

      std::memmove(state->play_buf,

                   &state->play_buf[state->frame_size],

                   state->play_buf_pos * sizeof(echo_int16_t));

    } else {

      echoWarning("No playback frame available");

      if (state->play_buf_pos != 0) {

        echoWarning("Internal playback buffer corruption");

        state->play_buf_pos = 0;

      }

      for (int i = 0; i < state->frame_size; i++) out[i] = rec[i];

    }

  }


  void playback(const echo_int16_t* play) {

    ensureInitialized();

    if (!state->play_buf_started) {

      echoWarning("Discarded first playback frame");

      return;

    }

    if (state->play_buf_pos <= PLAYBACK_DELAY * state->frame_size) {

      for (int i = 0; i < state->frame_size; i++)

        state->play_buf[state->play_buf_pos + i] = play[i];

      state->play_buf_pos += state->frame_size;

      if (state->play_buf_pos <= (PLAYBACK_DELAY - 1) * state->frame_size) {

        echoWarning("Auto-filling buffer");

        for (int i = 0; i < state->frame_size; i++)

          state->play_buf[state->play_buf_pos + i] = play[i];

        state->play_buf_pos += state->frame_size;

      }

    } else {

      echoWarning("Had to discard playback frame");

    }

  }


  void reset() {

    ensureInitialized();

    int N = state->window_size;

    int M = state->M;

    int C = state->C;

    int K = state->K;


    state->cancel_count = 0;

    state->screwed_up = 0;


    for (int i = 0; i < N * M; i++) state->W[i] = 0;

#ifdef TWO_PATH

    for (int i = 0; i < N * M; i++) state->foreground[i] = 0;

#endif

    for (int i = 0; i < N * (M + 1); i++) state->X[i] = 0;

    for (int i = 0; i <= state->frame_size; i++) {

      state->power[i] = 0;

      state->power_1[i] = FLOAT_ONE;

      state->Eh[i] = 0;

      state->Yh[i] = 0;

    }

    for (int i = 0; i < state->frame_size; i++) state->last_y[i] = 0;

    for (int i = 0; i < N * C; i++) state->E[i] = 0;

    for (int i = 0; i < N * K; i++) state->x[i] = 0;

    for (int i = 0; i < 2 * C; i++) state->notch_mem[i] = 0;

    for (int i = 0; i < C; i++) state->memD[i] = state->memE[i] = 0;

    for (int i = 0; i < K; i++) state->memX[i] = 0;


    state->saturated = 0;

    state->adapted = 0;

    state->sum_adapt = 0;

    state->Pey = state->Pyy = FLOAT_ONE;

#ifdef TWO_PATH

    state->Davg1 = state->Davg2 = 0;

    state->Dvar1 = state->Dvar2 = FLOAT_ZERO;

#endif

    for (int i = 0; i < 3 * state->frame_size; i++) state->play_buf[i] = 0;

    state->play_buf_pos = PLAYBACK_DELAY * state->frame_size;

    state->play_buf_started = 0;

  }


  int control(int request, void* ptr) {

    switch (request) {

      case ECHO_GET_FRAME_SIZE:

        (*(int*)ptr) = state->frame_size;

        break;

      case ECHO_SET_SAMPLING_RATE:

        state->sampling_rate = (*(int*)ptr);

        state->spec_average = state->frame_size / (float)state->sampling_rate;

        state->beta0 = (2.0f * state->frame_size) / state->sampling_rate;

        state->beta_max = (.5f * state->frame_size) / state->sampling_rate;

        if (state->sampling_rate < 12000)

          state->notch_radius = .9f;

        else if (state->sampling_rate < 24000)

          state->notch_radius = .982f;

        else

          state->notch_radius = .992f;

        break;

      case ECHO_GET_SAMPLING_RATE:

        (*(int*)ptr) = state->sampling_rate;

        break;

      case ECHO_GET_IMPULSE_RESPONSE_SIZE:

        *((echo_int32_t*)ptr) = state->M * state->frame_size;

        break;

      case ECHO_GET_IMPULSE_RESPONSE: {

        int M = state->M, N = state->window_size, n = state->frame_size;

        echo_int32_t* filt = (echo_int32_t*)ptr;

        for (int j = 0; j < M; j++) {

          echo_ifft<Allocator>(state->fft_table, &state->W[j * N], state->wtmp);

          for (int i = 0; i < n; i++) filt[j * n + i] = 32767 * state->wtmp[i];

        }

      } break;

      default:

        return -1;

    }

    return 0;

  }


  int getFrameSize() { return state->frame_size; }


  void setSamplingRate(int rate) { control(ECHO_SET_SAMPLING_RATE, &rate); }


  int getSamplingRate() { return state->sampling_rate; }


  int getImpulseResponseSize() { return state->M * state->frame_size; }


  void getImpulseResponse(echo_int32_t* response) {

    control(ECHO_GET_IMPULSE_RESPONSE, response);

  }


  // Configuration accessors. Each setter only takes effect before the
  // canceller has been initialized; afterwards it logs a warning and leaves
  // the value unchanged.

  // Sets the echo filter length.
  void setFilterLength(int len) {
    if (!initialized) {
      filter_length = len;
      return;
    }
    echoWarning("Cannot change filter length after initialization");
  }

  // Returns the configured echo filter length.
  int getFilterLength() { return filter_length; }

  // Sets the number of microphone channels.
  void setMicChannels(int num) {
    if (!initialized) {
      nb_mic = num;
      return;
    }
    echoWarning("Cannot change mic channels after initialization");
  }

  // Returns the configured number of microphone channels.
  int getMicChannels() { return nb_mic; }

  // Sets the number of speaker channels.
  void setSpeakerChannels(int num) {
    if (!initialized) {
      nb_speakers = num;
      return;
    }
    echoWarning("Cannot change speaker channels after initialization");
  }

  // Returns the configured number of speaker channels.
  int getSpeakerChannels() { return nb_speakers; }


  // Replaces the FFT driver. Only possible before the canceller has been
  // initialized; afterwards a warning is logged and the driver is kept.
  void setFFTDriver(AudioFFTBase& fftDriver) {
    if (!initialized) {
      fft_driver = &fftDriver;
      return;
    }
    echoWarning("Cannot change FFT driver after initialization");
  }

  // Returns the internal state; null until the canceller is initialized.
  EchoState* getState() { return state; }


 protected:

  // Working state; created lazily by ensureInitialized(), freed in the
  // destructor.
  EchoState* state = nullptr;

  // FFT implementation supplied by the caller (not owned).
  AudioFFTBase* fft_driver;

  // Allocator from which all internal buffers are obtained.
  Allocator allocator;

  // Requested echo filter length.
  int filter_length;

  // Number of microphone channels.
  int nb_mic;

  // Number of speaker channels.
  int nb_speakers;

  // Set once ensureInitialized() has run; configuration setters are rejected
  // afterwards.
  bool initialized = false;


  void ensureInitialized() {

    if (initialized) return;


    int frameSize = fft_driver->config().length;

    state = echoStateInitMc(frameSize, filter_length, nb_mic, nb_speakers);

    if (state && fft_driver) {

      state->fft_table =

          echo_fft_init<Allocator>(state->window_size, fft_driver, allocator);

    }

    initialized = true;

  }


  template <typename T>


  T* echoAlloc(size_t count) {

    typename std::allocator_traits<Allocator>::template rebind_alloc<T> alloc(allocator);

    T* ptr = alloc.allocate(count);

    // Initialize to zero (equivalent to calloc behavior)

    for (size_t i = 0; i < count; ++i) {

      std::allocator_traits<typename std::allocator_traits<Allocator>::template rebind_alloc<T>>::construct(alloc, ptr + i);

    }

    return ptr;

  }


  template <typename T>


  void echoFree(T* ptr, size_t count = 0) {

    if (ptr) {

      typename std::allocator_traits<Allocator>::template rebind_alloc<T> alloc(allocator);

      // Note: count is not used since we can't track allocation size

      // This is acceptable for POD types as we're using with speexdsp

      alloc.deallocate(ptr, count);

    }

  }


  // Logs `str` at warning level with the echo canceller prefix.
  void echoWarning(const char* str) {
    LOGW("EchoCanceller Warning: %s", str);
  }

  // Logs `str` at error level with the echo canceller prefix.
  void echoFatal(const char* str) {
    LOGE("EchoCanceller Error: %s", str);
  }


  // Single-precision square root.
  float spxSqrt(float x) {
    const float root = sqrtf(x);
    return root;
  }


  // Integer base-2 logarithm: returns the index of the highest set bit of x,
  // and 0 for x == 0 or x == 1.
  echo_int16_t spxIlog2(echo_uint32_t x) {
    // Binary search over the bit position, halving the step each round.
    const int steps[] = {16, 8, 4, 2, 1};
    int log2 = 0;
    for (int step : steps) {
      if ((x >> step) != 0) {
        x >>= step;
        log2 += step;
      }
    }
    return log2;
  }


  // Single-precision exponential.
  float spxExp(float x) {
    const float result = expf(x);
    return result;
  }

  // Single-precision cosine (argument in radians).
  float spxCos(float x) {
    const float result = cosf(x);
    return result;
  }


  inline void filterDcNotch16(const echo_int16_t* in, echo_word16_t radius,

                              echo_word16_t* out, int len, echo_mem_t* mem,

                              int stride) {

    echo_word16_t den2 = radius * radius + .7f * (1 - radius) * (1 - radius);

    for (int i = 0; i < len; i++) {

      echo_word16_t vin = in[i * stride];

      echo_word32_t vout = mem[0] + vin;

      mem[0] = mem[1] + 2 * (-vin + radius * vout);

      mem[1] = vin - den2 * vout;

      out[i] = radius * vout;

    }

  }


  // Returns the inner product of the first `len` elements of x and y. The sum
  // is accumulated in a float and converted to echo_word32_t on return.
  echo_word32_t mdfInnerProd(const echo_word16_t* x, const echo_word16_t* y,
                             int len) {
    float acc = 0;
    int remaining = len;
    while (remaining > 0) {
      acc += (*x) * (*y);
      ++x;
      ++y;
      --remaining;
    }
    return acc;
  }


  inline void powerSpectrum(const echo_word16_t* X, echo_word32_t* ps, int N) {

    ps[0] = X[0] * X[0];

    for (int i = 1, j = 1; i < N - 1; i += 2, j++) {

      ps[j] = X[i] * X[i] + X[i + 1] * X[i + 1];

    }

    ps[N / 2] = X[N - 1] * X[N - 1];

  }


  inline void powerSpectrumAccum(const echo_word16_t* X, echo_word32_t* ps,

                                 int N) {

    ps[0] += X[0] * X[0];

    for (int i = 1, j = 1; i < N - 1; i += 2, j++) {

      ps[j] += X[i] * X[i] + X[i + 1] * X[i + 1];

    }

    ps[N / 2] += X[N - 1] * X[N - 1];

  }


  inline void spectralMulAccum(const echo_word16_t* X, const echo_word32_t* Y,

                               echo_word16_t* acc, int N, int M) {

    for (int i = 0; i < N; i++) acc[i] = 0;


    for (int j = 0; j < M; j++) {

      acc[0] += X[0] * Y[0];

      for (int i = 1; i < N - 1; i += 2) {

        acc[i] += (X[i] * Y[i] - X[i + 1] * Y[i + 1]);

        acc[i + 1] += (X[i + 1] * Y[i] + X[i] * Y[i + 1]);

      }

      acc[N - 1] += X[N - 1] * Y[N - 1];

      X += N;

      Y += N;

    }

  }


  // Computes, for every bin of two packed spectra of length N, the product of
  // Y with the complex conjugate of X, scaled by the weight p * w[bin].
  // w: N / 2 + 1 per-bin weights; p: common factor applied to every weight;
  // prod: receives N values in the same packed layout as X and Y.
  // Elements 0 and N - 1 are treated as single real values, the elements in
  // between as (i, i + 1) pairs.
  // NOTE(review): the pair layout is taken to be (real, imaginary) -- confirm
  // against the FFT wrapper.
  inline void weightedSpectralMulConj(const echo_float_t* w, const echo_float_t p,

                                      const echo_word16_t* X,

                                      const echo_word16_t* Y, echo_word32_t* prod,

                                      int N) {

    echo_float_t W;

    W = p * w[0];

    // The (int32_t) cast applies to X[0] only, not to the whole product.
    prod[0] = W * ((int32_t)X[0] * Y[0]);

    for (int i = 1, j = 1; i < N - 1; i += 2, j++) {

      W = p * w[j];

      // First component of conj(X) * Y for this pair.
      prod[i] = W * ((int32_t)(X[i] * Y[i] + X[i + 1] * Y[i + 1]));

      // Second component of conj(X) * Y for this pair.
      prod[i + 1] = W * ((int32_t)(-X[i + 1] * Y[i] + X[i] * Y[i + 1]));

    }

    W = p * w[N / 2];

    prod[N - 1] = W * ((int32_t)X[N - 1] * Y[N - 1]);

  }


  inline void mdfAdjustProp(const echo_word32_t* W, int N, int M, int P,

                            echo_word16_t* prop) {

    echo_word16_t max_sum = 1;

    echo_word32_t prop_sum = 1;


    for (int i = 0; i < M; i++) {

      echo_word32_t tmp = 1;

      for (int p = 0; p < P; p++) {

        for (int j = 0; j < N; j++) {

          float val = W[p * N * M + i * N + j];

          tmp += val * val;

        }

      }

      prop[i] = spxSqrt(tmp);

      if (prop[i] > max_sum) max_sum = prop[i];

    }


    for (int i = 0; i < M; i++) {

      prop[i] += 0.1f * max_sum;

      prop_sum += prop[i];

    }


    for (int i = 0; i < M; i++) {

      prop[i] = 0.99f * prop[i] / prop_sum;

    }

  }


  // Creates and initializes the echo state for the given configuration.
  // frame_size: samples per frame; filter_length: echo filter length in
  // samples; nb_mic / nb_speakers: number of microphone / speaker channels.
  // Returns the new state, or nullptr when an argument is not positive or the
  // state could not be created. The FFT table is left null for the caller to
  // set.
  //
  // Non-positive arguments are rejected up front: a zero frame_size would
  // divide by zero when the block count is computed, and a non-positive
  // filter_length would give zero blocks and a write into an empty `prop`.
  EchoState* echoStateInitMc(int frame_size, int filter_length, int nb_mic,
                             int nb_speakers) {
    if (frame_size <= 0 || filter_length <= 0 || nb_mic <= 0 ||
        nb_speakers <= 0) {
      echoFatal("Invalid frame size, filter length or channel count");
      return nullptr;
    }

    const int N = frame_size * 2;  // analysis window: two frames
    const int M = (filter_length + frame_size - 1) / frame_size;  // rounded up
    const int C = nb_mic;
    const int K = nb_speakers;

    EchoState* st = new EchoState();
    if (!st) return nullptr;

    st->K = K;
    st->C = C;
    st->frame_size = frame_size;
    st->window_size = N;
    st->M = M;
    st->cancel_count = 0;
    st->sum_adapt = 0;
    st->saturated = 0;
    st->screwed_up = 0;
    st->sampling_rate = 8000;
    st->spec_average = st->frame_size / (float)st->sampling_rate;
    st->beta0 = (2.0f * st->frame_size) / st->sampling_rate;
    st->beta_max = (.5f * st->frame_size) / st->sampling_rate;
    st->leak_estimate = 0;

    // Allocate buffers (the destructor releases every one of them).
    st->e = echoAlloc<echo_word16_t>(C * N);
    st->x = echoAlloc<echo_word16_t>(K * N);
    st->input = echoAlloc<echo_word16_t>(C * st->frame_size);
    st->y = echoAlloc<echo_word16_t>(C * N);
    st->last_y = echoAlloc<echo_word16_t>(C * N);
    st->Yf = echoAlloc<echo_word32_t>(st->frame_size + 1);
    st->Rf = echoAlloc<echo_word32_t>(st->frame_size + 1);
    st->Xf = echoAlloc<echo_word32_t>(st->frame_size + 1);
    st->Yh = echoAlloc<echo_word32_t>(st->frame_size + 1);
    st->Eh = echoAlloc<echo_word32_t>(st->frame_size + 1);
    st->X = echoAlloc<echo_word16_t>(K * (M + 1) * N);
    st->Y = echoAlloc<echo_word16_t>(C * N);
    st->E = echoAlloc<echo_word16_t>(C * N);
    st->W = echoAlloc<echo_word32_t>(C * K * M * N);

#ifdef TWO_PATH
    st->foreground = echoAlloc<echo_word16_t>(M * N * C * K);
#endif

    st->PHI = echoAlloc<echo_word32_t>(N);
    st->power = echoAlloc<echo_word32_t>(frame_size + 1);
    st->power_1 = echoAlloc<echo_float_t>(frame_size + 1);
    st->window = echoAlloc<echo_word16_t>(N);
    st->prop = echoAlloc<echo_word16_t>(M);
    st->wtmp = echoAlloc<echo_word16_t>(N);

    // Initialize window: .5 - .5 * cos(2 * pi * i / N).
    // A local constant replaces M_PI, which is not part of standard C++.
    const double kPi = 3.14159265358979323846;
    for (int i = 0; i < N; i++)
      st->window[i] = .5f - .5f * cosf(2 * kPi * i / N);

    // Initialize power_1
    for (int i = 0; i <= st->frame_size; i++) st->power_1[i] = FLOAT_ONE;

    // Initialize W
    for (int i = 0; i < N * M * K * C; i++) st->W[i] = 0;

    // Initialize prop: exponentially decaying weights, then scaled so that
    // they sum to .8.
    {
      echo_word32_t sum = 0;
      float decay = expf(-2.4f / M);
      st->prop[0] = .7f;
      sum = st->prop[0];
      for (int i = 1; i < M; i++) {
        st->prop[i] = st->prop[i - 1] * decay;
        sum += st->prop[i];
      }
      for (int i = M - 1; i >= 0; i--) {
        st->prop[i] = .8f * st->prop[i] / sum;
      }
    }

    st->memX = echoAlloc<echo_word16_t>(K);
    st->memD = echoAlloc<echo_word16_t>(C);
    st->memE = echoAlloc<echo_word16_t>(C);
    st->preemph = .9f;

    // Notch radius depends on the sampling rate.
    if (st->sampling_rate < 12000)
      st->notch_radius = .9f;
    else if (st->sampling_rate < 24000)
      st->notch_radius = .982f;
    else
      st->notch_radius = .992f;

    st->notch_mem = echoAlloc<echo_mem_t>(2 * C);
    st->adapted = 0;
    st->Pey = st->Pyy = FLOAT_ONE;

#ifdef TWO_PATH
    st->Davg1 = st->Davg2 = 0;
    st->Dvar1 = st->Dvar2 = FLOAT_ZERO;
#endif

    // Playback queue used by playback() / capture().
    st->play_buf =
        echoAlloc<echo_int16_t>(K * (PLAYBACK_DELAY + 1) * st->frame_size);
    st->play_buf_pos = PLAYBACK_DELAY * st->frame_size;
    st->play_buf_started = 0;

    st->fft_table = nullptr;

    return st;
  }


  inline void echoCancellationImpl(EchoState* st, const echo_int16_t* in,

                                   const echo_int16_t* far_end,

                                   echo_int16_t* out) {

    int N = st->window_size;

    int M = st->M;

    int C = st->C;

    int K = st->K;


    st->cancel_count++;

    float ss = .35f / M;

    float ss_1 = 1 - ss;


    // Apply notch filter and pre-emphasis to input

    for (int chan = 0; chan < C; chan++) {

      filterDcNotch16(in + chan, st->notch_radius,

                      st->input + chan * st->frame_size, st->frame_size,

                      st->notch_mem + 2 * chan, C);


      for (int i = 0; i < st->frame_size; i++) {

        echo_word32_t tmp32 =

            st->input[chan * st->frame_size + i] - st->preemph * st->memD[chan];

        st->memD[chan] = st->input[chan * st->frame_size + i];

        st->input[chan * st->frame_size + i] = tmp32;

      }

    }


    // Process far-end signal

    for (int speak = 0; speak < K; speak++) {

      std::memmove(&st->x[speak * N],

                   &st->x[speak * N + st->frame_size],

                   st->frame_size * sizeof(echo_word16_t));

      for (int i = 0; i < st->frame_size; i++) {

        echo_word32_t tmp32 =

            far_end[i * K + speak] - st->preemph * st->memX[speak];

        st->x[speak * N + i + st->frame_size] = tmp32;

        st->memX[speak] = far_end[i * K + speak];

      }

    }


    // Shift memory and compute FFT of far-end

    for (int speak = 0; speak < K; speak++) {

      for (int j = M - 1; j >= 0; j--) {

        std::memmove(&st->X[(j + 1) * N * K + speak * N],

                     &st->X[j * N * K + speak * N],

                     N * sizeof(echo_word16_t));

      }

      echo_fft<Allocator>(st->fft_table, st->x + speak * N, &st->X[speak * N]);

    }


    // Compute power spectrum of far-end

    echo_word32_t Sxx = 0;

    for (int speak = 0; speak < K; speak++) {

      Sxx += mdfInnerProd(st->x + speak * N + st->frame_size,

                          st->x + speak * N + st->frame_size, st->frame_size);

      powerSpectrumAccum(st->X + speak * N, st->Xf, N);

    }


    // Compute foreground filter output and residual

    echo_word32_t Sff = 0;

    for (int chan = 0; chan < C; chan++) {

#ifdef TWO_PATH

      spectralMulAccum(st->X, st->foreground + chan * N * K * M,

                       st->Y + chan * N, N, M * K);

      echo_ifft<Allocator>(st->fft_table, st->Y + chan * N, st->e + chan * N);

      for (int i = 0; i < st->frame_size; i++)

        st->e[chan * N + i] = st->input[chan * st->frame_size + i] -

                              st->e[chan * N + i + st->frame_size];

      Sff += mdfInnerProd(st->e + chan * N, st->e + chan * N, st->frame_size);

#endif

    }


    // Adjust proportional adaptation

    if (st->adapted) mdfAdjustProp(st->W, N, M, C * K, st->prop);


    // Compute weight gradient

    if (st->saturated == 0) {

      for (int chan = 0; chan < C; chan++) {

        for (int speak = 0; speak < K; speak++) {

          for (int j = M - 1; j >= 0; j--) {

            weightedSpectralMulConj(st->power_1, st->prop[j],

                                    &st->X[(j + 1) * N * K + speak * N],

                                    st->E + chan * N, st->PHI, N);

            for (int i = 0; i < N; i++)

              st->W[chan * N * K * M + j * N * K + speak * N + i] += st->PHI[i];

          }

        }

      }

    } else {

      st->saturated--;

    }


    // Update weights (AUMDF)

    for (int chan = 0; chan < C; chan++) {

      for (int speak = 0; speak < K; speak++) {

        for (int j = 0; j < M; j++) {

          if (j == 0 || st->cancel_count % (M - 1) == j - 1) {

            echo_ifft<Allocator>(

                st->fft_table, &st->W[chan * N * K * M + j * N * K + speak * N],

                st->wtmp);

            for (int i = st->frame_size; i < N; i++) st->wtmp[i] = 0;

            echo_fft<Allocator>(

                st->fft_table, st->wtmp,

                &st->W[chan * N * K * M + j * N * K + speak * N]);

          }

        }

      }

    }


    // Initialize spectrum buffers

    for (int i = 0; i <= st->frame_size; i++)

      st->Rf[i] = st->Yf[i] = st->Xf[i] = 0;


    echo_word32_t Dbf = 0;

    echo_word32_t See = 0;


#ifdef TWO_PATH

    // Compute background filter output

    for (int chan = 0; chan < C; chan++) {

      spectralMulAccum(st->X, st->W + chan * N * K * M, st->Y + chan * N, N,

                       M * K);

      echo_ifft<Allocator>(st->fft_table, st->Y + chan * N, st->y + chan * N);

      for (int i = 0; i < st->frame_size; i++)

        st->e[chan * N + i] = st->e[chan * N + i + st->frame_size] -

                              st->y[chan * N + i + st->frame_size];

      Dbf +=

          10 + mdfInnerProd(st->e + chan * N, st->e + chan * N, st->frame_size);

      for (int i = 0; i < st->frame_size; i++)

        st->e[chan * N + i] = st->input[chan * st->frame_size + i] -

                              st->y[chan * N + i + st->frame_size];

      See += mdfInnerProd(st->e + chan * N, st->e + chan * N, st->frame_size);

    }

#endif


#ifndef TWO_PATH

    Sff = See;

#endif


#ifdef TWO_PATH

    // Two-path filter logic

    st->Davg1 = .6f * st->Davg1 + .4f * (Sff - See);

    st->Davg2 = .85f * st->Davg2 + .15f * (Sff - See);

    st->Dvar1 = FLOAT_ADD(FLOAT_MULT(VAR1_SMOOTH, st->Dvar1),

                          FLOAT_MUL32U(.4f * Sff, .4f * Dbf));

    st->Dvar2 = FLOAT_ADD(FLOAT_MULT(VAR2_SMOOTH, st->Dvar2),

                          FLOAT_MUL32U(.15f * Sff, .15f * Dbf));


    int update_foreground = 0;

    if (FLOAT_GT(FLOAT_MUL32U(Sff - See, fabsf(Sff - See)),

                 FLOAT_MUL32U(Sff, Dbf)))

      update_foreground = 1;

    else if (FLOAT_GT(FLOAT_MUL32U(st->Davg1, fabsf(st->Davg1)),

                      FLOAT_MULT(VAR1_UPDATE, st->Dvar1)))

      update_foreground = 1;

    else if (FLOAT_GT(FLOAT_MUL32U(st->Davg2, fabsf(st->Davg2)),

                      FLOAT_MULT(VAR2_UPDATE, st->Dvar2)))

      update_foreground = 1;


    if (update_foreground) {

      st->Davg1 = st->Davg2 = 0;

      st->Dvar1 = st->Dvar2 = FLOAT_ZERO;

      std::memcpy(st->foreground, st->W, N * M * C * K * sizeof(echo_word16_t));

      for (int chan = 0; chan < C; chan++)

        for (int i = 0; i < st->frame_size; i++)

          st->e[chan * N + i + st->frame_size] =

              st->window[i + st->frame_size] *

                  st->e[chan * N + i + st->frame_size] +

              st->window[i] * st->y[chan * N + i + st->frame_size];

    } else {

      int reset_background = 0;

      if (FLOAT_GT(FLOAT_MUL32U(-(Sff - See), fabsf(Sff - See)),

                   FLOAT_MULT(VAR_BACKTRACK, FLOAT_MUL32U(Sff, Dbf))))

        reset_background = 1;

      if (FLOAT_GT(FLOAT_MUL32U(-st->Davg1, fabsf(st->Davg1)),

                   FLOAT_MULT(VAR_BACKTRACK, st->Dvar1)))

        reset_background = 1;

      if (FLOAT_GT(FLOAT_MUL32U(-st->Davg2, fabsf(st->Davg2)),

                   FLOAT_MULT(VAR_BACKTRACK, st->Dvar2)))

        reset_background = 1;


      if (reset_background) {

        std::memcpy(st->W, st->foreground, N * M * C * K * sizeof(echo_word32_t));

        for (int chan = 0; chan < C; chan++) {

          for (int i = 0; i < st->frame_size; i++)

            st->y[chan * N + i + st->frame_size] =

                st->e[chan * N + i + st->frame_size];

          for (int i = 0; i < st->frame_size; i++)

            st->e[chan * N + i] = st->input[chan * st->frame_size + i] -

                                  st->y[chan * N + i + st->frame_size];

        }

        See = Sff;

        st->Davg1 = st->Davg2 = 0;

        st->Dvar1 = st->Dvar2 = FLOAT_ZERO;

      }

    }

#endif


    echo_word32_t Sey = 0, Syy = 0, Sdd = 0;

    for (int chan = 0; chan < C; chan++) {

      // Compute output with de-emphasis

      for (int i = 0; i < st->frame_size; i++) {

        echo_word32_t tmp_out;

#ifdef TWO_PATH

        tmp_out = st->input[chan * st->frame_size + i] -

                  st->e[chan * N + i + st->frame_size];

#else

        tmp_out = st->input[chan * st->frame_size + i] -

                  st->y[chan * N + i + st->frame_size];

#endif

        tmp_out = tmp_out + st->preemph * st->memE[chan];

        if (in[i * C + chan] <= -32000 || in[i * C + chan] >= 32000) {

          if (st->saturated == 0) st->saturated = 1;

        }

        out[i * C + chan] = WORD2INT(tmp_out);

        st->memE[chan] = tmp_out;

      }


      // Prepare error signal for filter update

      for (int i = 0; i < st->frame_size; i++) {

        st->e[chan * N + i + st->frame_size] = st->e[chan * N + i];

        st->e[chan * N + i] = 0;

      }


      // Compute correlations

      Sey += mdfInnerProd(st->e + chan * N + st->frame_size,

                          st->y + chan * N + st->frame_size, st->frame_size);

      Syy += mdfInnerProd(st->y + chan * N + st->frame_size,

                          st->y + chan * N + st->frame_size, st->frame_size);

      Sdd += mdfInnerProd(st->input + chan * st->frame_size,

                          st->input + chan * st->frame_size, st->frame_size);


      // Convert error to frequency domain

      echo_fft<Allocator>(st->fft_table, st->e + chan * N, st->E + chan * N);


      for (int i = 0; i < st->frame_size; i++) st->y[i + chan * N] = 0;

      echo_fft<Allocator>(st->fft_table, st->y + chan * N, st->Y + chan * N);


      // Compute power spectra

      powerSpectrumAccum(st->E + chan * N, st->Rf, N);

      powerSpectrumAccum(st->Y + chan * N, st->Yf, N);

    }


    // Sanity checks

    if (!(Syy >= 0 && Sxx >= 0 && See >= 0) ||

        !(Sff < N * 1e9f && Syy < N * 1e9f && Sxx < N * 1e9f)) {

      st->screwed_up += 50;

      for (int i = 0; i < st->frame_size * C; i++) out[i] = 0;

    } else if (Sff > Sdd + N * 10000.0f) {

      st->screwed_up++;

    } else {

      st->screwed_up = 0;

    }


    if (st->screwed_up >= 50) {

      echoWarning("Echo canceller reset");

      reset();

      return;

    }


    See = MAX32(See, N * 100.0f);


    for (int speak = 0; speak < K; speak++) {

      Sxx += mdfInnerProd(st->x + speak * N + st->frame_size,

                          st->x + speak * N + st->frame_size, st->frame_size);

      powerSpectrumAccum(st->X + speak * N, st->Xf, N);

    }


    // Smooth far-end energy

    for (int j = 0; j <= st->frame_size; j++)

      st->power[j] = ss_1 * st->power[j] + 1 + ss * st->Xf[j];


    // Compute filtered spectra and correlations

    echo_float_t Pey = FLOAT_ZERO, Pyy = FLOAT_ZERO;

    for (int j = st->frame_size; j >= 0; j--) {

      echo_float_t Eh = PSEUDOFLOAT(st->Rf[j] - st->Eh[j]);

      echo_float_t Yh = PSEUDOFLOAT(st->Yf[j] - st->Yh[j]);

      Pey = FLOAT_ADD(Pey, FLOAT_MULT(Eh, Yh));

      Pyy = FLOAT_ADD(Pyy, FLOAT_MULT(Yh, Yh));

      st->Eh[j] =

          (1 - st->spec_average) * st->Eh[j] + st->spec_average * st->Rf[j];

      st->Yh[j] =

          (1 - st->spec_average) * st->Yh[j] + st->spec_average * st->Yf[j];

    }


    Pyy = FLOAT_SQRT(Pyy);

    Pey = FLOAT_DIVU(Pey, Pyy);


    // Compute correlation update rate

    echo_word32_t tmp32 = st->beta0 * Syy;

    if (tmp32 > st->beta_max * See) tmp32 = st->beta_max * See;

    echo_float_t alpha = tmp32 / See;

    echo_float_t alpha_1 = FLOAT_SUB(FLOAT_ONE, alpha);


    st->Pey = FLOAT_ADD(FLOAT_MULT(alpha_1, st->Pey), FLOAT_MULT(alpha, Pey));

    st->Pyy = FLOAT_ADD(FLOAT_MULT(alpha_1, st->Pyy), FLOAT_MULT(alpha, Pyy));

    if (FLOAT_LT(st->Pyy, FLOAT_ONE)) st->Pyy = FLOAT_ONE;

    if (FLOAT_LT(st->Pey, FLOAT_MULT(MIN_LEAK, st->Pyy)))

      st->Pey = FLOAT_MULT(MIN_LEAK, st->Pyy);

    if (FLOAT_GT(st->Pey, st->Pyy)) st->Pey = st->Pyy;


    st->leak_estimate =

        FLOAT_EXTRACT16(FLOAT_SHL(FLOAT_DIVU(st->Pey, st->Pyy), 14));

    if (st->leak_estimate > 16383)

      st->leak_estimate = 32767;

    else

      st->leak_estimate = st->leak_estimate * 2;


    // Compute RER

    echo_word16_t RER;

    RER = (.0001f * Sxx + 3.f * st->leak_estimate * Syy) / See;

    if (RER < Sey * Sey / (1 + See * Syy)) RER = Sey * Sey / (1 + See * Syy);

    if (RER > .5f) RER = .5f;


    if (!st->adapted && st->sum_adapt > M &&

        st->leak_estimate * Syy > .03f * Syy) {

      st->adapted = 1;

    }


    if (st->adapted) {

      for (int i = 0; i <= st->frame_size; i++) {

        echo_word32_t r = st->leak_estimate * st->Yf[i];

        echo_word32_t e = st->Rf[i] + 1;

        if (r > .5f * e) r = .5f * e;

        r = .7f * r + .3f * (RER * e);

        st->power_1[i] = r / (e * (st->power[i] + 10));

      }

    } else {

      echo_word16_t adapt_rate = 0;

      if (Sxx > N * 1000.0f) {

        tmp32 = .25f * Sxx;

        if (tmp32 > .25f * See) tmp32 = .25f * See;

        adapt_rate = tmp32 / See;

      }

      for (int i = 0; i <= st->frame_size; i++)

        st->power_1[i] = adapt_rate / (st->power[i] + 10);

      st->sum_adapt = st->sum_adapt + adapt_rate;

    }


    std::memmove(st->last_y,

                 &st->last_y[st->frame_size],

                 st->frame_size * sizeof(echo_word16_t));

    if (st->adapted) {

      for (int i = 0; i < st->frame_size; i++)

        st->last_y[st->frame_size + i] = in[i] - out[i];

    }

  }


};


// ============================================================================

// FFT Implementation

// ============================================================================

template <typename Allocator>


inline void* echo_fft_init(int size, AudioFFTBase* driver, const Allocator& alloc) {

  if (!driver) {

    return nullptr;

  }


  // Configure FFT with the required size

  AudioFFTConfig cfg;

  cfg.length = size;

  cfg.rxtx_mode = TX_MODE;  // We need both FFT and IFFT capabilities


  if (!driver->begin(cfg)) {

    return nullptr;

  }

  return new fft_state<Allocator>(size, driver, alloc);

}


/**
 * @brief Destroy an FFT state and release its resources.
 *
 * Calls end() on the driver referenced by the state and then deletes the
 * state object itself. A null table is ignored.
 *
 * @param table Pointer to an fft_state<Allocator> (as void*), or nullptr.
 *              The Allocator template argument must match the type the state
 *              was created with, because the pointer is cast back to
 *              fft_state<Allocator> before deletion.
 */
template <typename Allocator = std::allocator<uint8_t>>
inline void echo_fft_destroy(void* table) {
  if (!table) return;

  auto* state = static_cast<fft_state<Allocator>*>(table);
  state->driver->end();
  delete state;
}


/**
 * @brief Perform a forward FFT through the configured driver.
 *
 * Loads N input samples (each divided by N) into the driver, runs the
 * transform and writes the result to out in packed layout:
 *   out[0]      = value read from the driver at index 0 (DC slot)
 *   out[2k-1]   = real part of bin k   for every k >= 1 with 2k < N
 *   out[2k]     = imaginary part of bin k
 *   out[N-1]    = value read from the driver at index N/2 (Nyquist slot)
 *
 * Does nothing when table or its driver is null.
 *
 * @param table Pointer to an fft_state<Allocator> (as void*).
 * @param in    Input buffer; N elements are read.
 * @param out   Output buffer; indices 0..N-1 are written.
 */
template <typename Allocator = std::allocator<uint8_t>>
inline void echo_fft(void* table, echo_word16_t* in,
                    echo_word16_t* out) {
  auto* state = static_cast<fft_state<Allocator>*>(table);
  if (state == nullptr || state->driver == nullptr) return;

  auto* fft = state->driver;
  const int len = state->N;

  // Feed the input, normalised by the transform length
  for (int n = 0; n < len; ++n) {
    fft->setValue(n, in[n] / (float)len);
  }

  // Run the forward transform
  fft->fft();

  // Pack the spectrum: DC slot first, then (real, imag) pairs per bin,
  // and the Nyquist slot last.
  out[0] = fft->getValue(0);
  for (int bin = 1; 2 * bin < len; ++bin) {
    float real, img;
    fft->getBin(bin, real, img);
    out[2 * bin - 1] = real;
    out[2 * bin] = img;
  }
  out[len - 1] = fft->getValue(len / 2);
}


/**
 * @brief Perform an inverse FFT through the configured driver.
 *
 * Reads a packed spectrum from in (in[0] = bin 0 real, in[2k-1]/in[2k] =
 * real/imaginary part of bin k, in[N-1] = bin N/2 real; bins 0 and N/2 are
 * set with a zero imaginary part), runs the driver's reverse transform and
 * copies N values from the driver into out.
 *
 * Does nothing when table or its driver is null, or when the driver reports
 * that it is not in reverse-FFT mode (isReverseFFT() returns false).
 *
 * @param table Pointer to an fft_state<Allocator> (as void*).
 * @param in    Packed spectrum; indices 0..N-1 are read.
 * @param out   Output buffer; N elements are written.
 */
template <typename Allocator = std::allocator<uint8_t>>
inline void echo_ifft(void* table, echo_word16_t* in,
                     echo_word16_t* out) {
  auto* state = static_cast<fft_state<Allocator>*>(table);
  if (state == nullptr) return;
  if (state->driver == nullptr) return;
  if (!state->driver->isReverseFFT()) return;

  auto* fft = state->driver;
  const int len = state->N;

  // Unpack the spectrum into the driver's bins
  fft->setBin(0, in[0], 0);
  for (int bin = 1; 2 * bin < len; ++bin) {
    fft->setBin(bin, in[2 * bin - 1], in[2 * bin]);
  }
  fft->setBin(len / 2, in[len - 1], 0);

  // Run the inverse transform
  fft->rfft();

  // Copy the result out of the driver
  for (int n = 0; n < len; ++n) {
    out[n] = fft->getValue(n);
  }
}


}  // namespace audio_tools

audio_tools::Allocator
Memory allocator which uses malloc.
Definition Allocator.h:23

audio_tools::AudioFFTBase
Executes FFT using audio data provided by write() and/or an inverse FFT where the samples are made ava...
Definition AudioFFT.h:191

audio_tools::AudioFFTBase::end
void end() override
Release the allocated memory.
Definition AudioFFT.h:285

audio_tools::AudioFFTBase::config
AudioFFTConfig & config()
Provides the actual configuration.
Definition AudioFFT.h:639

audio_tools::AudioFFTBase::driver
FFTDriver * driver()
Definition AudioFFT.h:551

audio_tools::AudioFFTBase::setBin
bool setBin(int idx, float real, float img)
sets the value of a bin
Definition AudioFFT.h:618

audio_tools::AudioFFTBase::begin
bool begin(AudioFFTConfig info)
starts the processing
Definition AudioFFT.h:207

audio_tools::AudioStream
Base class for all Audio Streams. It supports the boolean operator to test if the object is ready with...
Definition BaseStream.h:122

audio_tools::FFTDriver::fft
virtual void fft()=0
Perform FFT.

audio_tools::MDFEchoCancellation
Acoustic echo canceller using MDF algorithm.
Definition MDFEchoCancellation.h:508

audio_tools::MDFEchoCancellation::spectralMulAccum
void spectralMulAccum(const echo_word16_t *X, const echo_word32_t *Y, echo_word16_t *acc, int N, int M)
Accumulate spectral multiplication across multiple frames.
Definition MDFEchoCancellation.h:971

audio_tools::MDFEchoCancellation::getMicChannels
int getMicChannels()
Definition MDFEchoCancellation.h:759

audio_tools::echo_ifft
void echo_ifft(void *table, echo_word16_t *in, echo_word16_t *out)
Perform inverse FFT.
Definition MDFEchoCancellation.h:1613

audio_tools::MDFEchoCancellation::cancel
void cancel(const echo_int16_t *rec, const echo_int16_t *play, echo_int16_t *out)
Definition MDFEchoCancellation.h:575

audio_tools::MDFEchoCancellation::getSamplingRate
int getSamplingRate()
Definition MDFEchoCancellation.h:721

audio_tools::MDFEchoCancellation::mdfAdjustProp
void mdfAdjustProp(const echo_word32_t *W, int N, int M, int P, echo_word16_t *prop)
Adjust proportional adaptation weights.
Definition MDFEchoCancellation.h:1020

audio_tools::echo_fft
void echo_fft(void *table, echo_word16_t *in, echo_word16_t *out)
Perform forward FFT.
Definition MDFEchoCancellation.h:1577

audio_tools::fft_state::temp_real
std::vector< float, FloatAllocator > temp_real
Definition MDFEchoCancellation.h:456

audio_tools::MDFEchoCancellation::~MDFEchoCancellation
~MDFEchoCancellation()
Definition MDFEchoCancellation.h:532

audio_tools::MDFEchoCancellation::getImpulseResponse
void getImpulseResponse(echo_int32_t *response)
Definition MDFEchoCancellation.h:729

audio_tools::EchoState_::K
int K
Definition MDFEchoCancellation.h:388

audio_tools::MDFEchoCancellation::mdfInnerProd
echo_word32_t mdfInnerProd(const echo_word16_t *x, const echo_word16_t *y, int len)
Compute inner product of two vectors.
Definition MDFEchoCancellation.h:925

audio_tools::MDFEchoCancellation::setSpeakerChannels
void setSpeakerChannels(int num)
Definition MDFEchoCancellation.h:764

audio_tools::MDFEchoCancellation::fft_driver
AudioFFTBase * fft_driver
Definition MDFEchoCancellation.h:791

audio_tools::MDFEchoCancellation::setMicChannels
void setMicChannels(int num)
Definition MDFEchoCancellation.h:750

audio_tools::fft_state::driver
AudioFFTBase * driver
Definition MDFEchoCancellation.h:454

audio_tools::echo_fft_init
void * echo_fft_init(int size, AudioFFTBase *driver, const Allocator &alloc)
Initialize FFT state.
Definition MDFEchoCancellation.h:1538

audio_tools::MDFEchoCancellation::filterDcNotch16
void filterDcNotch16(const echo_int16_t *in, echo_word16_t radius, echo_word16_t *out, int len, echo_mem_t *mem, int stride)
Apply DC notch filter to remove DC offset.
Definition MDFEchoCancellation.h:905

audio_tools::fft_state::fft_state
fft_state(int size, AudioFFTBase *drv, const Allocator &alloc=Allocator())
Construct FFT state with specified size and driver.
Definition MDFEchoCancellation.h:465

audio_tools::MDFEchoCancellation::echoFree
void echoFree(T *ptr, size_t count=0)
Deallocate memory using custom allocator.
Definition MDFEchoCancellation.h:839

audio_tools::EchoState_::sampling_rate
echo_int32_t sampling_rate
Definition MDFEchoCancellation.h:389

audio_tools::MDFEchoCancellation::control
int control(int request, void *ptr)
Definition MDFEchoCancellation.h:675

audio_tools::MDFEchoCancellation::MDFEchoCancellation
MDFEchoCancellation(int filterLength, AudioFFTBase &fftDriver, const Allocator &alloc=Allocator())
Definition MDFEchoCancellation.h:515

audio_tools::fft_state::N
int N
Definition MDFEchoCancellation.h:455

audio_tools::MDFEchoCancellation::nb_speakers
int nb_speakers
Definition MDFEchoCancellation.h:795

audio_tools::MDFEchoCancellation::getFilterLength
int getFilterLength()
Definition MDFEchoCancellation.h:745

audio_tools::MDFEchoCancellation::ensureInitialized
void ensureInitialized()
Ensure echo canceller is initialized (lazy initialization)
Definition MDFEchoCancellation.h:801

audio_tools::echo_fft_destroy
void echo_fft_destroy(void *table)
Destroy FFT state and release resources.
Definition MDFEchoCancellation.h:1560

audio_tools::MDFEchoCancellation::setFilterLength
void setFilterLength(int len)
Definition MDFEchoCancellation.h:736

audio_tools::MDFEchoCancellation::playback
void playback(const echo_int16_t *play)
Definition MDFEchoCancellation.h:607

audio_tools::MDFEchoCancellation::getImpulseResponseSize
int getImpulseResponseSize()
Definition MDFEchoCancellation.h:724

audio_tools::MDFEchoCancellation::getFrameSize
int getFrameSize()
Definition MDFEchoCancellation.h:713

audio_tools::MDFEchoCancellation::powerSpectrum
void powerSpectrum(const echo_word16_t *X, echo_word32_t *ps, int N)
Compute power spectrum from FFT output.
Definition MDFEchoCancellation.h:940

audio_tools::MDFEchoCancellation::setSamplingRate
void setSamplingRate(int rate)
Definition MDFEchoCancellation.h:718

audio_tools::MDFEchoCancellation::getState
EchoState * getState()
Definition MDFEchoCancellation.h:787

audio_tools::MDFEchoCancellation::state
EchoState * state
Definition MDFEchoCancellation.h:790

audio_tools::MDFEchoCancellation::echoAlloc
T * echoAlloc(size_t count)
Allocate memory for array of type T using custom allocator.
Definition MDFEchoCancellation.h:821

audio_tools::MDFEchoCancellation::powerSpectrumAccum
void powerSpectrumAccum(const echo_word16_t *X, echo_word32_t *ps, int N)
Accumulate power spectrum from FFT output.
Definition MDFEchoCancellation.h:954

audio_tools::fft_state::temp_img
std::vector< float, FloatAllocator > temp_img
Definition MDFEchoCancellation.h:457

audio_tools::MDFEchoCancellation::capture
void capture(const echo_int16_t *rec, echo_int16_t *out)
Definition MDFEchoCancellation.h:585

audio_tools::MDFEchoCancellation::nb_mic
int nb_mic
Definition MDFEchoCancellation.h:794

audio_tools::fft_state::FloatAllocator
typename std::allocator_traits< Allocator >::template rebind_alloc< float > FloatAllocator
Definition MDFEchoCancellation.h:452

audio_tools::MDFEchoCancellation::setFFTDriver
void setFFTDriver(AudioFFTBase &fftDriver)
Definition MDFEchoCancellation.h:778

audio_tools::MDFEchoCancellation::reset
void reset()
Definition MDFEchoCancellation.h:629

audio_tools::EchoState_::frame_size
int frame_size
Definition MDFEchoCancellation.h:380

audio_tools::MDFEchoCancellation::MDFEchoCancellation
MDFEchoCancellation(int filterLength, int nbMic, int nbSpeakers, AudioFFTBase &fftDriver, const Allocator &alloc=Allocator())
Definition MDFEchoCancellation.h:526

audio_tools::MDFEchoCancellation::spxExp
float spxExp(float x)
Compute exponential function.
Definition MDFEchoCancellation.h:887

audio_tools::MDFEchoCancellation::weightedSpectralMulConj
void weightedSpectralMulConj(const echo_float_t *w, const echo_float_t p, const echo_word16_t *X, const echo_word16_t *Y, echo_word32_t *prod, int N)
Compute weighted spectral multiplication with conjugate.
Definition MDFEchoCancellation.h:996

audio_tools::MDFEchoCancellation::initialized
bool initialized
Definition MDFEchoCancellation.h:796

audio_tools::MDFEchoCancellation::getSpeakerChannels
int getSpeakerChannels()
Definition MDFEchoCancellation.h:773

audio_tools::MDFEchoCancellation::spxCos
float spxCos(float x)
Compute cosine function.
Definition MDFEchoCancellation.h:894

audio_tools::MDFEchoCancellation::echoStateInitMc
EchoState * echoStateInitMc(int frame_size, int filter_length, int nb_mic, int nb_speakers)
Initialize multi-channel echo canceller state.
Definition MDFEchoCancellation.h:1055

audio_tools::MDFEchoCancellation::echoCancellationImpl
void echoCancellationImpl(EchoState *st, const echo_int16_t *in, const echo_int16_t *far_end, echo_int16_t *out)
Core echo cancellation implementation.
Definition MDFEchoCancellation.h:1179

audio_tools::MDFEchoCancellation::allocator
Allocator allocator
Definition MDFEchoCancellation.h:792

audio_tools::MDFEchoCancellation::filter_length
int filter_length
Definition MDFEchoCancellation.h:793

audio_tools
Generic Implementation of sound input and output for desktop environments using portaudio.
Definition AudioCodecsBase.h:10

audio_tools::VAR1_UPDATE
static const echo_float_t VAR1_UPDATE
Definition MDFEchoCancellation.h:326

audio_tools::VAR2_SMOOTH
static const echo_float_t VAR2_SMOOTH
Definition MDFEchoCancellation.h:323

audio_tools::VAR2_UPDATE
static const echo_float_t VAR2_UPDATE
Definition MDFEchoCancellation.h:329

audio_tools::MIN_LEAK
static const echo_float_t MIN_LEAK
Definition MDFEchoCancellation.h:317

audio_tools::VAR1_SMOOTH
static const echo_float_t VAR1_SMOOTH
Definition MDFEchoCancellation.h:320

audio_tools::VAR_BACKTRACK
static const echo_float_t VAR_BACKTRACK
Definition MDFEchoCancellation.h:332

audio_tools::AudioFFTConfig
Configuration for AudioFFT. If there is more than 1 channel the channel_used is defining which chann...
Definition AudioFFT.h:40

audio_tools::AudioFFTConfig::rxtx_mode
RxTxMode rxtx_mode
TX_MODE = FFT, RX_MODE = IFFT.
Definition AudioFFT.h:59

audio_tools::EchoState_
Internal echo canceller state structure.
Definition MDFEchoCancellation.h:379

audio_tools::echo_float_t
Definition MDFEchoCancellation.h:173

audio_tools::fft_state
FFT state management structure with custom allocator support.
Definition MDFEchoCancellation.h:451