OpenAudio_ArduinoLibrary/examples/FormantShifter_FD_OA/AudioEffectFormantShiftFD_O...

/* AudioEffectFormantShiiftFD_OA_F32.h
 * Demonstrate formant shifting via frequency domain processin.
 *
 * Created: Chip Audette (OpenAudio) March 2019
 * See FormantShifter_FD_OA.ino for notes.
 *
 * Adapt to OpenAudio Library  - Bob Larkin June 2020
 * MIT License.  Use at your own risk.
 */
#ifndef _AudioEffectFormantShiftFD_OA_F32_h
#define _AudioEffectFormantShiftFD_OA_F32_h

#include "AudioStream_F32.h"
#include <arm_math.h>
#include "FFT_Overlapped_OA_F32.h"

class AudioEffectFormantShiftFD_OA_F32 : public AudioStream_F32
{
  public:
    // constructors...a few different options.  The usual one should be:
    //   AudioEffectFormantShiftFD_OA_F32(const AudioSettings_F32 &settings, const int _N_FFT)
    AudioEffectFormantShiftFD_OA_F32(void) : AudioStream_F32(1, inputQueueArray_f32) { };
    AudioEffectFormantShiftFD_OA_F32(const AudioSettings_F32 &settings) :
      AudioStream_F32(1, inputQueueArray_f32) {
      sample_rate_Hz = settings.sample_rate_Hz;
    }
    AudioEffectFormantShiftFD_OA_F32(const AudioSettings_F32 &settings, const int _N_FFT) :
      AudioStream_F32(1, inputQueueArray_f32) {
      setup(settings, _N_FFT);
    }

    //destructor...release all of the memory that has been allocated
    ~AudioEffectFormantShiftFD_OA_F32(void) {
      if (complex_2N_buffer != NULL) delete complex_2N_buffer;
    }

    int setup(const AudioSettings_F32 &settings, const int _N_FFT) {
      sample_rate_Hz = settings.sample_rate_Hz;
      int N_FFT;

      //setup the FFT and IFFT.  If they return a negative FFT, it wasn't an allowed FFT size.
      N_FFT = myFFT.setup(settings, _N_FFT); //hopefully, we got the same N_FFT that we asked for
      if (N_FFT < 1) return N_FFT;
      N_FFT = myIFFT.setup(settings, _N_FFT); //hopefully, we got the same N_FFT that we asked for
      if (N_FFT < 1) return N_FFT;

      //decide windowing
      Serial.println("AudioEffectFormantShiftFD_OA_F32: setting myFFT to use hanning...");
      (myFFT.getFFTObject())->useHanningWindow(); //applied prior to FFT
      #if 1
        if (myIFFT.getNBuffBlocks() > 3) {
          Serial.println("AudioEffectFormantShiftFD_OA_F32: setting myIFFT to use hanning...");
          (myIFFT.getIFFTObject())->useHanningWindow(); //window again after IFFT
        }
      #endif

      //print info about setup
      Serial.println("AudioEffectFormantShiftFD_OA_F32: FFT parameters...");
      Serial.print("    : N_FFT = ");  Serial.println(N_FFT);
      Serial.print("    : audio_block_samples = ");  Serial.println(settings.audio_block_samples);
      Serial.print("    : FFT N_BUFF_BLOCKS = ");  Serial.println(myFFT.getNBuffBlocks());
      Serial.print("    : IFFT N_BUFF_BLOCKS = ");  Serial.println(myIFFT.getNBuffBlocks());
      Serial.print("    : FFT use window = ");  Serial.println(myFFT.getFFTObject()->get_flagUseWindow());
      Serial.print("    : IFFT use window = ");  Serial.println((myIFFT.getIFFTObject())->get_flagUseWindow());

      //allocate memory to hold frequency domain data
      complex_2N_buffer = new float32_t[2 * N_FFT];

      //we're done.  return!
      enabled = 1;
      return N_FFT;
    }

    float setScaleFactor(float scale_fac) {
      if (scale_fac < 0.00001) scale_fac = 0.00001;
      return shift_scale_fac = scale_fac;
    }
    float getScaleFactor(void) {
      return shift_scale_fac;
    }

    virtual void update(void);

  private:
    int enabled = 0;
    float32_t *complex_2N_buffer;
    audio_block_f32_t *inputQueueArray_f32[1];
    FFT_Overlapped_OA_F32 myFFT;
    IFFT_Overlapped_OA_F32 myIFFT;
    float lowpass_freq_Hz = 1000.f;
    float sample_rate_Hz = AUDIO_SAMPLE_RATE;
    float shift_scale_fac = 1.0; //how much to shift formants (frequency multiplier).  1.0 is no shift
};


void AudioEffectFormantShiftFD_OA_F32::update(void)
{
  //get a pointer to the latest data
  audio_block_f32_t *in_audio_block = AudioStream_F32::receiveReadOnly_f32();
  if (!in_audio_block) return;

  //simply return the audio if this class hasn't been enabled
  if (!enabled) {
    AudioStream_F32::transmit(in_audio_block);
    AudioStream_F32::release(in_audio_block);
    return;
  }

  //convert to frequency domain
  myFFT.execute(in_audio_block, complex_2N_buffer);
  AudioStream_F32::release(in_audio_block);  //We just passed ownership to myFFT, so release it here.

  // ////////////// Do your processing here!!!

  //define some variables
  int fftSize = myFFT.getNFFT();
  int N_2 = fftSize / 2 + 1;
  int source_ind; // neg_dest_ind;
  float source_ind_float, interp_fac;
  float new_mag, scale;
  float orig_mag[N_2];
  //int max_source_ind = (int)(((float)N_2) * (10000.0 / (48000.0 / 2.0))); //highest frequency bin to grab from (Assuming 48kHz sample rate)

  #if 1
    float max_source_Hz = 10000.0; //highest frequency to use as source data
    int max_source_ind = min(int(max_source_Hz / sample_rate_Hz * fftSize + 0.5),N_2);
  #else
    int max_source_ind = N_2;  //this line causes this feature to be defeated
  #endif

  //get the magnitude for each FFT bin and store somewhere safes
  arm_cmplx_mag_f32(complex_2N_buffer, orig_mag, N_2);

  //now, loop over each bin and compute the new magnitude based on shifting the formants
  for (int dest_ind = 1; dest_ind < N_2; dest_ind++) { //don't start at zero bin, keep it at its original

    //what is the source bin for the new magnitude for this current destination bin
    source_ind_float = (((float)dest_ind) / shift_scale_fac) + 0.5;
    //source_ind = (int)(source_ind_float+0.5);  //no interpolation but round to the neariest index
    //source_ind = min(max(source_ind,1),N_2-1);
    source_ind = min(max(1, (int)source_ind_float), N_2 - 2); //Chip: why -2 and not -1?  Because later, for for the interpolation, we do a +1 and we want to stay within nyquist
    interp_fac = source_ind_float - (float)source_ind;
    interp_fac = max(0.0, interp_fac);  //this will be used in the interpolation in a few lines

    //what is the new magnitude
    new_mag = 0.0; scale = 0.0;
    if (source_ind < max_source_ind) {

      //interpolate in the original magnitude vector to find the new magnitude that we want
      //new_mag=orig_mag[source_ind];  //the magnitude that we desire
      //scale = new_mag / orig_mag[dest_ind];//compute the scale factor
      new_mag = orig_mag[source_ind];
      new_mag += interp_fac * (orig_mag[source_ind] - orig_mag[source_ind + 1]);
      scale = new_mag / orig_mag[dest_ind];

      //apply scale factor
      complex_2N_buffer[2 * dest_ind] *= scale; //real
      complex_2N_buffer[2 * dest_ind + 1] *= scale; //imaginary
    } else {
      complex_2N_buffer[2 * dest_ind] = 0.0; //real
      complex_2N_buffer[2 * dest_ind + 1] = 0.0; //imaginary
    }

    //zero out the lowest bin
    complex_2N_buffer[0] = 0.0; //real
    complex_2N_buffer[1] = 0.0; //imaginary
  }

  //rebuild the negative frequency space
  myFFT.rebuildNegativeFrequencySpace(complex_2N_buffer); //set the negative frequency space based on the positive


  // ///////////// End do your processing here

  //call the IFFT
  audio_block_f32_t *out_audio_block = myIFFT.execute(complex_2N_buffer); //out_block is pre-allocated in here.


  //send the returned audio block.  Don't issue the release command here because myIFFT will re-use it
  AudioStream_F32::transmit(out_audio_block); //don't release this buffer because myIFFT re-uses it within its own code
  return;
};
#endif