WSOLA_8H_source.html

 /* Copyright 2000-2018 Matt Flax <flatmax@flatmax.org>
    This file is part of GTK+ IOStream class set

    GTK+ IOStream is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    GTK+ IOStream is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You have received a copy of the GNU General Public License
    along with GTK+ IOStream
  */
 #ifndef WSOLA_H_
 #define WSOLA_H_

 #include "config.h"
 #ifdef HAVE_EMSCRIPTEN
 #include <emscripten/bind.h>
 #endif

 #ifdef _MSC_VER
 // Visual C++ compatibility shim.
 // MS_ROUND is still defined for every MSVC build, exactly as before.
 // NOTE(review): if other code reads MS_ROUND as "round() is supplied by this
 // header", confirm it copes with newer compilers where the CRT supplies it.
 #define MS_ROUND
 // Ask <math.h> to expose the M_PI family of constants.
 #define _USE_MATH_DEFINES
 #include <math.h>

 #if _MSC_VER < 1800
 /** Fallback round() for Visual C++ releases older than Visual Studio 2013
     (_MSC_VER 1800), whose <math.h> does not declare round().
     Newer releases ship their own round(), so defining another one here would clash.
     Declared inline because this header may be included by several translation units.
     \param number The value to round
     \return number rounded to the nearest integer, halfway cases away from zero
 */
 inline double round(double number) {
     return number < 0.0 ? ceil(number - 0.5) : floor(number + 0.5);
 }
 #endif // _MSC_VER < 1800
 #endif // _MSC_VER

 #include <Debug.H>

 // WSOLA error codes. Each one is a fixed negative index added to
 // WSOLA_ERROR_OFFSET, which is not defined in this header (presumably it comes
 // from Debug.H - confirm). The expansions are parenthesised so that the codes
 // keep their value inside larger expressions such as -CODE or 2*CODE.
 /// Occurs when BUFF_SIZE is not divisible by 2
 #define WSOLA_MOD2_ERROR (-10+WSOLA_ERROR_OFFSET)
 /// Occurs when jack wants to process nframes which is not divisible by N/2
 #define WSOLA_NFRAMES_JACK_ERROR (-11+WSOLA_ERROR_OFFSET)
 /// Occurs when trying to access a row > the input or output Array rows
 #define WSOLA_ROWS_ERROR (-12+WSOLA_ERROR_OFFSET)
 /// Occurs when trying to access a col > the input or output Array cols
 #define WSOLA_COLS_ERROR (-13+WSOLA_ERROR_OFFSET)


 class WSOLADebug : virtual public Debug {
 public:
     WSOLADebug() {
 #ifndef NDEBUG
         errors[WSOLA_MOD2_ERROR]=std::string("Developer error : BUFF_SIZE must be divisible by 2. ");
         errors[WSOLA_NFRAMES_JACK_ERROR]=std::string("Jack nframes request error : Jack wants to process a number of frames which WSOLA can't handle. ");
         errors[WSOLA_ROWS_ERROR]=std::string("Row request error : You are trying to access beyond the end of the array. ");
         errors[WSOLA_COLS_ERROR]=std::string("Col request error : You are trying to access beyond the end of the array. ");
 #endif
     }

     virtual ~WSOLADebug() {}
 };

 #include <Eigen/Dense>
 using namespace Eigen;

 /// The floating point type used for the audio sample arrays
 typedef float FP_TYPE;

 /// Default sample rate (presumably in Hz, matching WSOLA::fs - confirm)
 #define FS_DEFAULT 48000.
 /// NOTE(review): presumably the window duration in seconds - confirm against its use in the implementation file
 #define TAU 0.02

 /// Default channel count
 #define DEFAULT_CH_CNT 1

 /// Presumably the default for WSOLA::M, the number of windows in the search buffer - confirm.
 /// No trailing semicolon, so the macro is usable inside expressions and argument lists.
 #define M_DEFAULT 3


 /** Time scale modification of audio (WSOLA).
     Audio is held with one channel per row. Each call to process() shifts
     inputSamplesRequired new samples per channel into the internal buffer, runs
     processInner() and reports how many input samples the following call needs.
     The methods which are only declared here are defined outside this header.
 */
 class WSOLA {

     float fs; ///< The sample rate in Hz

     int N; ///< The size of the window
     int NO2; ///< Half the window size
     int M; ///< The number of windows in the search buffer
     int m; ///< The current row index into the buffer
     double rem; ///< The remainder fraction of a sample to remember for next time (can't move on by fractions of a sample)

     Array<FP_TYPE, Dynamic , Dynamic> buffer; ///< The buffer of audio, each channel on its own row

     Array<FP_TYPE, Dynamic, Dynamic> wnd; ///< The overlap add window

     Array<FP_TYPE, Dynamic, Dynamic> nextOutput; ///< The output vector to search for, each channel per row

     Array<FP_TYPE, Dynamic, Dynamic> simComp; ///< Temporary vector used for computation

     /** Search a buffer for the best match (defined outside this header).
         \param buffer The audio to search
     */
     template<typename Derived>
     int findSimilarityInBuffer(const DenseBase<Derived> &buffer);

     /** Measure how far a candidate segment is from nextOutput.
         The candidate is copied into simComp, multiplied element-wise by wnd,
         and the norm of (nextOutput - simComp) is returned.
         \param outputIn The candidate segment
         \return The distance measure, smaller means more similar
     */
     template<typename Derived>
     FP_TYPE findSimilarity(const ArrayBase<Derived> &outputIn) {
         simComp=outputIn;
         simComp*=wnd;
         return rms(nextOutput-simComp);
     }

     /** Find the magnitude of a signal.
         Despite the name, this returns the norm of s, sqrt(sum(s.^2)), and not
         sqrt(mean(s.^2)) : the sum is not divided by the number of elements.
         \param s The signal to measure
         \return The norm of s
     */
     template<typename Derived>
     FP_TYPE rms(const ArrayBase<Derived> &s) {
         return s.matrix().norm();
     }

     /// Overlap add window handling (defined outside this header)
     void OLAWnd(void);

     int inputSamplesRequired; ///< The number of audio samples required for the next call to process

     /// Initialisation (defined outside this header)
     void init(void);
 public:

     Array<FP_TYPE, Dynamic, Dynamic> output; ///< The output vector, each row is a channel
     Array<FP_TYPE, Dynamic, Dynamic> input; ///< The input vector, each row is a channel

     /// Constructor (defined outside this header)
     WSOLA();

     /** Constructor (defined outside this header)
         \param chCnt Presumably the number of audio channels - confirm
     */
     WSOLA(int chCnt);

     /// Destructor
     virtual ~WSOLA();

 #ifdef HAVE_EMSCRIPTEN
     /** Run process() using the member input array as the source of new samples.
         \param timeScale Passed straight through to process
         \return The number of input samples required for the next call
     */
     int processOurInput(FP_TYPE timeScale) {
         return process(timeScale, input);
     }
 #endif

     /** Load new audio, process one frame and work out how much audio is needed next.
         \param timeScale Scales the NO2 sample advance used to find the next input size
         \param input The new audio, at least buffer.rows() rows by inputSamplesRequired columns are read
         \return The number of input samples required for the next call
     */
     template<typename Derived>
     int process(FP_TYPE timeScale, const DenseBase<Derived> &input) {
         const int chCnt=buffer.rows();
         const int keepCnt=static_cast<int>(buffer.cols())-inputSamplesRequired; // columns which survive the shift

         // shift the buffer on, discarding the oldest inputSamplesRequired columns
         // NOTE(review): the source and destination blocks overlap whenever keepCnt > inputSamplesRequired
         // and Eigen does not check blocks for aliasing - confirm the copy order keeps this safe.
         buffer.block(0,0,chCnt,keepCnt)=buffer.block(0,inputSamplesRequired,chCnt,keepCnt);
         // load the required input samples into the end of the buffer
         buffer.block(0,keepCnt,chCnt,inputSamplesRequired)=input.block(0,0,chCnt,inputSamplesRequired);

         processInner(); // do the inner processing

         // shift on by the ratio of N/2, carrying the fraction of a sample left over from last time
         double shiftOn=timeScale*NO2+rem;
         inputSamplesRequired=static_cast<int>(round(shiftOn));
         rem=shiftOn-static_cast<double>(inputSamplesRequired); // the fraction of a sample to carry into the next call
         return inputSamplesRequired;
     }

     /// The processing run by process once the buffer is loaded (defined outside this header)
     void processInner(void);

     /** Find the largest number of input samples reported by this class.
         \return NO2*(M+2)
     */
     int getMaxInputSamplesRequired(void) const {
         return NO2*(M+2);
     }

     /** Find the number of audio samples required for the next call to process.
         \return inputSamplesRequired
     */
     int getSamplesRequired(void) const {
         return inputSamplesRequired;
     }

     /** Find the output size.
         \return NO2, half the window size
     */
     int getOutputSize(void) const {
         return NO2;
     }

     /** Reset (defined outside this header)
         \param chCnt Presumably the number of audio channels - confirm
     */
     void reset(int chCnt);

     /** Reduce inputSamplesRequired by NO2.
         NOTE(review): presumably called when the input is exhausted - confirm with the callers.
         \return The new value of inputSamplesRequired
     */
     int noMoreAudio(){
         return inputSamplesRequired-=NO2;
     }

     /** Load a value into the input (defined outside this header).
         NOTE(review): n and m presumably index the input array - confirm which is row and which is column.
     */
     int loadInput(int n, int m, FP_TYPE val);

     /** Read a value from the output (defined outside this header).
         NOTE(review): n and m presumably index the output array - confirm which is row and which is column.
     */
     FP_TYPE unloadOutput(int n, int m);

     /** Set the sample rate (defined outside this header).
         \param fsIn Presumably the new sample rate in Hz - confirm
     */
     void setFS(float fsIn);

 };

 #endif // WSOLA_H_
WSOLA::inputSamplesRequired
int inputSamplesRequired
The number of audio samples required for the next call to process.
Definition: WSOLA.H:134

WSOLA::NO2
int NO2
Half the window size.
Definition: WSOLA.H:87

WSOLA::N
int N
The size of the window.
Definition: WSOLA.H:86

WSOLA_COLS_ERROR
#define WSOLA_COLS_ERROR
Occurs when trying to access a col > the input or output Array cols.
Definition: WSOLA.H:43

Debug.H

Eigen

config.h

WSOLA::nextOutput
Array< FP_TYPE, Dynamic, Dynamic > nextOutput
The output vector to search for, each channel per row.
Definition: WSOLA.H:96

WSOLADebug::WSOLADebug
WSOLADebug()
Definition: WSOLA.H:51

WSOLA::rem
double rem
The remainder fraction of a sample to remember for next time (can't move on by fractions of a sample)...
Definition: WSOLA.H:90

WSOLA::m
int m
The current row index into the buffer.
Definition: WSOLA.H:89

Debug::errors
std::map< int, std::string > errors
This will contain a map between error numbers and descriptive std::strings for the errors...
Definition: Debug.H:115

WSOLA::simComp
Array< FP_TYPE, Dynamic, Dynamic > simComp
Temporary vector used for computation.
Definition: WSOLA.H:98

WSOLA::rms
FP_TYPE rms(const ArrayBase< Derived > &s)
Definition: WSOLA.H:124

WSOLA_ROWS_ERROR
#define WSOLA_ROWS_ERROR
Occurs when trying to access a row > the input or output Array rows.
Definition: WSOLA.H:42

WSOLA::noMoreAudio
int noMoreAudio()
Definition: WSOLA.H:233

WSOLA::wnd
Array< FP_TYPE, Dynamic, Dynamic > wnd
The overlap add window.
Definition: WSOLA.H:94

WSOLA::findSimilarity
FP_TYPE findSimilarity(const ArrayBase< Derived > &outputIn)
Definition: WSOLA.H:112

WSOLA::getSamplesRequired
int getSamplesRequired(void)
Definition: WSOLA.H:214

FP_TYPE
float FP_TYPE
The floating point type to use if not previously declared.
Definition: WSOLA.H:67

WSOLA::input
Array< FP_TYPE, Dynamic, Dynamic > input
The input vector, each row is a channel.
Definition: WSOLA.H:142

WSOLA::output
Array< FP_TYPE, Dynamic, Dynamic > output
The output vector, each row is a channel.
Definition: WSOLA.H:141

Array< FP_TYPE, Dynamic, Dynamic >

round
double precision function round(x)
Definition: round.f:2

WSOLA_MOD2_ERROR
#define WSOLA_MOD2_ERROR
Occurs when BUFF_SIZE is not divisible by 2. Provided by GTKIOStream on sf.net.
Definition: WSOLA.H:40

WSOLA_NFRAMES_JACK_ERROR
#define WSOLA_NFRAMES_JACK_ERROR
Occurs when jack wants to process nframes which is not divisible by N/2.
Definition: WSOLA.H:41

Debug
Definition: Debug.H:112

WSOLA::process
int process(FP_TYPE timeScale, const DenseBase< Derived > &input)
Definition: WSOLA.H:169

WSOLADebug::~WSOLADebug
virtual ~WSOLADebug()
Destructor.
Definition: WSOLA.H:61

WSOLA::getMaxInputSamplesRequired
int getMaxInputSamplesRequired(void)
Definition: WSOLA.H:207

WSOLA::M
int M
The number of windows in the search buffer.
Definition: WSOLA.H:88

WSOLA
Definition: WSOLA.H:82

WSOLA::getOutputSize
int getOutputSize(void)
Definition: WSOLA.H:220

WSOLA::fs
float fs
The sample rate in Hz.
Definition: WSOLA.H:84

WSOLA::buffer
Array< FP_TYPE, Dynamic, Dynamic > buffer
The buffer of audio, each channel on its own row.
Definition: WSOLA.H:92

WSOLADebug
Definition: WSOLA.H:47