2011-03-02 07:37:39 -05:00
|
|
|
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
|
|
|
|
|
|
|
/*
    QM DSP Library

    Centre for Digital Music, Queen Mary, University of London.
    This file copyright 2005 Nicolas Chetry, copyright 2008 QMUL.

    This program is free software; you can redistribute it and/or
    modify it under the terms of the GNU General Public License as
    published by the Free Software Foundation; either version 2 of the
    License, or (at your option) any later version.  See the file
    COPYING included with this distribution for more information.
*/
|
|
|
|
|
|
|
|
#ifndef MFCC_H
|
|
|
|
#define MFCC_H
|
|
|
|
|
|
|
|
#include "base/Window.h"
|
|
|
|
|
|
|
|
class FFTReal;
|
|
|
|
|
|
|
|
struct MFCCConfig {
|
|
|
|
int FS;
|
|
|
|
int fftsize;
|
|
|
|
int nceps;
|
|
|
|
double logpower;
|
|
|
|
bool want_c0;
|
|
|
|
WindowType window;
|
|
|
|
MFCCConfig(int _FS) :
|
|
|
|
FS(_FS), fftsize(2048), nceps(19),
|
|
|
|
logpower(1.0), want_c0(true), window(HammingWindow) { }
|
|
|
|
};
|
|
|
|
|
|
|
|
class MFCC
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
MFCC(MFCCConfig config);
|
|
|
|
virtual ~MFCC();
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Process time-domain input data. inframe must contain
|
|
|
|
* getfftlength() samples. outceps must contain space for nceps
|
|
|
|
* values, plus one if want_c0 is specified.
|
|
|
|
*/
|
|
|
|
int process(const double *inframe, double *outceps);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Process time-domain input data. real and imag must contain
|
|
|
|
* getfftlength()/2+1 elements (i.e. the conjugate half of the FFT
|
|
|
|
* is not expected). outceps must contain space for nceps values,
|
|
|
|
* plus one if want_c0 is specified.
|
|
|
|
*/
|
|
|
|
int process(const double *real, const double *imag, double *outceps);
|
|
|
|
|
|
|
|
int getfftlength() const { return fftSize; }
|
|
|
|
|
|
|
|
private:
|
|
|
|
/* Filter bank parameters */
|
2016-10-05 18:16:44 -04:00
|
|
|
double lowestFrequency;
|
|
|
|
int linearFilters;
|
2011-03-02 07:37:39 -05:00
|
|
|
double linearSpacing;
|
|
|
|
int logFilters;
|
|
|
|
double logSpacing;
|
2016-10-05 18:16:44 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
/* FFT length */
|
|
|
|
int fftSize;
|
2016-10-05 18:16:44 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
int totalFilters;
|
|
|
|
double logPower;
|
2016-10-05 18:16:44 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
/* Misc. */
|
|
|
|
int samplingRate;
|
|
|
|
int nceps;
|
2016-10-05 18:16:44 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
/* MFCC vector */
|
|
|
|
double *ceps;
|
2016-10-05 18:16:44 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
double **mfccDCTMatrix;
|
|
|
|
double **mfccFilterWeights;
|
2016-10-05 18:16:44 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
/* The analysis window */
|
|
|
|
Window<double> *window;
|
2016-10-05 18:16:44 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
/* For the FFT */
|
|
|
|
double *realOut;
|
|
|
|
double *imagOut;
|
|
|
|
double *fftMag;
|
|
|
|
double *earMag;
|
|
|
|
FFTReal *fft;
|
|
|
|
|
|
|
|
/* Set if user want C0 */
|
|
|
|
int WANT_C0;
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|