2011-03-02 07:37:39 -05:00
|
|
|
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
|
|
|
|
|
|
|
/*
|
|
|
|
* ClusterMeltSegmenter.h
|
|
|
|
*
|
|
|
|
* Created by Mark Levy on 23/03/2006.
|
|
|
|
* Copyright 2006 Centre for Digital Music, Queen Mary, University of London.
|
|
|
|
|
|
|
|
This program is free software; you can redistribute it and/or
|
|
|
|
modify it under the terms of the GNU General Public License as
|
|
|
|
published by the Free Software Foundation; either version 2 of the
|
|
|
|
License, or (at your option) any later version. See the file
|
|
|
|
COPYING included with this distribution for more information.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
#include "segment.h"
|
|
|
|
#include "Segmenter.h"
|
|
|
|
#include "hmm/hmm.h"
|
|
|
|
#include "base/Window.h"
|
|
|
|
|
|
|
|
using std::vector;
|
|
|
|
|
|
|
|
// Forward declarations: this header only holds these types through
// pointers, so their full definitions are not needed here.
class ConstantQ;
class Decimator;
class FFTReal;
class MFCC;
|
|
|
|
|
|
|
|
class ClusterMeltSegmenterParams
|
|
|
|
// defaults are sensible for 11025Hz with 0.2 second hopsize
|
|
|
|
{
|
|
|
|
public:
|
2015-10-04 14:51:05 -04:00
|
|
|
ClusterMeltSegmenterParams() :
|
2011-03-02 07:37:39 -05:00
|
|
|
featureType(FEATURE_TYPE_CONSTQ),
|
|
|
|
hopSize(0.2),
|
|
|
|
windowSize(0.6),
|
|
|
|
fmin(62),
|
2015-10-04 14:51:05 -04:00
|
|
|
fmax(16000),
|
2011-03-02 07:37:39 -05:00
|
|
|
nbins(8),
|
|
|
|
ncomponents(20),
|
|
|
|
nHMMStates(40),
|
|
|
|
nclusters(10),
|
|
|
|
histogramLength(15),
|
|
|
|
neighbourhoodLimit(20) { }
|
|
|
|
feature_types featureType;
|
|
|
|
double hopSize; // in secs
|
|
|
|
double windowSize; // in secs
|
|
|
|
int fmin;
|
|
|
|
int fmax;
|
|
|
|
int nbins;
|
|
|
|
int ncomponents;
|
|
|
|
int nHMMStates;
|
|
|
|
int nclusters;
|
|
|
|
int histogramLength;
|
|
|
|
int neighbourhoodLimit;
|
|
|
|
};
|
|
|
|
|
|
|
|
class ClusterMeltSegmenter : public Segmenter
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
ClusterMeltSegmenter(ClusterMeltSegmenterParams params);
|
|
|
|
virtual ~ClusterMeltSegmenter();
|
|
|
|
virtual void initialise(int samplerate);
|
|
|
|
virtual int getWindowsize();
|
|
|
|
virtual int getHopsize();
|
|
|
|
virtual void extractFeatures(const double* samples, int nsamples);
|
|
|
|
void setFeatures(const vector<vector<double> >& f); // provide the features yourself
|
|
|
|
virtual void segment(); // segment into default number of segment-types
|
|
|
|
void segment(int m); // segment into m segment-types
|
|
|
|
int getNSegmentTypes() { return nclusters; }
|
|
|
|
|
|
|
|
protected:
|
|
|
|
void makeSegmentation(int* q, int len);
|
2015-10-05 10:17:49 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
void extractFeaturesConstQ(const double *, int);
|
|
|
|
void extractFeaturesMFCC(const double *, int);
|
|
|
|
|
|
|
|
Window<double> *window;
|
|
|
|
FFTReal *fft;
|
2015-10-04 14:51:05 -04:00
|
|
|
ConstantQ* constq;
|
2011-03-02 07:37:39 -05:00
|
|
|
MFCC* mfcc;
|
|
|
|
model_t* model; // the HMM
|
|
|
|
int* q; // the decoded HMM state sequence
|
2015-10-05 10:17:49 -04:00
|
|
|
vector<vector<double> > histograms;
|
2015-10-04 14:51:05 -04:00
|
|
|
|
2015-10-05 10:17:49 -04:00
|
|
|
feature_types featureType;
|
2011-03-02 07:37:39 -05:00
|
|
|
double hopSize; // in seconds
|
|
|
|
double windowSize; // in seconds
|
2015-10-04 14:51:05 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
// constant-Q parameters
|
|
|
|
int fmin;
|
|
|
|
int fmax;
|
|
|
|
int nbins;
|
|
|
|
int ncoeff;
|
2015-10-04 14:51:05 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
// PCA parameters
|
|
|
|
int ncomponents;
|
2015-10-04 14:51:05 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
// HMM parameters
|
|
|
|
int nHMMStates;
|
2015-10-04 14:51:05 -04:00
|
|
|
|
2011-03-02 07:37:39 -05:00
|
|
|
// clustering parameters
|
|
|
|
int nclusters;
|
|
|
|
int histogramLength;
|
|
|
|
int neighbourhoodLimit;
|
|
|
|
|
|
|
|
Decimator *decimator;
|
|
|
|
};
|