api/0.2.5/_k_means_quantizer_8cpp_source.html

 /*
 GRT MIT License
 Copyright (c) <2012> <Nicholas Gillian, Media Lab, MIT>

 Permission is hereby granted, free of charge, to any person obtaining a copy of this software
 and associated documentation files (the "Software"), to deal in the Software without restriction,
 including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense,
 and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so,
 subject to the following conditions:

 The above copyright notice and this permission notice shall be included in all copies or substantial
 portions of the Software.

 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT
 LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
 IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
 WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */

 #define GRT_DLL_EXPORTS
 #include "KMeansQuantizer.h"

 GRT_BEGIN_NAMESPACE

 //Define the string that will be used to identify the object.
 //getId() returns this string; it is also passed to the FeatureExtraction base
 //class constructor by both KMeansQuantizer constructors.
 std::string KMeansQuantizer::id = "KMeansQuantizer";
 std::string KMeansQuantizer::getId() { return KMeansQuantizer::id; }

 //Register your module with the FeatureExtraction base class.
 //NOTE: registerModule is initialized with getId(), which reads the static id above,
 //so this definition must stay after the definition of id in this file.
 RegisterFeatureExtractionModule< KMeansQuantizer > KMeansQuantizer::registerModule( KMeansQuantizer::getId() );

 //Constructs an untrained quantizer.
 //@param numClusters: the number of clusters stored for later use by train_
 KMeansQuantizer::KMeansQuantizer(const UINT numClusters)
     : FeatureExtraction( KMeansQuantizer::getId() )
 {
     //Only the cluster count is stored here; the model itself is built by train_
     this->numClusters = numClusters;
 }

 //Copy constructor.
 //@param rhs: the instance whose settings and model are copied into this instance
 KMeansQuantizer::KMeansQuantizer(const KMeansQuantizer &rhs)
     : FeatureExtraction( KMeansQuantizer::getId() )
 {
     //Delegate to the assignment operator so the copy logic lives in one place
     operator=( rhs );
 }

 //Destructor: intentionally empty, this function body performs no explicit cleanup.
 KMeansQuantizer::~KMeansQuantizer()
 {
 }

 //Assignment operator: copies the quantizer settings, the cluster model and the
 //FeatureExtraction base variables from rhs into this instance.
 //@param rhs: the instance to copy from
 //@return a reference to this instance
 KMeansQuantizer& KMeansQuantizer::operator=(const KMeansQuantizer &rhs){
     //Self-assignment is a no-op
     if( this == &rhs ) return *this;

     //Copy any class variables from the rhs instance to this instance
     this->numClusters = rhs.numClusters;
     this->clusters = rhs.clusters;
     this->quantizationDistances = rhs.quantizationDistances;

     //Copy the base variables. copyBaseVariables takes a pointer-to-const, so the
     //upcast keeps rhs const instead of stripping it with a C-style cast.
     copyBaseVariables( static_cast<const FeatureExtraction*>(&rhs) );

     return *this;
 }

 bool KMeansQuantizer::deepCopyFrom(const FeatureExtraction *featureExtraction){

  if( featureExtraction == NULL ) return false;

  if( this->getId() == featureExtraction->getId() ){

  //Cast the feature extraction pointer to a pointer to your custom feature extraction module
  //Then invoke the equals operator
  *this = *dynamic_cast<const KMeansQuantizer*>(featureExtraction);

  return true;
  }

  errorLog << "deepCopyFrom(FeatureExtraction *featureExtraction) - FeatureExtraction Types Do Not Match!" << std::endl;

  return false;
 }

 bool KMeansQuantizer::computeFeatures(const VectorFloat &inputVector){

  //Run the quantize algorithm
  quantize( inputVector );

  return true;
 }

 //Resets the module: calls the base class reset and, if a model has been trained,
 //zeroes the per-cluster quantization distances.
 //@return always true
 bool KMeansQuantizer::reset(){

     FeatureExtraction::reset();

     //Nothing else to reset until a model exists
     if( !trained ) return true;

     std::fill( quantizationDistances.begin(), quantizationDistances.end(), 0 );
     return true;
 }

 //Clears the module: calls the base class clear and discards the cluster model
 //and the quantization distances.
 //@return always true
 bool KMeansQuantizer::clear(){

     FeatureExtraction::clear();

     //Each container only needs to be cleared once
     clusters.clear();
     quantizationDistances.clear();

     return true;
 }

 bool KMeansQuantizer::save( std::fstream &file ) const{

  if( !file.is_open() ){
  errorLog << "save(fstream &file) - The file is not open!" << std::endl;
  return false;
  }

  //Save the header
  file << "KMEANS_QUANTIZER_FILE_V1.0" << std::endl;

  //Save the feature extraction base class settings
  if( !saveFeatureExtractionSettingsToFile( file ) ){
  errorLog << "save(fstream &file) - Failed to save base feature extraction settings to file!" << std::endl;
  return false;
  }

  //Save the KMeansQuantizer settings
  file << "QuantizerTrained: " << trained << std::endl;
  file << "NumClusters: " << numClusters << std::endl;

  if( trained ){
  file << "Clusters: \n";
  for(UINT k=0; k<numClusters; k++){
  for(UINT j=0; j<numInputDimensions; j++){
  file << clusters[k][j];
  if( j != numInputDimensions-1 ) file << "\t";
  else file << std::endl;
  }
  }
  }

  return true;
 }

 //Loads the quantizer settings (and the cluster table, if trained) from a file stream.
 //The expected layout is the one written by save: header, base feature extraction
 //settings, QuantizerTrained, NumClusters and, for a trained model, the Clusters table.
 //@param file: the stream to read from; it must already be open
 //@return true if everything was read successfully, false otherwise
 bool KMeansQuantizer::load( std::fstream &file ){

     //Clear any previously built model and settings
     clear();

     if( !file.is_open() ){
         errorLog << "load(fstream &file) - The file is not open!" << std::endl;
         return false;
     }

     std::string word;

     //First, read and validate the header
     file >> word;
     if( word != "KMEANS_QUANTIZER_FILE_V1.0" ){
         errorLog << "load(fstream &file) - Invalid file format!" << std::endl;
         return false;
     }

     //Second, load the base feature extraction settings from the file
     if( !loadFeatureExtractionSettingsFromFile( file ) ){
         errorLog << "loadFeatureExtractionSettingsFromFile(fstream &file) - Failed to load base feature extraction settings from file!" << std::endl;
         return false;
     }

     file >> word;
     if( word != "QuantizerTrained:" ){
         errorLog << "load(fstream &file) - Failed to load QuantizerTrained!" << std::endl;
         return false;
     }
     file >> trained;

     file >> word;
     if( word != "NumClusters:" ){
         errorLog << "load(fstream &file) - Failed to load NumClusters!" << std::endl;
         return false;
     }
     file >> numClusters;

     //A failed extraction only sets the stream's fail state, so check it explicitly
     //rather than continuing with values that were never read
     if( file.fail() ){
         errorLog << "load(fstream &file) - Failed to read the QuantizerTrained or NumClusters value!" << std::endl;
         clear();
         return false;
     }

     if( trained ){
         clusters.resize(numClusters, numInputDimensions);
         file >> word;
         if( word != "Clusters:" ){
             errorLog << "load(fstream &file) - Failed to load Clusters!" << std::endl;
             return false;
         }

         for(UINT k=0; k<numClusters; k++){
             for(UINT j=0; j<numInputDimensions; j++){
                 file >> clusters[k][j];
             }
         }

         //Reject a truncated or corrupt cluster table instead of keeping partial data
         if( file.fail() ){
             errorLog << "load(fstream &file) - Failed to read the cluster values!" << std::endl;
             clear();
             return false;
         }

         initialized = true;
         featureDataReady = false;
         quantizationDistances.resize(numClusters,0);
     }

     return true;
 }

 //Trains the quantizer from labelled classification data.
 //@param trainingData: the dataset; it is converted to a MatrixFloat and passed to train
 //@return the result of train
 bool KMeansQuantizer::train_(ClassificationData &trainingData){
     MatrixFloat samples = trainingData.getDataAsMatrixFloat();
     return train( samples );
 }

 //Trains the quantizer from labelled time series data.
 //@param trainingData: the dataset; it is converted to a MatrixFloat and passed to train
 //@return the result of train
 bool KMeansQuantizer::train_(TimeSeriesClassificationData &trainingData){
     MatrixFloat samples = trainingData.getDataAsMatrixFloat();
     return train( samples );
 }

 //Trains the quantizer from a classification data stream.
 //@param trainingData: the dataset; it is converted to a MatrixFloat and passed to train
 //@return the result of train
 bool KMeansQuantizer::train_(ClassificationDataStream &trainingData){
     MatrixFloat samples = trainingData.getDataAsMatrixFloat();
     return train( samples );
 }

 //Trains the quantizer from unlabelled data.
 //@param trainingData: the dataset; it is converted to a MatrixFloat and passed to train
 //@return the result of train
 bool KMeansQuantizer::train_(UnlabelledData &trainingData){
     MatrixFloat samples = trainingData.getDataAsMatrixFloat();
     return train( samples );
 }

 //Trains the quantizer by running KMeans on the given data and keeping the resulting clusters.
 //@param trainingData: the training samples; the number of columns becomes the input dimensionality
 //@return true if the KMeans model was trained, false otherwise
 bool KMeansQuantizer::train_(MatrixFloat &trainingData){

     //Start from a clean state
     clear();

     //Configure the clusterer from this module's settings
     KMeans clusterer;
     clusterer.setNumClusters(numClusters);
     clusterer.setComputeTheta( true );
     clusterer.setMinChange( minChange );
     clusterer.setMinNumEpochs( minNumEpochs );
     clusterer.setMaxNumEpochs( maxNumEpochs );

     const bool clustererTrained = clusterer.train_(trainingData);
     if( !clustererTrained ){
         errorLog << "train_(MatrixFloat &trainingData) - Failed to train quantizer!" << std::endl;
         return false;
     }

     //Store the model and size the buffers that quantize writes to
     numInputDimensions = trainingData.getNumCols();
     numOutputDimensions = 1; //This is always 1 for the KMeansQuantizer
     clusters = clusterer.getClusters();
     featureVector.resize(numOutputDimensions,0);
     quantizationDistances.resize(numClusters,0);

     initialized = true;
     trained = true;

     return true;
 }

 //Quantizes a single scalar value by wrapping it in a 1-element vector.
 //@param inputValue: the value to quantize
 //@return the result of quantize( const VectorFloat& ) for the 1-element vector
 UINT KMeansQuantizer::quantize(const Float inputValue){
     const VectorFloat singleValue(1,inputValue);
     return quantize( singleValue );
 }

 //Quantizes the input vector to the index of the closest cluster.
 //The distance to every cluster is stored in quantizationDistances, the winning index is
 //written to featureVector[0] and featureDataReady is set to true.
 //@param inputVector: the sample to quantize; its size must equal numInputDimensions
 //@return the index of the closest cluster, or 0 if the quantizer has not been trained
 //or the input size is wrong (note that 0 is also a valid cluster index)
 UINT KMeansQuantizer::quantize(const VectorFloat &inputVector){

     if( !trained ){
         errorLog << "computeFeatures(const VectorFloat &inputVector) - The quantizer has not been trained!" << std::endl;
         return 0;
     }

     if( inputVector.getSize() != numInputDimensions ){
         errorLog << "computeFeatures(const VectorFloat &inputVector) - The size of the inputVector (" << inputVector.getSize() << ") does not match that of the filter (" << numInputDimensions << ")!" << std::endl;
         return 0;
     }

     //Track the closest cluster seen so far
     UINT closestCluster = 0;
     Float closestDistance = grt_numeric_limits< Float >::max();

     for(UINT k=0; k<numClusters; k++){
         //Accumulate the squared Euclidean distance to cluster k
         Float squaredDistance = 0;
         for(UINT i=0; i<numInputDimensions; i++){
             squaredDistance += grt_sqr( inputVector[i]-clusters[k][i] );
         }
         quantizationDistances[k] = squaredDistance;

         //Strict comparison: the lowest index wins on a tie
         if( squaredDistance < closestDistance ){
             closestDistance = squaredDistance;
             closestCluster = k;
         }
     }

     featureVector[0] = closestCluster;
     featureDataReady = true;

     return closestCluster;
 }

 //Gets the number of clusters.
 //@return the current value of numClusters
 UINT KMeansQuantizer::getNumClusters() const
 {
     return this->numClusters;
 }

 //Sets the number of clusters. Any existing model is cleared first, so the
 //quantizer must be retrained afterwards.
 //@param numClusters: the new number of clusters
 //@return always true
 bool KMeansQuantizer::setNumClusters(const UINT numClusters)
 {
     //Discard the current model before changing the cluster count
     clear();

     this->numClusters = numClusters;

     return true;
 }

 GRT_END_NAMESPACE
KMeansQuantizer::train_
virtual bool train_(ClassificationData &trainingData)
Definition: KMeansQuantizer.cpp:203

KMeansQuantizer::computeFeatures
virtual bool computeFeatures(const VectorFloat &inputVector)
Definition: KMeansQuantizer.cpp:78

GRTBase::getId
std::string getId() const
Definition: GRTBase.cpp:85

KMeansQuantizer::quantize
UINT quantize(const Float inputValue)
Definition: KMeansQuantizer.cpp:252

KMeansQuantizer::reset
virtual bool reset()
Definition: KMeansQuantizer.cpp:86

KMeansQuantizer::KMeansQuantizer
KMeansQuantizer(const UINT numClusters=10)
Definition: KMeansQuantizer.cpp:33

MLBase::reset
virtual bool reset()
Definition: MLBase.cpp:147

MatrixFloat
Definition: MatrixFloat.h:36

FeatureExtraction::saveFeatureExtractionSettingsToFile
bool saveFeatureExtractionSettingsToFile(std::fstream &file) const
Definition: FeatureExtraction.cpp:118

ClassificationDataStream
Definition: ClassificationDataStream.h:42

UnlabelledData::getDataAsMatrixFloat
MatrixFloat getDataAsMatrixFloat() const
Definition: UnlabelledData.cpp:662

Vector::resize
virtual bool resize(const unsigned int size)
Definition: Vector.h:133

KMeans::train_
virtual bool train_(MatrixFloat &data)
Definition: KMeans.cpp:153

MLBase::train
virtual bool train(ClassificationData trainingData)
Definition: MLBase.cpp:107

Vector::getSize
UINT getSize() const
Definition: Vector.h:201

KMeansQuantizer::deepCopyFrom
virtual bool deepCopyFrom(const FeatureExtraction *featureExtraction)
Definition: KMeansQuantizer.cpp:60

MLBase::setMinChange
bool setMinChange(const Float minChange)
Definition: MLBase.cpp:344

UnlabelledData
Definition: UnlabelledData.h:38

grt_numeric_limits
Definition: GRTTypedefs.h:74

Matrix::clear
bool clear()
Definition: Matrix.h:553

KMeansQuantizer::setNumClusters
bool setNumClusters(const UINT numClusters)
Definition: KMeansQuantizer.cpp:294

TimeSeriesClassificationData::getDataAsMatrixFloat
MatrixFloat getDataAsMatrixFloat() const
Definition: TimeSeriesClassificationData.cpp:1067

RegisterFeatureExtractionModule< KMeansQuantizer >

KMeansQuantizer.h
The KMeansQuantizer module quantizes the N-dimensional input vector to a 1-dimensional discrete value...

ClassificationData
Definition: ClassificationData.h:43

ClassificationDataStream::getDataAsMatrixFloat
MatrixFloat getDataAsMatrixFloat() const
Definition: ClassificationDataStream.cpp:920

Matrix::getNumCols
unsigned int getNumCols() const
Definition: Matrix.h:581

KMeansQuantizer::getId
static std::string getId()
Definition: KMeansQuantizer.cpp:28

FeatureExtraction
Definition: FeatureExtraction.h:38

MLBase::setMinNumEpochs
bool setMinNumEpochs(const UINT minNumEpochs)
Definition: MLBase.cpp:329

KMeansQuantizer::getNumClusters
UINT getNumClusters() const
Definition: KMeansQuantizer.cpp:290

KMeansQuantizer::clear
virtual bool clear()
Definition: KMeansQuantizer.cpp:97

VectorFloat
Definition: VectorFloat.h:33

FeatureExtraction::loadFeatureExtractionSettingsFromFile
bool loadFeatureExtractionSettingsFromFile(std::fstream &file)
Definition: FeatureExtraction.cpp:132

KMeansQuantizer::~KMeansQuantizer
virtual ~KMeansQuantizer()
Definition: KMeansQuantizer.cpp:44

KMeansQuantizer::operator=
KMeansQuantizer & operator=(const KMeansQuantizer &rhs)
Definition: KMeansQuantizer.cpp:47

KMeansQuantizer
Definition: KMeansQuantizer.h:49

KMeans
Definition: KMeans.h:41

ClassificationData::getDataAsMatrixFloat
MatrixFloat getDataAsMatrixFloat() const
Definition: ClassificationData.cpp:1497

Matrix::resize
virtual bool resize(const unsigned int r, const unsigned int c)
Definition: Matrix.h:245

TimeSeriesClassificationData
Definition: TimeSeriesClassificationData.h:42

FeatureExtraction::copyBaseVariables
bool copyBaseVariables(const FeatureExtraction *featureExtractionModule)
Definition: FeatureExtraction.cpp:64

KMeansQuantizer::save
virtual bool save(std::fstream &file) const
Definition: KMeansQuantizer.cpp:108

FeatureExtraction::clear
virtual bool clear() override
Definition: FeatureExtraction.cpp:106

MLBase::setMaxNumEpochs
bool setMaxNumEpochs(const UINT maxNumEpochs)
Definition: MLBase.cpp:320

KMeansQuantizer::load
virtual bool load(std::fstream &file)
Definition: KMeansQuantizer.cpp:142

Clusterer::setNumClusters
bool setNumClusters(const UINT numClusters)
Definition: Clusterer.cpp:262