dgmdoc/a00479_source.html

 #include "TrainNodeGMM.h"
 #include "macroses.h"

 namespace DirectGraphicalModels
 {
     // Class-wide constants
     // MIN_SAMPLES:     lower bound applied to TrainNodeGMMParams::minSamples; also the noise limit used in train()
     // MAX_COEFFICIENT: Gaussians whose alpha exceeds this value are removed in train()
     const size_t      CTrainNodeGMM::MIN_SAMPLES{16};
     const long double CTrainNodeGMM::MAX_COEFFICIENT{1.0};

     // Constructor taking an explicit set of GMM parameters
     // nStates   - number of states (classes); one Gaussian mixture is kept per state
     // nFeatures - number of features, forwarded to CTrainNode
     // params    - GMM parameters; minSamples is raised to MIN_SAMPLES if it is smaller
     CTrainNodeGMM::CTrainNodeGMM(byte nStates, word nFeatures, TrainNodeGMMParams params)
         : CBaseRandomModel(nStates)
         , CTrainNode(nStates, nFeatures)
         , m_params(params)
     {
         // Enforce the lower bound on the number of samples per Gaussian
         if (m_params.minSamples < MIN_SAMPLES)
             m_params.minSamples = MIN_SAMPLES;

         // One initially empty mixture per state, with storage for the maximal number of Gaussians
         m_vGaussianMixtures.resize(nStates);
         for (size_t s = 0; s < m_vGaussianMixtures.size(); s++)
             m_vGaussianMixtures[s].reserve(m_params.maxGausses);
     }

     // Constructor using the default GMM parameters with a custom maximal number of Gaussians
     // nStates    - number of states (classes); one Gaussian mixture is kept per state
     // nFeatures  - number of features, forwarded to CTrainNode
     // maxGausses - overrides TrainNodeGMMParams::maxGausses of TRAIN_NODE_GMM_PARAMS_DEFAULT
     CTrainNodeGMM::CTrainNodeGMM(byte nStates, word nFeatures, byte maxGausses)
         : CBaseRandomModel(nStates)
         , CTrainNode(nStates, nFeatures)
         , m_params(TRAIN_NODE_GMM_PARAMS_DEFAULT)
     {
         m_params.maxGausses = maxGausses;

         // One initially empty mixture per state, with storage for the maximal number of Gaussians
         m_vGaussianMixtures.resize(nStates);
         for (size_t s = 0; s < m_vGaussianMixtures.size(); s++)
             m_vGaussianMixtures[s].reserve(m_params.maxGausses);
     }

     // Destructor: nothing to release explicitly, the members clean up after themselves
     CTrainNodeGMM::~CTrainNodeGMM(void) = default;

     void CTrainNodeGMM::reset(void)
     {
         m_vGaussianMixtures.clear();
         m_minAlpha = 1;
     }

     namespace {
         // Calculates distance from all Gaussians in a mixture to the point <x>
         // If when using Mahalanobis distance, a Gaussian is not full, the scaled Euclidian for this Gaussian is returned
         inline std::vector<double> getDistance(const Mat &x, const GaussianMixture &gaussianMixture, size_t samplesTreshold, double dist_Etreshold, double dist_Mtreshold)
         {
             std::vector<double> res(gaussianMixture.size());
             for (size_t i = 0; i < res.size(); i++)
                 if (dist_Mtreshold)     // Euclidian distance
                     res[i] = gaussianMixture[i].getEuclidianDistance(x);
                 else                    // Mahalanobis distance
                     res[i] = gaussianMixture[i].getNumPoints() >= samplesTreshold ? gaussianMixture[i].getMahalanobisDistance(x)
                     : gaussianMixture[i].getEuclidianDistance(x) * dist_Mtreshold / dist_Etreshold;
             return res;
         }

         // Calculates divergence from Gaussian <x> to all other Gaussians in the mixture (including itself)
         // If a Gaussian from mixture is not full, the returned divergence is infinity
         // The caller should care about argument <x>
         inline std::vector<double> getDivergence(const CKDGauss &x, const GaussianMixture &gaussianMixture, size_t samplesTreshold)
         {
             std::vector<double> res(gaussianMixture.size());
             for (size_t i = 0; i < res.size(); i++)
                 res[i] = gaussianMixture[i].getNumPoints() >= samplesTreshold ? x.getKullbackLeiberDivergence(gaussianMixture[i]) : DBL_MAX;
             return res;
         }
     }

     void CTrainNodeGMM::addFeatureVec(const Mat &featureVector, byte gt) {
         // Assertions
         DGM_ASSERT_MSG(gt < m_nStates, "The groundtruth value %u is out of range [0; %u)", gt, m_nStates);

         Mat point;
         featureVector.convertTo(point, CV_64FC1);

         GaussianMixture &gaussianMixture = m_vGaussianMixtures[gt];                         // GMM of current state

         if (gaussianMixture.empty())
             gaussianMixture.emplace_back(point);            // NEW GAUSS
         else {
             std::vector<double> dist = getDistance(point, gaussianMixture, m_params.minSamples, m_params.dist_Etreshold, m_params.dist_Mtreshold);                  // Calculate distances all existing Gaussians in the mixture to the point

             // Find the smallest distance
             auto it = std::min_element(dist.begin(), dist.end());
             double minDist = *it;

             double dist_treshold = (m_params.dist_Mtreshold < 0) ? m_params.dist_Etreshold : m_params.dist_Mtreshold;

             // Add to existing Gaussian or crete a new one
             if ((minDist > dist_treshold) && (gaussianMixture.size() < m_params.maxGausses))
                 gaussianMixture.emplace_back(point);        // NEW GAUSS
             else {
                 size_t updIdx = std::distance(dist.begin(), it);
                 CKDGauss &updGauss = gaussianMixture[updIdx];               // the nearest Gaussian
                 updGauss += point;                                          // update the nearest Gauss

                 // Chech the updated Gauss function if after update it became too close to another Gauss function
                 if ((m_params.div_KLtreshold > 0) && (updGauss.getNumPoints() >= m_params.minSamples)) {
                     // Calculate divergences between updGauss and all other gausses
                     std::vector<double> div = getDivergence(updGauss, gaussianMixture, m_params.minSamples);
                     div[updIdx] = DBL_MAX;                                  // divergence to itself

                     // Find the smallest divergence
                     auto it = std::min_element(div.begin(), div.end());

                     // Merge together if they are too close
                     if ((it != div.end()) && (*it < m_params.div_KLtreshold)) {
                         size_t idx = std::distance(div.begin(), it);
                         gaussianMixture[idx] += updGauss;
                         gaussianMixture.erase(gaussianMixture.begin() + updIdx);
                     }
                 }
             }
         }
     }

     namespace {
         // Debug helper: prints the matrix <m> row by row, one tab-separated "%.1f" value per element
         // T    - element type used to access the matrix
         // name - optional caption, printed on its own line followed by a colon when not empty
         template<typename T>
         void printMat(const std::string &name, const Mat &m) {
             if (!name.empty())
                 printf("%s:\n", name.c_str());

             for (int row = 0; row < m.rows; row++) {
                 for (int col = 0; col < m.cols; col++)
                     printf("%.1f\t", m.at<T>(row, col));
                 printf("\n");
             }
         }

         // Debug helper: prints the number of points and the alpha value of every Gaussian of every state
         // The function body is compiled only when DEBUG_PRINT_INFO is defined; otherwise it does nothing
         void printStatus(std::vector<GaussianMixture> &vGaussianMixtures, long double minCoefficient) {
 #ifdef DEBUG_PRINT_INFO
             printf("\nCTrainNodeGMM::Status\n");
             printf("---------------------------\n");
             printf("( minCoefficient = %Le )\n", minCoefficient);

             size_t state = 0;
             for (const GaussianMixture &mixture : vGaussianMixtures) {      // states
                 printf("Class %zu (%zu gausses):\n", state, mixture.size());
                 state++;

                 word gaussIdx = 0;
                 for (const CKDGauss &gauss : mixture) {                     // gausses
                     printf("\tG[%u]: %zupts; ", gaussIdx, gauss.getNumPoints());
                     printf("alpha: %Le;\n", gauss.getAlpha());
                     gaussIdx++;
                     //printf("aK: %e;\n", gauss.getAlpha() / m_minCoefficient);

                     //printMat<double>("MU:", gauss.getMu());
                     //printMat<double>("SIGMA:", gauss.getSigma());
                 }
                 printf("\n");
             }
 #endif
         }
     }

     // Finalizes the training of the model:
     //  1) every Gaussian with fewer than m_params.minSamples points is removed; if it has at least
     //     MIN_SAMPLES points, it is first merged into the Gaussian with the smallest divergence,
     //     otherwise it is considered as noise and simply deleted;
     //  2) every Gaussian whose alpha exceeds MAX_COEFFICIENT is removed, and m_minAlpha is lowered
     //     to the smallest alpha among the remaining Gaussians.
     // The boolean argument is not used.
     void CTrainNodeGMM::train(bool)
     {
         // merge gausses with too small number of samples
         for (GaussianMixture &gaussianMixture : m_vGaussianMixtures) {          // state
             // No increment in the loop header: vector::erase() invalidates the erased iterator,
             // so we continue from the iterator it returns instead of stepping back and forth
             for (auto it = gaussianMixture.begin(); it != gaussianMixture.end(); ) {
                 const size_t nPoints = it->getNumPoints();
                 if (nPoints >= m_params.minSamples) {               // Gaussian is full: keep it
                     ++it;
                     continue;
                 }

                 if (nPoints >= MIN_SAMPLES) {                       // not full, but too large to be noise
                     const size_t g = std::distance(gaussianMixture.begin(), it);
                     std::vector<double> div = getDivergence(*it, gaussianMixture, m_params.minSamples);
                     div[g] = DBL_MAX;                               // divergence to itself

                     // Finding the smallest divergence (div is never empty: it contains at least *it)
                     const size_t gaussIdx = std::distance(div.begin(), std::min_element(div.begin(), div.end()));

                     // Merging a Gaussian into itself right before erasing it would be pointless
                     if (gaussIdx != g)
                         gaussianMixture[gaussIdx] += (*it);
                 } // if Gaussian has less then MIN_SAMPLES points, consider it as a noise and delete

                 it = gaussianMixture.erase(it);
             } // gausses
         } // gaussianMixture

         // getting the coefficients
         for (GaussianMixture &gaussianMixture : m_vGaussianMixtures) {          // state
             for (auto itGauss = gaussianMixture.begin(); itGauss != gaussianMixture.end(); ) {
                 const long double alpha = itGauss->getAlpha();
                 if (alpha > MAX_COEFFICIENT) {          // i.e. if (Coefficient = \infinity) delete Gaussian
                     itGauss = gaussianMixture.erase(itGauss);
                     continue;
                 }
                 if (m_minAlpha > alpha)
                     m_minAlpha = alpha;
                 ++itGauss;
             } // gausses
         } // gaussianMixture

         printStatus(m_vGaussianMixtures, m_minAlpha);
     }

     // Writes the model to the already opened binary file <pFile>
     // Layout: the five m_params fields; then for every state the number of Gaussians (word) followed,
     // for every Gaussian, by its number of points (long), mu (nFeatures doubles) and
     // sigma (nFeatures x nFeatures doubles, row by row); finally m_minAlpha (long double).
     // This is the layout loadFile() reads back.
     void CTrainNodeGMM::saveFile(FILE *pFile) const
     {
         // m_params
         fwrite(&m_params.maxGausses, sizeof(word), 1, pFile);
         fwrite(&m_params.minSamples, sizeof(size_t), 1, pFile);
         fwrite(&m_params.dist_Etreshold, sizeof(double), 1, pFile);
         fwrite(&m_params.dist_Mtreshold, sizeof(double), 1, pFile);
         fwrite(&m_params.div_KLtreshold, sizeof(double), 1, pFile);

         // Gaussian mixtures
         for (const GaussianMixture &gaussianMixture : m_vGaussianMixtures) {    // state
             word nGausses = static_cast<word>(gaussianMixture.size());
             fwrite(&nGausses, sizeof(word), 1, pFile);
             for (const CKDGauss &gauss : gaussianMixture) {
                 // The number of points is stored as a <long>, so it is converted to a real <long>
                 // object first: writing sizeof(long) bytes straight out of a size_t would store
                 // the wrong bytes wherever the two types differ in size on a big-endian platform
                 long    nPoints = static_cast<long>(gauss.getNumPoints());
                 Mat     mu      = gauss.getMu();
                 Mat     sigma   = gauss.getSigma();

                 fwrite(&nPoints, sizeof(long), 1, pFile);
                 for (word y = 0; y < getNumFeatures(); y++)
                     fwrite(&mu.at<double>(y, 0), sizeof(double), 1, pFile);
                 for (word y = 0; y < getNumFeatures(); y++)
                     for (word x = 0; x < getNumFeatures(); x++)
                         fwrite(&sigma.at<double>(y, x), sizeof(double), 1, pFile);
             } // gauss
         } // gaussianMixture

         fwrite(&m_minAlpha, sizeof(long double), 1, pFile);
     }

     // Reads the model from the already opened binary file <pFile>, in the layout written by saveFile():
     // the five m_params fields; then for every state the number of Gaussians (word) followed,
     // for every Gaussian, by its number of points (long), mu and sigma (doubles); finally m_minAlpha.
     // If a Gaussian count or a point count cannot be read, it is taken as 0 instead of being left
     // uninitialized.
     void CTrainNodeGMM::loadFile(FILE *pFile)
     {
         // m_params
         fread(&m_params.maxGausses, sizeof(word), 1, pFile);
         fread(&m_params.minSamples, sizeof(size_t), 1, pFile);
         fread(&m_params.dist_Etreshold, sizeof(double), 1, pFile);
         fread(&m_params.dist_Mtreshold, sizeof(double), 1, pFile);
         fread(&m_params.div_KLtreshold, sizeof(double), 1, pFile);

         // Gaussian mixtures
         m_vGaussianMixtures.resize(m_nStates);
         for (GaussianMixture &gaussianMixture : m_vGaussianMixtures) {              // state
             word nGausses = 0;
             if (fread(&nGausses, sizeof(word), 1, pFile) != 1)
                 nGausses = 0;                       // short read: treat the mixture as empty
             gaussianMixture.assign(nGausses, CKDGauss(getNumFeatures()));
             for (CKDGauss &gauss : gaussianMixture) {
                 long nPoints = 0;
                 Mat mu(getNumFeatures(), 1, CV_64FC1);
                 Mat sigma(getNumFeatures(), getNumFeatures(), CV_64FC1);

                 if (fread(&nPoints, sizeof(long), 1, pFile) != 1)
                     nPoints = 0;                    // short read: do not use an indeterminate value
                 for (word y = 0; y < getNumFeatures(); y++)
                     fread(&mu.at<double>(y, 0), sizeof(double), 1, pFile);
                 for (word y = 0; y < getNumFeatures(); y++)
                     for (word x = 0; x < getNumFeatures(); x++)
                         fread(&sigma.at<double>(y, x), sizeof(double), 1, pFile);

                 gauss.setMu(mu);
                 gauss.setSigma(sigma);
                 gauss.setNumPoints(nPoints);
             } // gausses
         } // gaussianMixture

         fread(&m_minAlpha, sizeof(long double), 1, pFile);
     }

     void CTrainNodeGMM::calculateNodePotentials(const Mat &featureVector, Mat &potential, Mat &mask) const
     {
         Mat fv;
         Mat aux1, aux2, aux3;

         featureVector.convertTo(fv, CV_64FC1);

         for (byte s = 0; s < m_nStates; s++) {                      // state
             const GaussianMixture &gaussianMixture = m_vGaussianMixtures[s];

             if (gaussianMixture.empty())    mask.at<byte>(s, 0) = 0;
             else {
                 size_t nAllPoints = 0;                                  // number of points were used for approximating the density for current state
                 for (const CKDGauss &gauss : gaussianMixture)
                     nAllPoints += gauss.getNumPoints();

                 for (const CKDGauss &gauss : gaussianMixture) {
                     double      k = static_cast<double>(gauss.getNumPoints()) / nAllPoints;
                     double      value = gauss.getValue(fv, aux1, aux2, aux3);
                     long double aK = gauss.getAlpha() / m_minAlpha;     // scaled Gaussian coefficient
                     potential.at<float>(s, 0) += static_cast<float>(k * aK * value);
                 } // gausses
             }
         } // s
     }
 }
DirectGraphicalModels::CTrainNodeGMM::saveFile
void saveFile(FILE *pFile) const
Saves the random model into the file.
Definition: TrainNodeGMM.cpp:196

DirectGraphicalModels::TrainNodeGMMParams::dist_Etreshold
double dist_Etreshold
Minimum Euclidean distance between Gauss functions.
Definition: TrainNodeGMM.h:15

DirectGraphicalModels::TrainNodeGMMParams::div_KLtreshold
double div_KLtreshold
Minimum Kullback-Leibler divergence between Gauss functions. If this parameter is negative, the merging of Gaussians in the addFeatureVec() function is disabled.
Definition: TrainNodeGMM.h:17

DirectGraphicalModels::ITrain::getNumFeatures
word getNumFeatures(void) const
Returns number of features.
Definition: ITrain.h:37

DirectGraphicalModels::CTrainNodeGMM::reset
void reset(void)
Resets class variables.
Definition: TrainNodeGMM.cpp:38

DirectGraphicalModels::CTrainNodeGMM::train
void train(bool doClean=false)
Random model training.
Definition: TrainNodeGMM.cpp:154

DirectGraphicalModels::TrainNodeGMMParams
Gaussian Mixture Model parameters.
Definition: TrainNodeGMM.h:12

DirectGraphicalModels
Definition: AveragePrecision.cpp:4

DirectGraphicalModels::CTrainNodeGMM::CTrainNodeGMM
CTrainNodeGMM(byte nStates, word nFeatures, TrainNodeGMMParams params=TRAIN_NODE_GMM_PARAMS_DEFAULT)
Constructor.
Definition: TrainNodeGMM.cpp:11

DirectGraphicalModels::CTrainNodeGMM::MAX_COEFFICIENT
static const long double MAX_COEFFICIENT
Definition: TrainNodeGMM.h:82

DirectGraphicalModels::CBaseRandomModel
Base abstract class for random model training.
Definition: BaseRandomModel.h:24

DirectGraphicalModels::TrainNodeGMMParams::maxGausses
word maxGausses
The maximal number of Gauss functions for approximation.
Definition: TrainNodeGMM.h:13

DirectGraphicalModels::CTrainNodeGMM::m_minAlpha
long double m_minAlpha
Definition: TrainNodeGMM.h:88

DirectGraphicalModels::CTrainNodeGMM::MIN_SAMPLES
static const size_t MIN_SAMPLES
Definition: TrainNodeGMM.h:81

DirectGraphicalModels::CTrainNodeGMM::calculateNodePotentials
void calculateNodePotentials(const Mat &featureVector, Mat &potential, Mat &mask) const
Calculates the node potential, based on the feature vector.
Definition: TrainNodeGMM.cpp:267

DirectGraphicalModels::CTrainNodeGMM::~CTrainNodeGMM
virtual ~CTrainNodeGMM(void)
Definition: TrainNodeGMM.cpp:35

DirectGraphicalModels::GaussianMixture
std::vector< CKDGauss > GaussianMixture
Definition: KDGauss.h:230

DirectGraphicalModels::CTrainNodeGMM::m_params
TrainNodeGMMParams m_params
Definition: TrainNodeGMM.h:86

DirectGraphicalModels::TRAIN_NODE_GMM_PARAMS_DEFAULT
const TrainNodeGMMParams TRAIN_NODE_GMM_PARAMS_DEFAULT
Definition: TrainNodeGMM.h:23

DirectGraphicalModels::CTrainNode
Base abstract class for node potentials training.
Definition: TrainNode.h:47

DirectGraphicalModels::TrainNodeGMMParams::dist_Mtreshold
double dist_Mtreshold
Minimum Mahalanobis distance between Gauss functions. If this parameter is negative, the Euclidean distance is used.
Definition: TrainNodeGMM.h:16

DirectGraphicalModels::CTrainNodeGMM::m_vGaussianMixtures
std::vector< GaussianMixture > m_vGaussianMixtures
Definition: TrainNodeGMM.h:87

DirectGraphicalModels::CKDGauss
Multivariate Gaussian distribution class.
Definition: KDGauss.h:28

DirectGraphicalModels::TrainNodeGMMParams::minSamples
size_t minSamples
Minimum number of samples to approximate a Gauss function.
Definition: TrainNodeGMM.h:14

DirectGraphicalModels::CTrainNodeGMM::addFeatureVec
void addFeatureVec(const Mat &featureVector, byte gt)
Adds new feature vector.
Definition: TrainNodeGMM.cpp:71

DirectGraphicalModels::CBaseRandomModel::m_nStates
byte m_nStates
The number of states (classes)
Definition: BaseRandomModel.h:87

DirectGraphicalModels::CTrainNodeGMM::loadFile
void loadFile(FILE *pFile)
Loads the random model from the file.
Definition: TrainNodeGMM.cpp:228