trainer.h
// ----------------------------------------------------------------------------
// - CloudViewer: www.cloudViewer.org -
// ----------------------------------------------------------------------------
// Copyright (c) 2018-2024 www.cloudViewer.org
// SPDX-License-Identifier: MIT
// ----------------------------------------------------------------------------

#pragma once

// system
#include <cassert>  // assert
#include <cmath>    // fabs, sqrt
#include <new>      // std::bad_alloc
#include <vector>

// dlib
#include <dlib/matrix.h>
#include <dlib/svm.h>

// local (assumed include path; Classifier and Classifier::Point2D are
// declared in classifier.h)
#include "classifier.h"

class LDATrainer {
public:
    typedef dlib::matrix<float, 0, 1> sample_type;
    typedef dlib::linear_kernel<sample_type> kernel_type;
    typedef dlib::decision_function<kernel_type> trained_function_type;
    // typedef trained_function_type::mem_manager_type mem_manager_type;

    trained_function_type train(const std::vector<sample_type>& samplesvec,
                                const std::vector<float>& labels) const {
        size_t fdim = samplesvec[0].size();
        size_t nsamples = samplesvec.size();

        long ndata_class1 = 0, ndata_class2 = 0;
        for (size_t i = 0; i < nsamples; ++i) {
            if (labels[i] > 0)
                ++ndata_class1;
            else
                ++ndata_class2;
        }

        dlib::matrix<sample_type, 0, 1> samples1, samples2;
        samples1.set_size(ndata_class1);
        samples2.set_size(ndata_class2);
        sample_type mu1;
        mu1.set_size(fdim);
        sample_type mu2;
        mu2.set_size(fdim);
        for (size_t i = 0; i < fdim; ++i) {
            mu1(i) = 0;
            mu2(i) = 0;
        }

        ndata_class1 = 0;
        ndata_class2 = 0;
        for (size_t i = 0; i < nsamples; ++i) {
            if (labels[i] > 0) {
                samples1(ndata_class1) = samplesvec[i];
                ++ndata_class1;
                mu1 += samplesvec[i];
            } else {
                samples2(ndata_class2) = samplesvec[i];
                ++ndata_class2;
                mu2 += samplesvec[i];
            }
        }
        mu1 /= ndata_class1;
        mu2 /= ndata_class2;

        // if you get a compilation error coming from here (with templates
        // and a 'visual_studio_sucks_cov_helper' structure involved) then
        // you may have to patch dlib's file 'matrix_utilities.h':
        //
        // line 1611, replace
        //   const matrix<double,EXP::type::NR,EXP::type::NC, typename
        //       EXP::mem_manager_type> avg = mean(m);
        // by
        //   const typename EXP::type avg = mean(m);
        //
        dlib::matrix<float> sigma1 = covariance(samples1);
        dlib::matrix<float> sigma2 = covariance(samples2);

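        // Fisher's linear discriminant: the projection direction is
        //   w = (Sigma1 + Sigma2)^-1 (mu2 - mu1);
        // the pseudo-inverse keeps this well defined even when the pooled
        // within-class scatter is singular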
        sample_type w_vect = pinv(sigma1 + sigma2) * (mu2 - mu1);

        trained_function_type ret;
        // ret.alpha.set_size(fdim);
        // for (int i=0; i<fdim; ++i) ret.alpha(i) = w_vect(i);
        ret.alpha = w_vect;
        ret.b = dot(w_vect, (mu1 + mu2) * 0.5);
        // linear kernel idiocy: encode the identity as basis vectors so that
        // the decision function evaluates to dot(w_vect, x) - b
        ret.basis_vectors.set_size(fdim);
        for (size_t i = 0; i < fdim; ++i) {
            ret.basis_vectors(i).set_size(fdim);
            for (size_t j = 0; j < fdim; ++j) ret.basis_vectors(i)(j) = 0;
            ret.basis_vectors(i)(i) = 1;
        }
        return ret;
    }

#if 0
    trained_function_type train(const trained_function_type::sample_vector_type& samplesvec, const trained_function_type::scalar_vector_type& labels) const
    {
        int fdim = samplesvec(0).size();
        int nsamples = samplesvec.size();

        int ndata_class1 = 0, ndata_class2 = 0;
        for (int i=0; i<nsamples; ++i)
        {
            if (labels(i)>0)
                ++ndata_class1;
            else
                ++ndata_class2;
        }

        dlib::matrix<sample_type,0,1> samples1, samples2;
        samples1.set_size(ndata_class1);
        samples2.set_size(ndata_class2);
        sample_type mu1; mu1.set_size(fdim);
        sample_type mu2; mu2.set_size(fdim);
        for (int i=0; i<fdim; ++i)
        {
            mu1(i)=0;
            mu2(i)=0;
        }

        ndata_class1 = 0; ndata_class2 = 0;
        for (int i=0; i<nsamples; ++i)
        {
            if (labels(i)>0)
            {
                samples1(ndata_class1) = samplesvec(i);
                ++ndata_class1;
                mu1 += samplesvec(i);
            }
            else
            {
                samples2(ndata_class2) = samplesvec(i);
                ++ndata_class2;
                mu2 += samplesvec(i);
            }
        }
        mu1 /= ndata_class1;
        mu2 /= ndata_class2;

        // if you get a compilation error coming from here (with templates
        // and a 'visual_studio_sucks_cov_helper' structure involved) then
        // you may have to patch dlib's file 'matrix_utilities.h':
        //
        // line 1611, replace
        //   const matrix<double,EXP::type::NR,EXP::type::NC, typename EXP::mem_manager_type> avg = mean(m);
        // by
        //   const typename EXP::type avg = mean(m);
        //
        dlib::matrix<float> sigma1 = covariance(samples1);
        dlib::matrix<float> sigma2 = covariance(samples2);

        sample_type w_vect = pinv(sigma1+sigma2) * (mu2 - mu1);

        trained_function_type ret;
        //ret.alpha.set_size(fdim);
        //for (int i=0; i<fdim; ++i) ret.alpha(i) = w_vect(i);
        ret.alpha = w_vect;
        ret.b = dot(w_vect,(mu1+mu2)*0.5);
        // linear kernel idiocy
        ret.basis_vectors.set_size(fdim);
        for (int i=0; i<fdim; ++i)
        {
            ret.basis_vectors(i).set_size(fdim);
            for (int j=0; j<fdim; ++j)
                ret.basis_vectors(i)(j)=0;
            ret.basis_vectors(i)(i) = 1;
        }
        return ret;
        /*LinearPredictor classifier;
        classifier.weights.resize(fdim+1);
        for (int i=0; i<fdim; ++i) classifier.weights[i] = w_vect(i);
        classifier.weights[fdim] = -dot(w_vect,(mu1+mu2)*0.5);
        return classifier;*/
    }
#endif

    void train(int nfolds,
               const std::vector<sample_type>& samples,
               const std::vector<float>& labels) {
        dlib::probabilistic_decision_function<kernel_type> pdecfun =
                dlib::train_probabilistic_decision_function(*this, samples,
                                                            labels, nfolds);
        dlib::decision_function<kernel_type>& decfun = pdecfun.decision_funct;
        int dim = samples.back().size();
        // see comments in linearSVM.hpp
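        // with a linear kernel the decision function collapses to a single
        // weight vector w = sum_i alpha(i) * basis_vectors(i), and the
        // calibration parameters compose affinely into the flattened weights:
        //   score(x) = pdecfun.alpha * (dot(w, x) - b) + pdecfun.beta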
        m_weights.clear();
        m_weights.resize(dim + 1, 0);
        dlib::matrix<float> w(dim, 1);
        w = 0;
        for (int i = 0; i < decfun.alpha.nr(); ++i) {
            w += decfun.alpha(i) * decfun.basis_vectors(i);
        }
        for (int i = 0; i < dim; ++i) m_weights[i] = w(i);
        m_weights[dim] = -decfun.b;
        for (int i = 0; i <= dim; ++i) m_weights[i] *= pdecfun.alpha;
        m_weights[dim] += pdecfun.beta;

        // TODO: check if necessary here
        for (int i = 0; i <= dim; ++i) m_weights[i] = -m_weights[i];
    }

    double predict(const sample_type& data) const {
        assert(!m_weights.empty());
        double ret = m_weights.back();
        for (size_t d = 0; d < m_weights.size() - 1; ++d)
            ret += static_cast<double>(m_weights[d]) * data(d);
        return ret;
    }

    //! Classifier weights
    std::vector<float> m_weights;
};
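
#if 0
// Minimal usage sketch (illustration only, not part of the original header;
// the toy feature values and fold count are made up). The trainer is handed
// to dlib's cross-validated probability calibration via train(nfolds, ...),
// after which predict() returns a signed linear score:
void ExampleLDATrainerUsage() {
    std::vector<LDATrainer::sample_type> samples;
    std::vector<float> labels;
    for (int i = 0; i < 100; ++i) {
        float cls = (i % 2 == 0) ? -1.0f : 1.0f;  // interleave the classes
        LDATrainer::sample_type s;
        s.set_size(2);
        s(0) = cls + 0.05f * (i % 10);  // two noisy clusters along axis 0
        s(1) = 0.05f * (i % 7);
        samples.push_back(s);
        labels.push_back(cls);
    }
    LDATrainer trainer;
    trainer.train(/*nfolds=*/5, samples, labels);
    double score = trainer.predict(samples.front());
    (void)score;  // the sign indicates the predicted class
}
#endif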

//! Gram-Schmidt process to re-orthonormalise the basis
static void GramSchmidt(dlib::matrix<LDATrainer::sample_type, 0, 1>& basis,
                        LDATrainer::sample_type& newX) {
    // goal: find a basis so that the given vector is the new X
    // principle: at least one basis vector is not orthogonal to newX (unless
    // newX is null, which we assume is not the case)
    // => take the basis vector with the largest absolute dot product and
    // replace it by newX; this yields a set of linearly independent vectors,
    // then apply the Gram-Schmidt process
    long dim = basis.size();
    double maxabsdp = -1.0;
    long selectedCoord = 0;
    for (long i = 0; i < dim; ++i) {
        double absdp = fabs(dot(basis(i), newX));
        if (absdp > maxabsdp) {
            maxabsdp = absdp;  // track the largest |dot product|
            selectedCoord = i;
        }
    }
    // swap basis vectors to use the selected coord as the X vector, then
    // replace it by newX
    basis(selectedCoord) = basis(0);
    basis(0) = newX;
    // Gram-Schmidt process to re-orthonormalise the basis.
    // Thanks Wikipedia for the stabilized version
    for (long j = 0; j < dim; ++j) {
        for (long i = 0; i < j; ++i)
            basis(j) -= (dot(basis(j), basis(i)) / dot(basis(i), basis(i))) *
                        basis(i);

        basis(j) /= sqrt(dot(basis(j), basis(j)));
    }
}
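
#if 0
// Minimal usage sketch (illustration only, not part of the original header).
// Starting from the canonical basis of R^3, rotate it so that the first axis
// points along an arbitrary direction; afterwards basis(0) is the normalised
// direction and the remaining vectors are orthonormal to it:
void ExampleGramSchmidtUsage() {
    const long dim = 3;
    dlib::matrix<LDATrainer::sample_type, 0, 1> basis;
    basis.set_size(dim);
    for (long i = 0; i < dim; ++i) {
        basis(i).set_size(dim);
        for (long j = 0; j < dim; ++j) basis(i)(j) = (i == j) ? 1.0f : 0.0f;
    }
    LDATrainer::sample_type newX;
    newX.set_size(dim);
    newX(0) = 1.0f;
    newX(1) = 1.0f;
    newX(2) = 0.0f;
    GramSchmidt(basis, newX);
    // basis(0) is now newX / |newX|; dot(basis(i), basis(j)) ~ 0 for i != j
}
#endif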

//! Compute pos. and neg. reference points
static void ComputeReferencePoints(Classifier::Point2D& refpt_pos,
                                   Classifier::Point2D& refpt_neg,
                                   const std::vector<float>& proj1,
                                   const std::vector<float>& proj2,
                                   const std::vector<float>& labels,
                                   unsigned* _npos = 0,
                                   unsigned* _nneg = 0) {
    assert(proj1.size() == proj2.size() && proj1.size() == labels.size());

    refpt_neg = refpt_pos = Classifier::Point2D(0, 0);

    size_t npos = 0;
    size_t nneg = 0;
    for (size_t i = 0; i < labels.size(); ++i) {
        if (labels[i] < 0) {
            refpt_neg += Classifier::Point2D(proj1[i], proj2[i]);
            ++nneg;
        } else {
            refpt_pos += Classifier::Point2D(proj1[i], proj2[i]);
            ++npos;
        }
    }
    if (npos) refpt_pos /= static_cast<float>(npos);
    if (nneg) refpt_neg /= static_cast<float>(nneg);

    if (_npos) *_npos = static_cast<unsigned>(npos);
    if (_nneg) *_nneg = static_cast<unsigned>(nneg);
}

static bool DilateClassifier(
        Classifier& classifier,
        std::vector<float>& proj1,
        std::vector<float>& proj2,
        const std::vector<float>& labels,
        const std::vector<LDATrainer::sample_type>& samples,
        LDATrainer& trainer,
        LDATrainer& orthoTrainer) {
    // m_app->dispToConsole("[Cloud dilatation]");
    Classifier::Point2D e1 = classifier.refPointPos - classifier.refPointNeg;
    e1.normalize();
    Classifier::Point2D e2(-e1.y, e1.x);
    Classifier::Point2D ori =
            (classifier.refPointPos + classifier.refPointNeg) / 2;

    float m11 = 0, m21 = 0, m12 = 0, m22 = 0;  // m12, m22 null by construction
    float v11 = 0, v12 = 0, v21 = 0, v22 = 0;
    size_t nsamples1 = 0;
    size_t nsamples2 = 0;
    size_t nsamples = proj1.size();
    assert(proj1.size() == proj2.size());
    for (size_t i = 0; i < nsamples; ++i) {
        Classifier::Point2D p(proj1[i], proj2[i]);
        p -= ori;
        float p1 = p.dot(e1);
        float p2 = p.dot(e2);
        if (labels[i] < 0) {
            m11 += p1;
            v11 += p1 * p1;
            m12 += p2;
            v12 += p2 * p2;
            ++nsamples1;
        } else {
            m21 += p1;
            v21 += p1 * p1;
            m22 += p2;
            v22 += p2 * p2;
            ++nsamples2;
        }
    }
    // unbiased per-class means and variances; first index = class (1 for
    // negative labels, 2 for positive), second index = axis (1: e1, 2: e2)
    m11 /= nsamples1;
    v11 = (v11 - m11 * m11 * nsamples1) / (nsamples1 - 1);
    m21 /= nsamples2;
    v21 = (v21 - m21 * m21 * nsamples2) / (nsamples2 - 1);
    m12 /= nsamples1;
    v12 = (v12 - m12 * m12 * nsamples1) / (nsamples1 - 1);
    m22 /= nsamples2;
    v22 = (v22 - m22 * m22 * nsamples2) / (nsamples2 - 1);

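    // d1 and d2 are the per-class ratios of the standard deviation along e1
    // to that along e2; their geometric mean is the single anisotropy factor
    // used to rescale the e2 axis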
    float d1 = sqrt(v11 / v12);
    float d2 = sqrt(v21 / v22);
    classifier.axisScaleRatio = sqrt(d1 * d2);

    float bdValues[4] = {e1.x, e1.y, e2.x / classifier.axisScaleRatio,
                         e2.y / classifier.axisScaleRatio};
    dlib::matrix<float, 2, 2> bd(bdValues);

    float biValues[4] = {e1.x, e2.x, e1.y, e2.y};
    dlib::matrix<float, 2, 2> bi(biValues);
    dlib::matrix<float, 2, 2> c = inv(trans(bd)) /* bi * bd */;

343 
344  std::vector<float> wn1, wn2;
345  try {
346  wn1.resize(w1.size());
347  wn2.resize(w2.size());
348  } catch (const std::bad_alloc&) {
349  // not enough memory
350  return false;
351  }
352 
353  // first shift so the center of the figure is at the midpoint
354  w1.back() -= ori.x;
355  w2.back() -= ori.y;
356  // now transform / scale along e2
357  {
358  for (size_t i = 0; i < w1.size(); ++i) {
359  wn1[i] = c(0, 0) * w1[i] + c(0, 1) * w2[i];
360  wn2[i] = c(1, 0) * w1[i] + c(1, 1) * w2[i];
361  }
362  }
363 
364  trainer.m_weights = wn1;
365  orthoTrainer.m_weights = wn2;
366 
367  // reset projections
368  {
369  for (size_t i = 0; i < nsamples; ++i) {
370  proj1[i] = trainer.predict(samples[i]);
371  proj2[i] = orthoTrainer.predict(samples[i]);
372  }
373  }
374 
375  classifier.weightsAxis1 = wn1;
376  classifier.weightsAxis2 = wn2;
377 
378  // update reference points
379  ComputeReferencePoints(classifier.refPointPos, classifier.refPointNeg,
380  proj1, proj2, labels);
381 
382  return true;
383 }
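
#if 0
// Minimal sketch (illustration only, not part of the original header): what
// the 2x2 correction built in DilateClassifier does to a projected point.
// With r = axisScaleRatio and the orthonormal pair (e1, e2), bd maps a
// centred point p to (dot(p, e1), dot(p, e2) / r), compressing or stretching
// the second axis so both classes end up with comparable spread along it.
// The values of r, e1, e2, and p below are made up:
void ExampleDilation2D() {
    float r = 2.0f;                // made-up anisotropy factor
    float e1x = 1.0f, e1y = 0.0f;  // e1 = +X
    float e2x = 0.0f, e2y = 1.0f;  // e2 = +Y
    float bdValues[4] = {e1x, e1y, e2x / r, e2y / r};
    dlib::matrix<float, 2, 2> bd(bdValues);
    dlib::matrix<float, 2, 1> p;
    p = 3.0f, 4.0f;                         // centred sample (dlib comma init)
    dlib::matrix<float, 2, 1> q = bd * p;   // q = (3, 2): e2 component halved
    (void)q;
}
#endif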