UFJF - Machine Learning Toolkit  0.51.8
Perceptron.hpp
Go to the documentation of this file.
1 
6 #ifndef PERCEPTRONPRIMAL__HPP
7 #define PERCEPTRONPRIMAL__HPP
8 
#include "PrimalClassifier.hpp"
#include "DualClassifier.hpp"

#include <chrono>
#include <cmath>
#include <limits>
12 
13 namespace mltk{
14  namespace classifier {
15  using namespace std::chrono;
16 
20  template<typename T>
21  class PerceptronPrimal : public PrimalClassifier<T> {
22  public:
23  explicit PerceptronPrimal(std::shared_ptr<Data<T> > samples = nullptr, double q = 2, double rate = 0.5,
24  Solution *initial_solution = nullptr);
25  PerceptronPrimal(const Data<T>& samples, double q = 2, double rate = 0.5, Solution *initial_solution = nullptr);
26  bool train() override;
27 
28  double evaluate(const Point<T> &p, bool raw_value = false) override;
29  };
30 
34  template<typename T>
36  public:
37  PerceptronFixedMarginPrimal() = default;
38  explicit PerceptronFixedMarginPrimal(const mltk::Data<T>& samples, double gamma = 0,
39  double q = 2, double rate = 0.5, Solution *initial_solution = nullptr);
40 
41  bool train() override;
42 
43  double evaluate(const Point<T> &p, bool raw_value = false) override;
44  };
45 
49  template<typename T>
50  class PerceptronDual : public DualClassifier<T> {
51  private:
52  Solution *initial = nullptr;
53  public:
54  PerceptronDual() = default;
55  PerceptronDual(const Data<T>& samples,
56  KernelType kernel_type, double kernel_param = 0,
57  double rate = 0.5, Solution *initial_solution = nullptr);
58 
59  explicit PerceptronDual(const Data<T>& samples, double rate = 0.5,
60  Solution *initial_solution = nullptr);
61 
62  bool train() override;
63  };
64 
68  template<typename T>
70  public:
71  PerceptronFixedMarginDual() = default;
72  explicit PerceptronFixedMarginDual(const mltk::Data<T>& samples, KernelType kernel_type = KernelType::INNER_PRODUCT,
73  double kernel_param = 0, double gamma = 0, double rate = 0.5,
74  Solution *initial_solution = nullptr);
75 
76  bool train() override;
77  };
78 
79  template<typename T>
81  private:
82  Point<double> weights;
83  double bias = 0;
84 
85  public:
86  BalancedPerceptron() = default;
87 
88  explicit BalancedPerceptron(const Data<T> &samples, const size_t &seed = 0) {
89  this->samples = mltk::make_data<T>(samples);
90  this->seed = seed;
91  }
92 
93  bool train() override {
94  size_t epoch = 0, ite = 0;
95  bool stop = false;
97  size_t errors = 0;
98 
99  this->bias = 0;
100  mltk::random_init<double>(this->weights, this->samples->dim(), this->seed);
101  this->samples->shuffle(this->seed);
102  this->timer.reset();
103 
104  while (epoch < this->MAX_EPOCH) {
105  errors = 0;
106  for (auto it = this->samples->begin(); it != this->samples->end(); ++it) {
107  auto point = *it;
108  int pred = ((mltk::dot(weights, *point) + bias) >= 0) ? 1 : -1;
109 
110  if (point->Y() != pred) {
111  weights += this->rate * (*point) * point->Y();
112  bias += this->rate * bias;
113  ite++;
114  errors++;
115  }
116 
117  if (ite > this->MAX_UP) {
118  stop = true;
119  break;
120  }
121 
122  }
123  epoch++;
124  if (stop || this->timer.elapsed() > this->max_time || errors == 0) break;
125  }
126 
127  for (auto it = this->samples->begin(); it != this->samples->end(); ++it) {
128  auto point = *(*it);
129  double func = point.Y() * (mltk::dot(weights, point) + bias);
130 
131  if (point.Y() == 1 && func < gamma1) gamma1 = func;
132  if (point.Y() == -1 && func < gamma2) gamma2 = func;
133  }
134  double rmargin = (fabs(gamma1) > fabs(gamma2)) ? fabs(gamma2) : fabs(gamma1);
135  double mmargin = (fabs(gamma1) + fabs(gamma2)) / 2;
136  if(fabs(gamma2) > fabs(gamma1)){
137  bias += fabs(mmargin - rmargin);
138  }else{
139  bias -= fabs(mmargin - rmargin);
140  }
141  this->solution.w = weights;
142  this->solution.bias = bias;
143 
144  return (errors == 0);
145  }
146 
147  double evaluate(const Point<T> &p, bool raw_value) override {
148  if (raw_value) {
149  return mltk::dot(weights, p) + bias;
150  } else {
151  return ((mltk::dot(weights, p) + bias) >= 0) ? 1 : -1;
152  }
153  }
154 
155  std::string getFormulationString() override { return "Primal"; }
156  };
157 
158  template<typename T>
159  PerceptronPrimal<T>::PerceptronPrimal(std::shared_ptr<Data<T> > samples, double q, double rate,
160  Solution *initial_solution) {
161  this->samples = samples;
162  this->q = q;
163  this->rate = rate;
164  if (initial_solution)
165  this->solution = *initial_solution;
166  }
167 
168  template<typename T>
169  PerceptronPrimal<T>::PerceptronPrimal(const Data<T> &samples, double q, double rate,
170  Solution *initial_solution) {
171  this->samples = mltk::make_data<T>(samples);
172  this->q = q;
173  this->rate = rate;
174  if (initial_solution)
175  this->solution = *initial_solution;
176  }
177 
178 
179  template<typename T>
181  size_t size = this->samples->size(), dim = this->samples->dim();
182  int i, j, e = 0, idx;
183  double y, time = this->start_time + this->max_time;
184  bool cond;
185  std::vector<double> func(size, 0);
186  std::vector<T> x;
187  std::vector<int> index = this->samples->getIndex();
188 
189  if (this->solution.w.empty()) this->solution.w.resize(dim);
190  this->solution.bias = 0;
191  this->solution.norm = 0.0;
192 
193  this->timer.reset();
194  while (this->timer.elapsed() - time <= 0) {
195  for (e = 0, i = 0; i < size; ++i) {
196  idx = index[i];
197  auto p = this->samples->point(idx);
198  x = p->X();
199  y = p->Y();
200 
201  //calculating function
202  for (func[idx] = this->solution.bias, j = 0; j < dim; ++j)
203  func[idx] += this->solution.w[j] * x[j];
204 
205  //Checking if the point is a mistake
206  if (y * func[idx] <= 0.0) {
207  for (this->solution.norm = 0.0, j = 0; j < dim; ++j) {
208  this->solution.w[j] += this->rate * y * x[j];
209  this->solution.norm += this->solution.w[j] * this->solution.w[j];
210  }
211  this->solution.norm = sqrt(this->solution.norm);
212  this->solution.bias += this->rate * y;
213  this->ctot++;
214  e++;
215  } else if (this->steps > 0 && e > 1) break;
216  }
217  this->steps++; //Number of iterations update
218 
219  //stop criterion
220  if (e == 0) break;
221  if (this->steps > this->MAX_IT) break;
222  if (this->ctot > this->MAX_UP) break;
223  }
224 
225  return (e == 0);
226  }
227 
228  template<typename T>
229  double PerceptronPrimal<T>::evaluate(const Point<T> &p, bool raw_value) {
230  return PrimalClassifier<T>::evaluate(p, raw_value);
231  }
232 
233  template<typename T>
235  double q, double rate, Solution *initial_solution) {
236  this->samples = mltk::make_data<T>(samples);
237  this->q = q;
238  this->rate = rate;
239  this->gamma = gamma;
240  if (initial_solution)
241  this->solution = *initial_solution;
242  }
243 
244  template<typename T>
246  size_t i, j, k, e, s, r, dim = this->samples->dim();
247  size_t size = this->samples->size(), n = dim;
248  int idx, sign = 1, n_temp = 0, largn = 0;
249  double norm = this->solution.norm, lambda = 1.0, y, time = this->start_time + this->max_time;
250  double sumnorm = 0.0, bias = this->solution.bias, largw = 0.0, largw_temp = 0.0;
251  bool cond;
252  std::vector<double> func = this->solution.func.X(), w = this->solution.w.X();
253  std::vector<T> x;
254  std::vector<int> index = this->samples->getIndex();
255  std::shared_ptr<Point<T> > p;
256 
257  if (func.empty()) func.resize(size);
258  if (w.empty()) w.resize(dim);
259  e = s = 0;
260  this->timer.reset();
261  while (this->timer.elapsed() - time <= 0) {
262  for (e = 0, i = 0; i < size; ++i) {
263  idx = index[i];
264  p = this->samples->point(idx);
265  x = p->X();
266  y = p->Y();
267 
268  //calculating function
269  for (func[idx] = bias, j = 0; j < dim; ++j) {
270  func[idx] += w[j] * x[j];
271  }
272 
273  //Checking if the point is a mistake
274  if (y * func[idx] <= this->gamma * norm - this->samples->point(idx)->Alpha() * this->flexible) {
275  lambda = (norm != 0.0) ? (1 - this->rate * this->gamma / norm) : 1;
276  for (r = 0; r < size; ++r) {
277  std::shared_ptr<Point<T> > b = this->samples->point(r);
278  b->Alpha() *= lambda;
279  this->samples->setPoint(r, b);
280  }
281 
282  if (this->q == 1.0) { //Linf
283  for (sumnorm = 0.0, j = 0; j < dim; ++j) {
284  sign = (w[j] < 0) ? -1 : 1;
285  lambda = (norm > 0 && w[j] != 0) ? this->gamma * sign : 0;
286  w[j] += this->rate * (y * x[j] - lambda);
287  sumnorm += fabs(w[j]);
288  }
289  norm = sumnorm;
290  } else if (this->q == 2.0) { //L2
291  for (sumnorm = 0.0, j = 0; j < dim; ++j) {
292  lambda = (norm > 0 && w[j] != 0) ? w[j] * this->gamma / norm : 0;
293  w[j] += this->rate * (y * x[j] - lambda);
294  sumnorm += w[j] * w[j];
295  }
296  norm = sqrt(sumnorm);
297  } else if (this->q == -1.0) { //L1
298  largw_temp = fabs(w[0]);
299  n_temp = 1;
300  for (j = 0; j < dim; ++j) {
301  if (largw == 0 || fabs(largw - fabs(w[j])) / largw < this->EPS) {
302  sign = (w[j] < 0) ? -1 : 1;
303  lambda = (norm > 0 && w[j] != 0) ? this->gamma * sign / n : 0;
304  w[j] += this->rate * (y * x[j] - lambda);
305  } else
306  w[j] += this->rate * (y * x[j]);
307 
308  if (j > 0) {
309  if (fabs(largw_temp - fabs(w[j])) / largw_temp < this->EPS)
310  n_temp++;
311  else if (fabs(w[j]) > largw_temp) {
312  largw_temp = fabs(w[j]);
313  n_temp = 1;
314  }
315  }
316  }
317  largw = largw_temp;
318  n = n_temp;
319  norm = largw;
320  if (n > largn) largn = n;
321  } else { //Other Lp formulations
322  for (sumnorm = 0, j = 0; j < dim; ++j) {
323  lambda = (norm > 0 && w[j] != 0) ? w[j] * this->gamma *
324  std::pow(fabs(w[j]), this->q - 2.0) *
325  std::pow(norm, 1.0 - this->q) : 0;
326  w[j] += this->rate * (y * x[j] - lambda);
327  sumnorm += std::pow(fabs(w[j]), this->q);
328  }
329  norm = std::pow(sumnorm, 1.0 / this->q);
330  }
331  bias += this->rate * y;
332  p->Alpha() += this->rate;
333  this->samples->setPoint(idx, p);
334 
335  k = (i > s) ? s++ : e;
336  j = index[k];
337  index[k] = idx;
338  index[i] = j;
339  this->ctot++;
340  e++;
341  } else if (this->steps > 0 && e > 1 && i > s) break;
342  }
343  ++this->steps; //Number of iterations update
344 
345  //stop criterion
346  if (e == 0) break;
347  if (this->steps > this->MAX_IT) break;
348  if (this->ctot > this->MAX_UP) break;
349  }
350 
351  this->solution.norm = norm;
352  this->solution.bias = bias;
353  this->solution.w = w;
354  return (e == 0);
355  }
356 
357  template<typename T>
358  double PerceptronFixedMarginPrimal<T>::evaluate(const Point<T> &p, bool raw_value) {
359  double func = 0.0;
360  int i;
361  size_t dim = this->samples->dim();
362 
363  if (p.X().size() != dim) {
364  std::cerr << "The point must have the same dimension of the feature set!" << std::endl;
365  return 0;
366  }
367 
368  for (func = this->solution.bias, i = 0; i < dim; i++) {
369  func += this->solution.w[i] * p[i];
370  }
371 
372  if (!raw_value) return (func >= this->solution.margin * this->solution.norm) ? 1 : -1;
373  else return func;
374  }
375 
376  template<typename T>
377  PerceptronDual<T>::PerceptronDual(const Data<T>& samples, KernelType kernel_type,
378  double kernel_param, double rate, Solution *initial_solution) {
379  this->samples = mltk::make_data<T>(samples);
380  if (initial_solution) {
381  this->solution = *initial_solution;
382  this->alpha = (*initial_solution).alpha;
383  }
384  this->rate = rate;
385  this->kernel = new Kernel<T>(kernel_type, kernel_param);
386  }
387 
388  template<typename T>
389  PerceptronDual<T>::PerceptronDual(const Data<T>& samples, double rate, Solution *initial_solution) {
390  this->samples = mltk::make_data<T>(samples);
391  if (initial_solution) {
392  this->solution = *initial_solution;
393  this->alpha = (*initial_solution).alpha;
394  }
395  this->initial = initial_solution;
396  this->rate = rate;
397  this->kernel = nullptr;
398  }
399 
400 
401  template<typename T>
403  size_t e, i, j, idx, r, size = this->samples->size(), dim = this->samples->dim();
404  double norm = this->solution.norm, time = this->start_time + this->max_time;
405  double bias = this->solution.bias, f;
406  const double sqrate = this->rate * this->rate;
407  const double tworate = 2 * this->rate;
408  std::vector<int> index(size); //= this->samples->getIndex();
409  std::vector<double> func(size, 0.0), Kv;
410  std::vector<std::shared_ptr<Point<T> > > points = this->samples->points();
411  if(!this->kernel) this->kernel = new Kernel<T>(mltk::KernelType::INNER_PRODUCT);
412  this->kernel->compute(this->samples);
413  dMatrix *K = this->kernel->getKernelMatrixPointer();
414  int y;
415  iota(index.begin(), index.end(), 0);
416  if (this->alpha.empty()) {
417  this->alpha.assign(size, 0.0);
418  }
419  if(!initial){
420  this->solution = Solution();
421  }
422  this->timer.reset();
423  e = 1;
424  auto time_elapsed = this->timer.elapsed() - time;
425  while (time_elapsed <= 0) {
426  for (e = 0, i = 0; i < size; ++i) {
427  idx = index[i];
428  y = points[idx]->Y();
429 
430  //Calculating function
431  for (f = bias, r = 0; r < size; ++r)
432  f += this->alpha[r] * points[index[r]]->Y() * (*K)[idx][index[r]];
433  func[idx] = f;
434 
435  //Checking if the point is a mistake
436  if (y * f <= 0.0) {
437  norm = std::sqrt(norm * norm + tworate * points[idx]->Y() * (func[idx] - bias) + sqrate * (*K)[idx][idx]);
438  this->alpha[i] += this->rate;
439  bias += this->rate * y;
440  ++this->ctot, ++e;
441  } else if (this->steps > 0 && e > 1) break;
442  }
443  time_elapsed = this->timer.elapsed() - time;
444  ++this->steps;
445 
446  //stop criterion
447  if (e == 0) break;
448  if (this->steps > this->MAX_IT) break;
449  if (this->ctot > this->MAX_UP) break;
450  }
451  this->solution.bias = bias;
452  this->solution.norm = norm;
453  this->solution.alpha = this->alpha;
454  this->solution.margin = 0.0;
455  this->solution.w.resize(dim);
456 
457  for (i = 0; i < size; i++) {
458  for (j = 0; j < dim; j++) {
459  this->solution.w[j] += this->alpha[i] * points[i]->Y() * points[i]->X()[j];
460  }
461  }
462 
463  return (e == 0);
464  }
465 
466  template<typename T>
467  PerceptronFixedMarginDual<T>::PerceptronFixedMarginDual(const mltk::Data<T>& samples, KernelType kernel_type,
468  double kernel_param, double gamma, double rate,
469  Solution *initial_solution) {
470  this->samples = mltk::make_data<T>(samples);
471  //this->solution = *initial_solution;
472  this->rate = rate;
473  this->kernel = new Kernel<T>(kernel_type, kernel_param);
474  this->gamma = gamma;
475  if (initial_solution)
476  this->alpha = (*initial_solution).alpha;
477  }
478 
479  template<typename T>
481  size_t e, i, j, k, s, idx, r, size = this->samples->size(), dim = this->samples->dim();
482  double y, lambda, norm = this->solution.norm, time = this->start_time + this->max_time;
483  double bias = this->solution.bias;
484  const double sqrate = this->rate * this->rate;
485  const double tworate = 2 * this->rate;
486  std::vector<int> index = this->samples->getIndex();
487  std::vector<double> func = this->solution.func.X(), Kv;
488  this->kernel->compute(this->samples);
489  dMatrix *K = this->kernel->getKernelMatrixPointer();
490 
491  if(this->alpha.empty()){
492  this->alpha.resize(this->samples->size());
493  }
494 
495  if (func.empty()) { func.resize(size); }
496  e = 1, s = 0;
497  this->timer.reset();
498 
499  while (this->timer.elapsed() - time <= 0) {
500  for (e = 0, i = 0; i < size; ++i) {
501  idx = index[i];
502  y = (*this->samples)[idx]->Y();
503 
504  //Checking if the point is a mistake
505 
506  if (y * func[idx] - this->gamma * norm <= 0) {
507  lambda = (this->gamma) ? (1 - this->rate * this->gamma / norm) : 1;
508  norm *= lambda;
509 
510  for (r = 0; r < size; ++r) {
511  (*this->samples)[r]->Alpha() *= lambda;
512  func[r] = lambda * func[r] + this->rate * y * ((*K)[idx][r] + 1) + bias * (1 - lambda);
513  }
514 
515  norm = sqrt(norm * norm + tworate * (*this->samples)[idx]->Y() * lambda * (func[idx] - bias) +
516  sqrate * (*K)[idx][idx]);
517  (*this->samples)[idx]->Alpha() += this->rate;
518 
519  bias += this->rate * y;
520 
521  k = (i > s) ? ++s : e;
522  j = index[k];
523  index[k] = idx;
524  index[i] = j;
525  ++this->ctot;
526  ++e;
527  } else if (this->steps > 0 && e > 1 && i > s) break;
528  }
529 
530  ++this->steps; //Number of iterations update
531  //stop criterion
532  if (e == 0) break;
533  if (this->steps > this->MAX_IT) break;
534  if (this->ctot > this->MAX_UP) break;
535  }
536 
537  this->samples->setIndex(index);
538  this->solution.bias = bias;
539  this->solution.norm = norm;
540  this->solution.func = func;
541  this->solution.w.resize(dim);
542  this->solution.alpha.resize(size);
543  for (i = 0; i < dim; i++) {
544  for (j = 0; j < size; j++) {
545  this->solution.alpha[j] = (*this->samples)[j]->Alpha();
546  this->solution.w[i] +=
547  (*this->samples)[j]->Alpha() * (*this->samples)[j]->Y() * (*this->samples)[j]->X()[i];
548  }
549  }
550 
551  return (e == 0);
552  }
553  }
554 }
555 
556 #endif
PointPointer< T > point(int index) const
Returns a shared pointer to the point with the given index.
Definition: Data.hpp:1510
size_t size() const
Returns the size of the dataset.
Definition: Data.hpp:208
void setIndex(std::vector< int > index)
Set the index vector for the data.
Definition: Data.hpp:1754
void setPoint(int index, std::shared_ptr< Point< T > > p)
Sets the point at the given position in the data.
Definition: Data.hpp:1515
std::vector< int > getIndex() const
Returns the vector of indexes.
Definition: Data.hpp:1695
size_t dim() const
Returns the dimension of the dataset.
Definition: Data.hpp:213
void shuffle(const size_t &seed=42)
Shuffle the data with a given seed.
Definition: Data.hpp:1349
Rep const & X() const
Returns the attributes representation of the point (std::vector by default).
Definition: Point.hpp:139
double const & Y() const
Returns the class or value of the point.
Definition: Point.hpp:152
Definition: Solution.hpp:13
std::vector< double > alpha
Alpha Vector for Dual methods.
Definition: Solution.hpp:21
Definition: Perceptron.hpp:80
bool train() override
Function that execute the training phase of a Learner.
Definition: Perceptron.hpp:93
std::string getFormulationString() override
Returns a string that represents the formulation of the learner (Primal or Dual).
Definition: Perceptron.hpp:155
double evaluate(const Point< T > &p, bool raw_value) override
Returns the class of a feature point based on the trained Learner.
Definition: Perceptron.hpp:147
Definition: DualClassifier.hpp:16
Wrapper for the implementation of the Perceptron dual algorithm.
Definition: Perceptron.hpp:50
bool train() override
Function that execute the training phase of a Learner.
Definition: Perceptron.hpp:402
Wrapper for the implementation of the Perceptron dual with fixed margin algorithm.
Definition: Perceptron.hpp:69
bool train() override
Function that execute the training phase of a Learner.
Definition: Perceptron.hpp:480
Wrapper for the implementation of the Perceptron primal with fixed margin algorithm.
Definition: Perceptron.hpp:35
double evaluate(const Point< T > &p, bool raw_value=false) override
Returns the class of a feature point based on the trained Learner.
Definition: Perceptron.hpp:358
bool train() override
Function that execute the training phase of a Learner.
Definition: Perceptron.hpp:245
Wrapper for the implementation of the Perceptron primal algorithm.
Definition: Perceptron.hpp:21
double evaluate(const Point< T > &p, bool raw_value=false) override
Returns the class of a feature point based on the trained Learner.
Definition: Perceptron.hpp:229
bool train() override
Function that execute the training phase of a Learner.
Definition: Perceptron.hpp:180
Definition: PrimalClassifier.hpp:14
double evaluate(const Point< T > &p, bool raw_value=false) override
Returns the class of a feature point based on the trained Learner.
Definition: PrimalClassifier.hpp:42
A helper class to measure execution time for benchmarking purposes.
Definition: ThreadPool.hpp:503
UFJF-MLTK main namespace for core functionalities.
Definition: classifier/Classifier.hpp:11
T dot(const Point< T, R > &p, const Point< T, R > &p1)
Computes the dot product with a vector.
Definition: Point.hpp:528
T max(const Point< T, R > &p)
Returns the max value of the point.
Definition: Point.hpp:544