mlpack
linear_svm_function_impl.hpp
Go to the documentation of this file.
1 
14 #ifndef MLPACK_METHODS_LINEAR_SVM_LINEAR_SVM_FUNCTION_IMPL_HPP
15 #define MLPACK_METHODS_LINEAR_SVM_LINEAR_SVM_FUNCTION_IMPL_HPP
16 
19 
20 // In case it hasn't been included yet.
21 #include "linear_svm_function.hpp"
22 
23 namespace mlpack {
24 namespace svm {
25 
26 template <typename MatType>
28  const MatType& dataset,
29  const arma::Row<size_t>& labels,
30  const size_t numClasses,
31  const double lambda,
32  const double delta,
33  const bool fitIntercept) :
34  dataset(math::MakeAlias(const_cast<MatType&>(dataset), false)),
35  numClasses(numClasses),
36  lambda(lambda),
37  delta(delta),
38  fitIntercept(fitIntercept)
39 {
40  InitializeWeights(initialPoint, dataset.n_rows, numClasses, fitIntercept);
41  initialPoint *= 0.005;
42 
43  // Calculate the label matrix.
44  GetGroundTruthMatrix(labels, groundTruth);
45 }
46 
52 template <typename MatType>
54  arma::mat &weights,
55  const size_t featureSize,
56  const size_t numClasses,
57  const bool fitIntercept)
58 {
59  // Initialize values to 0.005 * r. 'r' is a matrix of random values taken from
60  // a Gaussian distribution with mean zero and variance one.
61  if (fitIntercept)
62  weights.randn(featureSize + 1, numClasses);
63  else
64  weights.randn(featureSize, numClasses);
65  weights *= 0.005;
66 }
67 
73 template <typename MatType>
75  const arma::Row<size_t>& labels,
76  arma::sp_mat& groundTruth)
77 {
78  // Calculate the ground truth matrix according to the labels passed. The
79  // ground truth matrix is a matrix of dimensions 'numClasses * numExamples',
80  // where each column contains a single entry of '1', marking the label
81  // corresponding to that example.
82 
83  // Row pointers and column pointers corresponding to the entries.
84  arma::uvec rowPointers(labels.n_elem);
85  arma::uvec colPointers(labels.n_elem + 1);
86 
87  // colPointers[0] needs to be set to 0.
88  colPointers[0] = 0;
89 
90  // Row pointers are the labels of the examples, and column pointers are the
91  // number of cumulative entries made uptil that column.
92  for (size_t i = 0; i < labels.n_elem; ++i)
93  {
94  rowPointers(i) = labels(i);
95  colPointers(i + 1) = i + 1;
96  }
97 
98  // All entries are '1'.
99  arma::vec values;
100  values.ones(labels.n_elem);
101 
102  // Calculate the matrix.
103  groundTruth = arma::sp_mat(rowPointers, colPointers, values, numClasses,
104  labels.n_elem);
105 }
106 
110 template <typename MatType>
112 {
113  // Determine new ordering.
114  arma::uvec ordering = arma::shuffle(arma::linspace<arma::uvec>(0,
115  dataset.n_cols - 1, dataset.n_cols));
116 
117  // Re-sort data.
118  arma::mat newData = dataset.cols(ordering);
119  math::ClearAlias(dataset);
120  dataset = std::move(newData);
121 
122  // Assemble data for batch constructor. We need reverse orderings though...
123  arma::uvec reverseOrdering(ordering.n_elem);
124  for (size_t i = 0; i < ordering.n_elem; ++i)
125  reverseOrdering[ordering[i]] = i;
126 
127  arma::umat newLocations(2, groundTruth.n_nonzero);
128  arma::vec values(groundTruth.n_nonzero);
129  arma::sp_mat::const_iterator it = groundTruth.begin();
130  size_t loc = 0;
131  while (it != groundTruth.end())
132  {
133  newLocations(0, loc) = reverseOrdering(it.col());
134  newLocations(1, loc) = it.row();
135  values(loc) = (*it);
136 
137  ++it;
138  ++loc;
139  }
140 
141  groundTruth = arma::sp_mat(newLocations, values, groundTruth.n_rows,
142  groundTruth.n_cols);
143 }
144 
145 template <typename MatType>
147  const arma::mat& parameters)
148 {
149  // The objective function is the hinge loss function and it is
150  // calculated over all the training examples.
151 
152  // Calculate the loss and regularization terms.
153  // L_i = Σ_i Σ_m max(0, Δ + (w_m x_i + b_m) - (w_{y_i} x_i + b_{y_i}))
154  // where (m != y_i)
155  double loss, regularization;
156 
157  // Scores for each class are evaluated.
158  arma::mat scores;
159 
160  // Check intercept condition.
161  if (!fitIntercept)
162  {
163  scores = parameters.t() * dataset;
164  }
165  else
166  {
167  // When using `fitIntercept` we need to add the `b_i` term explicitly.
168  // The first `parameters.n_rows - 1` rows of parameters holds the value
169  // of Weights `w_i`, and the last row holds `b_i`.
170  // On calculating the score, we add `b_i` term to each element of
171  // `i_th` row of `scores`.
172  scores = parameters.rows(0, dataset.n_rows - 1).t() * dataset
173  + arma::repmat(parameters.row(dataset.n_rows).t(), 1,
174  dataset.n_cols);
175  }
176 
177  // Evaluate the margin by the following steps:
178  // - Subtracting the score of correct class from all the class scores.
179  // - Adding the margin parameter `delta`.
180  // - Removing the `delta` parameter from correct class label in each
181  // column.
182  arma::mat margin = scores - (arma::repmat(arma::ones(numClasses).t()
183  * (scores % groundTruth), numClasses, 1)) + delta
184  - (delta * groundTruth);
185 
186  // The Hinge Loss Function
187  loss = arma::accu(arma::clamp(margin, 0.0, DBL_MAX)) / dataset.n_cols;
188 
189  // Adding the regularization term.
190  regularization = 0.5 * lambda * arma::dot(parameters, parameters);
191 
192  return loss + regularization;
193 }
194 
195 template <typename MatType>
197  const arma::mat& parameters,
198  const size_t firstId,
199  const size_t batchSize)
200 {
201  const size_t lastId = firstId + batchSize - 1;
202 
203  // Calculate the loss and regularization terms.
204  double loss, regularization, cost;
205 
206  // Scores for each class are evaluated.
207  arma::mat scores;
208 
209  // Check intercept condition.
210  if (!fitIntercept)
211  {
212  scores = parameters.t() * dataset.cols(firstId, lastId);
213  }
214  else
215  {
216  scores = parameters.rows(0, dataset.n_rows - 1).t()
217  * dataset.cols(firstId, lastId)
218  + arma::repmat(parameters.row(dataset.n_rows).t(), 1,
219  dataset.n_cols);
220  }
221 
222  arma::mat margin = scores - (arma::repmat(arma::ones(numClasses).t()
223  * (scores % groundTruth.cols(firstId, lastId)), numClasses, 1))
224  + delta - (delta * groundTruth.cols(firstId, lastId));
225 
226  // The Hinge Loss Function
227  loss = arma::accu(arma::clamp(margin, 0.0, DBL_MAX));
228  loss /= batchSize;
229 
230  // Adding the regularization term.
231  regularization = 0.5 * lambda * arma::dot(parameters, parameters);
232 
233  cost = loss + regularization;
234  return cost;
235 }
236 
237 template <typename MatType>
238 template <typename GradType>
240  const arma::mat& parameters,
241  GradType& gradient)
242 {
243  // The objective is to minimize the loss, which is evaluated as the sum
244  // of all the positive elements of `margin` matrix.
245  // So, we focus of these positive elements and reduce them.
246  // Also, we need to increase the score of the correct class.
247 
248  // Scores for each class are evaluated.
249  arma::mat scores;
250 
251  if (!fitIntercept)
252  {
253  scores = parameters.t() * dataset;
254  }
255  else
256  {
257  scores = parameters.rows(0, dataset.n_rows - 1).t() * dataset
258  + arma::repmat(parameters.row(dataset.n_rows).t(), 1,
259  dataset.n_cols);
260  }
261 
262  arma::mat margin = scores - (arma::repmat(arma::ones(numClasses).t()
263  * (scores % groundTruth), numClasses, 1)) + delta
264  - (delta * groundTruth);
265 
266  // An element of `mask` matrix holds `1` corresponding to
267  // each positive element of `margin` matrix.
268  arma::mat mask = margin.for_each([](arma::mat::elem_type& val)
269  { val = (val > 0) ? 1: 0; });
270 
271  arma::mat difference = groundTruth
272  % (-arma::repmat(arma::sum(mask), numClasses, 1)) + mask;
273 
274  // The gradient is evaluated as follows:
275  // - Add `x_i` to `w_j` if `margin_i_m`is positive.
276  // - Subtract `x_i` from `w_y_i` for each positive
277  // `margin_i_j`.
278  // - Take the average over the size of dataset.
279  // - Add the regularization parameter.
280 
281  // Check intercept condition
282  if (!fitIntercept)
283  {
284  gradient = dataset * difference.t();
285  }
286  else
287  {
288  gradient.set_size(arma::size(parameters));
289  gradient.submat(0, 0, parameters.n_rows - 2, parameters.n_cols - 1) =
290  dataset * difference.t();
291  gradient.row(parameters.n_rows - 1) =
292  arma::ones<arma::rowvec>(dataset.n_cols) * difference.t();
293  }
294 
295  gradient /= dataset.n_cols;
296 
297  // Adding the regularization contribution to the gradient.
298  gradient += lambda * parameters;
299 }
300 
301 template <typename MatType>
302 template <typename GradType>
304  const arma::mat& parameters,
305  const size_t firstId,
306  GradType& gradient,
307  const size_t batchSize)
308 {
309  const size_t lastId = firstId + batchSize - 1;
310 
311  // Scores for each class are evaluated.
312  arma::mat scores;
313 
314  // Check intercept condition.
315  if (!fitIntercept)
316  {
317  scores = parameters.t() * dataset.cols(firstId, lastId);
318  }
319  else
320  {
321  scores = parameters.rows(0, dataset.n_rows - 1).t()
322  * dataset.cols(firstId, lastId)
323  + arma::repmat(parameters.row(dataset.n_rows).t(), 1, batchSize);
324  }
325 
326  arma::mat margin = scores - (arma::repmat(arma::ones(numClasses).t()
327  * (scores % groundTruth.cols(firstId, lastId)), numClasses, 1))
328  + delta - (delta * groundTruth.cols(firstId, lastId));
329 
330  // For each sample, find the total number of classes where
331  // ( margin > 0 ).
332  arma::mat mask = margin.for_each([](arma::mat::elem_type& val)
333  { val = (val > 0) ? 1: 0; });
334 
335  arma::mat difference = groundTruth.cols(firstId, lastId)
336  % (-arma::repmat(arma::sum(mask), numClasses, 1)) + mask;
337 
338  // Check intercept condition
339  if (!fitIntercept)
340  {
341  gradient = dataset.cols(firstId, lastId) * difference.t();
342  }
343  else
344  {
345  gradient.set_size(arma::size(parameters));
346  gradient.submat(0, 0, parameters.n_rows - 2, parameters.n_cols - 1) =
347  dataset.cols(firstId, lastId) * difference.t();
348  gradient.row(parameters.n_rows - 1) =
349  arma::ones<arma::rowvec>(batchSize) * difference.t();
350  }
351 
352  gradient /= batchSize;
353 
354  // Adding the regularization contribution to the gradient.
355  gradient += lambda * parameters;
356 }
357 
358 template <typename MatType>
359 template <typename GradType>
361  const arma::mat& parameters,
362  GradType& gradient) const
363 {
364  double loss, regularization, cost;
365 
366  // Scores for each class are evaluated.
367  arma::mat scores;
368 
369  if (!fitIntercept)
370  {
371  scores = parameters.t() * dataset;
372  }
373  else
374  {
375  scores = parameters.rows(0, dataset.n_rows - 1).t() * dataset
376  + arma::repmat(parameters.row(dataset.n_rows).t(), 1,
377  dataset.n_cols);
378  }
379 
380  arma::mat margin = scores - (arma::repmat(arma::ones(numClasses).t()
381  * (scores % groundTruth), numClasses, 1)) + delta
382  - (delta * groundTruth);
383 
384  // For each sample, find the total number of classes where
385  // ( margin > 0 ).
386  arma::mat mask = margin.for_each([](arma::mat::elem_type& val)
387  { val = (val > 0) ? 1: 0; });
388 
389  arma::mat difference = groundTruth
390  % (-arma::repmat(arma::sum(mask), numClasses, 1)) + mask;
391 
392  // Check intercept condition
393  if (!fitIntercept)
394  {
395  gradient = dataset * difference.t();
396  }
397  else
398  {
399  gradient.set_size(arma::size(parameters));
400  gradient.submat(0, 0, parameters.n_rows - 2, parameters.n_cols - 1) =
401  dataset * difference.t();
402  gradient.row(parameters.n_rows - 1) =
403  arma::ones<arma::rowvec>(dataset.n_cols) * difference.t();
404  }
405 
406  gradient /= dataset.n_cols;
407 
408  // Adding the regularization contribution to the gradient.
409  gradient += lambda * parameters;
410 
411  // The Hinge Loss Function
412  loss = arma::accu(arma::clamp(margin, 0.0, DBL_MAX));
413  loss /= dataset.n_cols;
414 
415  // Adding the regularization term.
416  regularization = 0.5 * lambda * arma::dot(parameters, parameters);
417 
418  cost = loss + regularization;
419  return cost;
420 }
421 
422 template <typename MatType>
423 template <typename GradType>
425  const arma::mat& parameters,
426  const size_t firstId,
427  GradType& gradient,
428  const size_t batchSize) const
429 {
430  const size_t lastId = firstId + batchSize - 1;
431 
432  // Calculate the loss and regularization terms.
433  double loss, regularization, cost;
434 
435  // Scores for each class are evaluated.
436  arma::mat scores;
437 
438  // Check intercept condition.
439  if (!fitIntercept)
440  {
441  scores = parameters.t() * dataset.cols(firstId, lastId);
442  }
443  else
444  {
445  scores = parameters.rows(0, dataset.n_rows - 1).t()
446  * dataset.cols(firstId, lastId)
447  + arma::repmat(parameters.row(dataset.n_rows).t(), 1, dataset.n_cols);
448  }
449 
450  arma::mat margin = scores - (arma::repmat(arma::ones(numClasses).t()
451  * (scores % groundTruth.cols(firstId, lastId)), numClasses, 1))
452  + delta - (delta * groundTruth.cols(firstId, lastId));
453 
454  // For each sample, find the total number of classes where
455  // ( margin > 0 ).
456  arma::mat mask = margin.for_each([](arma::mat::elem_type& val)
457  { val = (val > 0) ? 1: 0; });
458 
459  arma::mat difference = groundTruth.cols(firstId, lastId)
460  % (-arma::repmat(arma::sum(mask), numClasses, 1)) + mask;
461 
462  // Check intercept condition
463  if (!fitIntercept)
464  {
465  gradient = dataset.cols(firstId, lastId) * difference.t();
466  }
467  else
468  {
469  gradient.set_size(arma::size(parameters));
470  gradient.submat(0, 0, parameters.n_rows - 2, parameters.n_cols - 1) =
471  dataset.cols(firstId, lastId) * difference.t();
472  gradient.row(parameters.n_rows - 1) =
473  arma::ones<arma::rowvec>(batchSize) * difference.t();
474  }
475 
476  gradient /= batchSize;
477 
478 
479  // Adding the regularization contribution to the gradient.
480  gradient += lambda * parameters;
481 
482  // The Hinge Loss Function
483  loss = arma::accu(arma::clamp(margin.cols(firstId, lastId), 0.0, DBL_MAX));
484  loss /= batchSize;
485 
486  // Adding the regularization term.
487  regularization = 0.5 * lambda * arma::dot(parameters, parameters);
488 
489  cost = loss + regularization;
490  return cost;
491 }
492 
493 template <typename MatType>
495 {
496  // The number of points in the dataset is the number of functions, as this
497  // is a data dependent function.
498  return dataset.n_cols;
499 }
500 
501 } // namespace svm
502 } // namespace mlpack
503 
504 
505 #endif // MLPACK_METHODS_LINEAR_SVM_LINEAR_SVM_FUNCTION_IMPL_HPP
Linear algebra utility functions, generally performed on matrices or vectors.
Definition: cv.hpp:1
void GetGroundTruthMatrix(const arma::Row< size_t > &labels, arma::sp_mat &groundTruth)
Constructs the ground truth label matrix with the passed labels.
Definition: linear_svm_function_impl.hpp:74
double EvaluateWithGradient(const arma::mat &parameters, GradType &gradient) const
Evaluate the hinge loss function and its gradient, following the LinearFunctionType requirements on the EvaluateWithGradient function.
Definition: linear_svm_function_impl.hpp:360
void Gradient(const arma::mat &parameters, GradType &gradient)
Evaluate the gradient of the hinge loss function, following the LinearFunctionType requirements on the Gradient function.
Definition: linear_svm_function_impl.hpp:239
LinearSVMFunction(const MatType &dataset, const arma::Row< size_t > &labels, const size_t numClasses, const double lambda=0.0001, const double delta=1.0, const bool fitIntercept=false)
Construct the Linear SVM objective function with given parameters.
Definition: linear_svm_function_impl.hpp:27
double Evaluate(const arma::mat &parameters)
Evaluate the hinge loss function for all the datapoints.
Definition: linear_svm_function_impl.hpp:146
size_t NumFunctions() const
Return the number of functions.
Definition: linear_svm_function_impl.hpp:494
void ClearAlias(arma::Mat< ElemType > &mat)
Clear an alias so that no data is overwritten.
Definition: make_alias.hpp:110
void Shuffle()
Shuffle the dataset.
Definition: linear_svm_function_impl.hpp:111
arma::Cube< ElemType > MakeAlias(arma::Cube< ElemType > &input, const bool strict=true)
Make an alias of a dense cube.
Definition: make_alias.hpp:24
static void InitializeWeights(arma::mat &weights, const size_t featureSize, const size_t numClasses, const bool fitIntercept=false)
Initialize Linear SVM weights (trainable parameters) with the given parameters.
Definition: linear_svm_function_impl.hpp:53