Aakash-kaushik/mlpack/logistic__regression__function__impl_8hpp_source.html

 #ifndef MLPACK_METHODS_LOGISTIC_REGRESSION_FUNCTION_IMPL_HPP
 #define MLPACK_METHODS_LOGISTIC_REGRESSION_FUNCTION_IMPL_HPP

 // In case it hasn't been included yet.
 #include "logistic_regression_function.hpp"

 #include <mlpack/core.hpp>

 namespace mlpack {
 namespace regression {

 // Builds the objective over the given predictors (one point per column) and
 // responses (one per point), with L2 penalty weight lambda.  The inputs are
 // aliased rather than copied.
 template<typename MatType>
 LogisticRegressionFunction<MatType>::LogisticRegressionFunction(
     const MatType& predictors,
     const arma::Row<size_t>& responses,
     const double lambda) :
     // The const_casts exist only so that the inputs can be aliased; the
     // original comment promises the aliased elements are never modified.
     predictors(math::MakeAlias(const_cast<MatType&>(predictors), false)),
     responses(math::MakeAlias(
         const_cast<arma::Row<size_t>&>(responses), false)),
     lambda(lambda)
 {
   // Within this body the names refer to the constructor arguments, not the
   // members of the same name.
   const size_t numPoints = predictors.n_cols;
   const size_t numResponses = responses.n_elem;

   // Every point has exactly one response: nothing else to check.
   if (numResponses == numPoints)
     return;

   // Size mismatch: report it through the fatal log stream.
   Log::Fatal << "LogisticRegressionFunction::LogisticRegressionFunction(): "
       << "predictors matrix has " << numPoints << " points, but "
       << "responses vector has " << numResponses << " elements (should be"
       << " " << numPoints << ")!" << std::endl;
 }

 // Reorders the points (and their responses) held by this function.
 template<typename MatType>
 void LogisticRegressionFunction<MatType>::Shuffle()
 {
   // Shuffle into fresh temporaries first, so that the data currently held
   // (which may alias the caller's memory) is only read here.
   arma::Row<size_t> shuffledResponses;
   MatType shuffledPredictors;
   math::ShuffleData(predictors, responses, shuffledPredictors,
       shuffledResponses);

   // Drop any alias before assigning, so the aliased memory is never
   // overwritten, then take ownership of the shuffled copy.
   math::ClearAlias(predictors);
   predictors = std::move(shuffledPredictors);

   math::ClearAlias(responses);
   responses = std::move(shuffledResponses);
 }

 // Evaluates the L2-regularized objective over all points.
 //
 // parameters(0, 0) is the intercept; the trailing parameters.n_elem - 1
 // columns are the weights applied to the predictors.
 template<typename MatType>
 double LogisticRegressionFunction<MatType>::Evaluate(
     const arma::mat& parameters) const
 {
   // With b the intercept, w the weights, x_i the i'th point, y_i its response
   // and s_i = sig(b + w x_i), the value returned is
   //
   //   0.5 * lambda * ||w||^2 - sum_i log(1 - y_i + s_i * (2 * y_i - 1)).
   //
   // For responses of 0 or 1 the summand is log(s_i) when y_i = 1 and
   // log(1 - s_i) when y_i = 0, i.e. the log-likelihood; it is negated because
   // the objective is minimized.  No division by the number of points is
   // performed.
   const size_t weightCount = parameters.n_elem - 1;

   // Sigmoid of (intercept + weights * x) for each point.  The intercept is
   // added directly and is not multiplied by any predictor.
   const arma::rowvec sigmoid = 1.0 / (1.0 + arma::exp(-(parameters(0, 0) +
       parameters.tail_cols(weightCount) * predictors)));

   // The responses are stored as size_t; convert to double for the arithmetic
   // below.
   const arma::rowvec labels = arma::conv_to<arma::rowvec>::from(responses);
   const double logLikelihood = arma::accu(arma::log(1.0 - labels + sigmoid %
       (2 * labels - 1.0)));

   // L2 penalty on the weights only; the intercept is excluded.
   const double penalty = 0.5 * lambda *
       arma::dot(parameters.tail_cols(weightCount),
       parameters.tail_cols(weightCount));

   return penalty - logLikelihood;
 }

 // Evaluates the objective on the batchSize points starting at column begin.
 // The L2 penalty is scaled by batchSize / predictors.n_cols.
 template<typename MatType>
 double LogisticRegressionFunction<MatType>::Evaluate(
     const arma::mat& parameters,
     const size_t begin,
     const size_t batchSize) const
 {
   const size_t weightCount = parameters.n_elem - 1;
   // Inclusive index of the final point in the batch.
   const size_t last = begin + batchSize - 1;

   // Sigmoid of (intercept + weights * x) for each point of the batch.
   const arma::rowvec sigmoid = 1.0 / (1.0 + arma::exp(-(parameters(0, 0) +
       parameters.tail_cols(weightCount) *
       predictors.cols(begin, last))));

   // Batch responses converted to double, then the batch log-likelihood.
   const arma::rowvec labels =
       arma::conv_to<arma::rowvec>::from(responses.subvec(begin, last));
   const double logLikelihood = arma::accu(arma::log(1.0 - labels + sigmoid %
       (2 * labels - 1.0)));

   // L2 penalty on the weights (intercept excluded), scaled to the batch.
   const double penalty = lambda *
       (batchSize / (2.0 * predictors.n_cols)) *
       arma::dot(parameters.tail_cols(weightCount),
                 parameters.tail_cols(weightCount));

   // Negate the log-likelihood, because this is a minimization.
   return penalty - logLikelihood;
 }

 // Computes the gradient of the objective over all points.  gradient is
 // resized to the shape of parameters; element 0 is the intercept component
 // and the trailing columns are the weight components.
 template<typename MatType>
 void LogisticRegressionFunction<MatType>::Gradient(
     const arma::mat& parameters,
     arma::mat& gradient) const
 {
   const size_t weightCount = parameters.n_elem - 1;

   // Sigmoid of (intercept + weights * x) for each point.
   const arma::rowvec sigmoids = (1 / (1 + arma::exp(-parameters(0, 0)
       - parameters.tail_cols(weightCount) * predictors)));

   // Derivative of the L2 penalty; it applies to the weights only.
   const arma::mat penalty = lambda * parameters.tail_cols(weightCount);

   gradient.set_size(parameters.n_rows, parameters.n_cols);

   // Intercept component: the summed residuals (sigmoid - response).
   gradient[0] = -arma::accu(responses - sigmoids);

   // Weight components: residuals projected onto the predictors, plus the
   // penalty derivative.
   gradient.tail_cols(weightCount) = (sigmoids - responses) *
       predictors.t() + penalty;
 }

 // Computes the gradient on the batchSize points starting at column begin.
 // gradient is resized to the shape of parameters; the penalty derivative is
 // scaled by batchSize / predictors.n_cols.
 template<typename MatType>
 template<typename GradType>
 void LogisticRegressionFunction<MatType>::Gradient(
     const arma::mat& parameters,
     const size_t begin,
     GradType& gradient,
     const size_t batchSize) const
 {
   const size_t weightCount = parameters.n_elem - 1;
   // Inclusive index of the final point in the batch.
   const size_t last = begin + batchSize - 1;

   // Linear response (intercept + weights * x) for each point of the batch,
   // followed by its sigmoid.
   const arma::rowvec exponents = parameters(0, 0) +
       parameters.tail_cols(weightCount) * predictors.cols(begin, last);
   const arma::rowvec sigmoids = 1.0 / (1.0 + arma::exp(-exponents));

   // Derivative of the L2 penalty on the weights, scaled to the batch.
   const arma::mat penalty = lambda * parameters.tail_cols(weightCount)
       / predictors.n_cols * batchSize;

   gradient.set_size(parameters.n_rows, parameters.n_cols);

   // Intercept component: the summed residuals over the batch.
   gradient[0] = -arma::accu(responses.subvec(begin, last) - sigmoids);

   // Weight components: batch residuals projected onto the batch predictors,
   // plus the penalty derivative.
   gradient.tail_cols(weightCount) =
       (sigmoids - responses.subvec(begin, last)) *
       predictors.cols(begin, last).t() + penalty;
 }

 // Computes the j'th component of the gradient over all points and stores it
 // in a sparse matrix shaped like parameters.
 //
 // parameters  Intercept in parameters(0, 0), weights in the trailing columns.
 // j           Index of the component to compute; 0 selects the intercept and
 //             j > 0 selects the weight applied to predictor row j - 1.
 // gradient    Output; after the call only element j is (possibly) non-zero.
 template <typename MatType>
 void LogisticRegressionFunction<MatType>::PartialGradient(
     const arma::mat& parameters,
     const size_t j,
     arma::sp_mat& gradient) const
 {
   // Residuals (response - sigmoid) for every point.
   const arma::rowvec diffs = responses - (1 / (1 + arma::exp(-parameters(0, 0)
       - parameters.tail_cols(parameters.n_elem - 1) * predictors)));

   // Reset the output explicitly.  set_size() is documented as not
   // initialising elements, so a gradient object reused across calls with
   // different j could otherwise keep entries from earlier calls.
   gradient.zeros(parameters.n_rows, parameters.n_cols);

   if (j == 0)
   {
     // Intercept component: no predictor factor and no regularization.
     gradient[j] = -arma::accu(diffs);
   }
   else
   {
     // Weight component: residuals weighted by predictor row j - 1, plus the
     // derivative of the L2 penalty for this weight.
     gradient[j] = arma::dot(-predictors.row(j - 1), diffs) + lambda *
       parameters(0, j);
   }
 }

 // Computes the objective and its gradient over all points in one pass,
 // sharing the sigmoid values between the two.  gradient is resized to the
 // shape of parameters; the objective value is returned.
 template<typename MatType>
 template<typename GradType>
 double LogisticRegressionFunction<MatType>::EvaluateWithGradient(
     const arma::mat& parameters,
     GradType& gradient) const
 {
   const size_t weightCount = parameters.n_elem - 1;

   // Sigmoid of (intercept + weights * x) for each point.
   const arma::rowvec sigmoids = 1.0 / (1.0 + arma::exp(-(parameters(0, 0) +
       parameters.tail_cols(weightCount) * predictors)));

   // L2 penalty on the weights (intercept excluded): its derivative for the
   // gradient, and its value for the objective.
   const arma::mat gradientPenalty = lambda *
       parameters.tail_cols(weightCount);
   const double objectivePenalty = lambda / 2.0 *
       arma::dot(parameters.tail_cols(weightCount),
                 parameters.tail_cols(weightCount));

   // Gradient: summed residuals for the intercept, residuals projected onto
   // the predictors (plus penalty derivative) for the weights.
   gradient.set_size(parameters.n_rows, parameters.n_cols);
   gradient[0] = -arma::accu(responses - sigmoids);
   gradient.tail_cols(weightCount) = (sigmoids - responses) *
       predictors.t() + gradientPenalty;

   // Objective: reuse the sigmoids for the log-likelihood.  The responses are
   // converted to double for the arithmetic.
   const arma::rowvec labels = arma::conv_to<arma::rowvec>::from(responses);
   const double logLikelihood = arma::accu(arma::log(1.0 - labels + sigmoids %
       (2 * labels - 1.0)));

   // Negate the log-likelihood, because this is a minimization.
   return objectivePenalty - logLikelihood;
 }

 // Computes the objective and its gradient on the batchSize points starting
 // at column begin, sharing the sigmoid values between the two.  Both penalty
 // terms are scaled by batchSize / predictors.n_cols.
 template<typename MatType>
 template<typename GradType>
 double LogisticRegressionFunction<MatType>::EvaluateWithGradient(
     const arma::mat& parameters,
     const size_t begin,
     GradType& gradient,
     const size_t batchSize) const
 {
   const size_t weightCount = parameters.n_elem - 1;
   // Inclusive index of the final point in the batch.
   const size_t last = begin + batchSize - 1;

   // Sigmoid of (intercept + weights * x) for each point of the batch.
   const arma::rowvec sigmoids = 1.0 / (1.0 + arma::exp(-(parameters(0, 0) +
       parameters.tail_cols(weightCount) *
       predictors.cols(begin, last))));

   // L2 penalty on the weights (intercept excluded), scaled to the batch: its
   // derivative for the gradient, and its value for the objective.
   const arma::mat gradientPenalty =
       lambda * parameters.tail_cols(weightCount) / predictors.n_cols *
       batchSize;
   const double objectivePenalty = lambda *
       (batchSize / (2.0 * predictors.n_cols)) *
       arma::dot(parameters.tail_cols(weightCount),
                 parameters.tail_cols(weightCount));

   // Gradient: summed batch residuals for the intercept, batch residuals
   // projected onto the batch predictors (plus penalty) for the weights.
   gradient.set_size(parameters.n_rows, parameters.n_cols);
   gradient[0] = -arma::accu(responses.subvec(begin, last) - sigmoids);
   gradient.tail_cols(weightCount) =
       (sigmoids - responses.subvec(begin, last)) *
       predictors.cols(begin, last).t() + gradientPenalty;

   // Objective: reuse the sigmoids for the batch log-likelihood.
   const arma::rowvec labels =
       arma::conv_to<arma::rowvec>::from(responses.subvec(begin, last));
   const double logLikelihood = arma::accu(arma::log(1.0 - labels + sigmoids %
       (2 * labels - 1.0)));

   // Negate the log-likelihood, because this is a minimization.
   return objectivePenalty - logLikelihood;
 }

 } // namespace regression
 } // namespace mlpack

 #endif
logistic_regression_function.hpp

mlpack::regression::LogisticRegressionFunction::Gradient
void Gradient(const arma::mat &parameters, arma::mat &gradient) const
Evaluate the gradient of the logistic regression log-likelihood function with the given parameters...
Definition: logistic_regression_function_impl.hpp:137

mlpack::Log::Fatal
static MLPACK_EXPORT util::PrefixedOutStream Fatal
Prints fatal messages prefixed with [FATAL], then terminates the program.
Definition: log.hpp:90

mlpack
Linear algebra utility functions, generally performed on matrices or vectors.
Definition: cv.hpp:1

mlpack::regression::LogisticRegressionFunction::PartialGradient
void PartialGradient(const arma::mat &parameters, const size_t j, arma::sp_mat &gradient) const
Evaluate the gradient of the logistic regression log-likelihood function with the given parameters...
Definition: logistic_regression_function_impl.hpp:188

arma

mlpack::regression::LogisticRegressionFunction::Evaluate
double Evaluate(const arma::mat &parameters) const
Evaluate the logistic regression log-likelihood function with the given parameters.
Definition: logistic_regression_function_impl.hpp:69

mlpack::regression::LogisticRegressionFunction::EvaluateWithGradient
double EvaluateWithGradient(const arma::mat &parameters, GradType &gradient) const
Evaluate the objective function and gradient of the logistic regression log-likelihood function simul...
Definition: logistic_regression_function_impl.hpp:211

core.hpp
Include all of the base components required to write mlpack methods, and the main mlpack Doxygen docu...

mlpack::regression::LogisticRegressionFunction::Shuffle
void Shuffle()
Shuffle the order of function visitation.
Definition: logistic_regression_function_impl.hpp:48

mlpack::math::ShuffleData
void ShuffleData(const MatType &inputPoints, const LabelsType &inputLabels, MatType &outputPoints, LabelsType &outputLabels, const std::enable_if_t<!arma::is_SpMat< MatType >::value > *=0, const std::enable_if_t<!arma::is_Cube< MatType >::value > *=0)
Shuffle a dataset and associated labels (or responses).
Definition: shuffle_data.hpp:28

mlpack::math::ClearAlias
void ClearAlias(arma::Mat< ElemType > &mat)
Clear an alias so that no data is overwritten.
Definition: make_alias.hpp:110

mlpack::math::MakeAlias
arma::Cube< ElemType > MakeAlias(arma::Cube< ElemType > &input, const bool strict=true)
Make an alias of a dense cube.
Definition: make_alias.hpp:24

mlpack::regression::LogisticRegressionFunction::LogisticRegressionFunction
LogisticRegressionFunction(const MatType &predictors, const arma::Row< size_t > &responses, const double lambda=0)
Creates the LogisticRegressionFunction.
Definition: logistic_regression_function_impl.hpp:24