/**
 * @file regularized_svd_function_impl.hpp
 *
 * An implementation of the RegularizedSVDFunction class.
 */
#ifndef MLPACK_METHODS_REGULARIZED_SVD_REGULARIZED_SVD_FUNCTION_IMPL_HPP
#define MLPACK_METHODS_REGULARIZED_SVD_REGULARIZED_SVD_FUNCTION_IMPL_HPP

// In case it hasn't been included yet.
#include "regularized_svd_function.hpp"

namespace mlpack {
namespace svd {

template <typename MatType>
RegularizedSVDFunction<MatType>::RegularizedSVDFunction(const MatType& data,
                                                        const size_t rank,
                                                        const double lambda) :
    data(math::MakeAlias(const_cast<MatType&>(data), false)),
    rank(rank),
    lambda(lambda)
{
  // Number of users and items in the data.
  numUsers = arma::max(data.row(0)) + 1;
  numItems = arma::max(data.row(1)) + 1;

  // Initialize the parameters.
  initialPoint.randu(rank, numUsers + numItems);
}
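
// A minimal usage sketch (not part of this file's implementation): `ratings`
// is assumed to be a 3 x N matrix whose rows hold user IDs, item IDs, and
// rating values, which is the layout the constructor above expects.
//
//   arma::mat ratings = { { 0, 0, 1, 1 },    // user IDs
//                         { 0, 1, 0, 2 },    // item IDs
//                         { 4, 3, 5, 2 } };  // ratings
//   RegularizedSVDFunction<arma::mat> f(ratings, /* rank */ 2,
//                                       /* lambda */ 0.01);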

template <typename MatType>
void RegularizedSVDFunction<MatType>::Shuffle()
{
  data = data.cols(arma::shuffle(arma::linspace<arma::uvec>(0, data.n_cols - 1,
      data.n_cols)));
}

template <typename MatType>
double RegularizedSVDFunction<MatType>::Evaluate(const arma::mat& parameters)
    const
{
  return Evaluate(parameters, 0, data.n_cols);
}

template <typename MatType>
double RegularizedSVDFunction<MatType>::Evaluate(const arma::mat& parameters,
                                                 const size_t start,
                                                 const size_t batchSize) const
{
  // The cost for the optimization is as follows:
  //   f(u, v) = sum((rating(i, j) - u(i).t() * v(j))^2)
  // where the sum is over all the ratings in the rating matrix; 'i' indexes
  // the user and 'j' indexes the item being considered.  A regularization
  // term is added to this cost, penalizing the vectors u(i) and v(j) for
  // each rating they contribute to.
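  //
  // Written out per example (a restatement of the cost above with the
  // regularization term included, added for clarity), the contribution of
  // the rating stored in column i of the data is:
  //   f_i = (rating - u(user).t() * v(item))^2
  //         + lambda * (||u(user)||^2 + ||v(item)||^2)
  // and this function returns the sum of f_i over the batch.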

  // It's possible this loop could be changed so that it's SIMD-vectorized.
  double objective = 0.0;
  for (size_t i = start; i < start + batchSize; ++i)
  {
    // Indices for accessing the correct parameter columns.
    const size_t user = data(0, i);
    const size_t item = data(1, i) + numUsers;

    // Calculate the squared error in the prediction.
    const double rating = data(2, i);
    double ratingError = rating - arma::dot(parameters.col(user),
                                            parameters.col(item));
    double ratingErrorSquared = ratingError * ratingError;

    // Calculate the regularization penalty corresponding to the parameters.
    double userVecNorm = arma::norm(parameters.col(user), 2);
    double itemVecNorm = arma::norm(parameters.col(item), 2);
    double regularizationError = lambda * (userVecNorm * userVecNorm +
                                           itemVecNorm * itemVecNorm);

    objective += (ratingErrorSquared + regularizationError);
  }

  return objective;
}

template <typename MatType>
void RegularizedSVDFunction<MatType>::Gradient(const arma::mat& parameters,
                                               arma::mat& gradient) const
{
  // For an example with a rating corresponding to user 'i' and item 'j', the
  // gradients for the parameters are as follows:
  //   grad(u(i)) = lambda * u(i) - error * v(j)
  //   grad(v(j)) = lambda * v(j) - error * u(i)
  // where 'error' is the prediction error for that example:
  //   rating(i, j) - u(i).t() * v(j)
  // The full gradient is calculated by summing these contributions over all
  // the training examples.
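  //
  // These expressions follow from differentiating one term of the objective
  // (a short derivation added for clarity, matching the cost in Evaluate()):
  //   d/du(i) [(rating - u(i).t() * v(j))^2 + lambda * ||u(i)||^2]
  //     = -2 * error * v(j) + 2 * lambda * u(i)
  //     = 2 * (lambda * u(i) - error * v(j))
  // and symmetrically for v(j); the factor of 2 appears in the updates below.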

  gradient.zeros(rank, numUsers + numItems);

  for (size_t i = 0; i < data.n_cols; ++i)
  {
    // Indices for accessing the correct parameter columns.
    const size_t user = data(0, i);
    const size_t item = data(1, i) + numUsers;

    // Prediction error for the example.
    const double rating = data(2, i);
    double ratingError = rating - arma::dot(parameters.col(user),
                                            parameters.col(item));

    // Gradient is non-zero only for the parameter columns corresponding to
    // the example.
    gradient.col(user) += 2 * (lambda * parameters.col(user) -
                               ratingError * parameters.col(item));
    gradient.col(item) += 2 * (lambda * parameters.col(item) -
                               ratingError * parameters.col(user));
  }
}
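
// A quick numerical sanity check for the gradient above (a sketch only; it
// assumes the accessors GetInitialPoint() and Evaluate() declared in
// regularized_svd_function.hpp, and is not part of this implementation):
//
//   RegularizedSVDFunction<arma::mat> f(ratings, rank, lambda);
//   arma::mat params = f.GetInitialPoint(), grad;
//   f.Gradient(params, grad);
//   const double eps = 1e-6;
//   arma::mat perturbed = params;
//   perturbed(0, 0) += eps;
//   // Forward difference; should be close to grad(0, 0).
//   const double numeric = (f.Evaluate(perturbed) - f.Evaluate(params)) / eps;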

template <typename MatType>
template <typename GradType>
void RegularizedSVDFunction<MatType>::Gradient(const arma::mat& parameters,
                                               const size_t start,
                                               GradType& gradient,
                                               const size_t batchSize) const
{
  gradient.zeros(rank, numUsers + numItems);

  // It's possible this could be SIMD-vectorized for additional speedup.
  for (size_t i = start; i < start + batchSize; ++i)
  {
    const size_t user = data(0, i);
    const size_t item = data(1, i) + numUsers;

    // Prediction error for the example.
    const double rating = data(2, i);
    double ratingError = rating - arma::dot(parameters.col(user),
                                            parameters.col(item));

    // Gradient is non-zero only for the parameter columns corresponding to
    // the example.
    gradient.col(user) += 2 * (lambda * parameters.col(user) -
                               ratingError * parameters.col(item));
    gradient.col(item) += 2 * (lambda * parameters.col(item) -
                               ratingError * parameters.col(user));
  }
}

} // namespace svd
} // namespace mlpack

// Template specialization for the SGD optimizer.
namespace ens {

template <>
template <>
double StandardSGD::Optimize(
    mlpack::svd::RegularizedSVDFunction<arma::mat>& function,
    arma::mat& parameters)
{
  // Find the number of functions to use.
  const size_t numFunctions = function.NumFunctions();

  // To keep track of where we are and how things are going.
  size_t currentFunction = 0;
  double overallObjective = 0;

  // Calculate the first objective function.
  for (size_t i = 0; i < numFunctions; ++i)
    overallObjective += function.Evaluate(parameters, i);

  const arma::mat data = function.Dataset();

  // Now iterate!
  for (size_t i = 1; i != maxIterations; ++i, currentFunction++)
  {
    // Is this iteration the start of a sequence?
    if ((currentFunction % numFunctions) == 0)
    {
      const size_t epoch = i / numFunctions + 1;
      mlpack::Log::Info << "Epoch " << epoch << "; " << "objective "
          << overallObjective << "." << std::endl;

      // Reset the counter variables.
      overallObjective = 0;
      currentFunction = 0;
    }

    const size_t numUsers = function.NumUsers();

    // Indices for accessing the correct parameter columns.
    const size_t user = data(0, currentFunction);
    const size_t item = data(1, currentFunction) + numUsers;

    // Prediction error for the example.
    const double rating = data(2, currentFunction);
    double ratingError = rating - arma::dot(parameters.col(user),
                                            parameters.col(item));

    double lambda = function.Lambda();

    // Gradient is non-zero only for the parameter columns corresponding to
    // the example.
    parameters.col(user) -= stepSize * (lambda * parameters.col(user) -
                                        ratingError * parameters.col(item));
    parameters.col(item) -= stepSize * (lambda * parameters.col(item) -
                                        ratingError * parameters.col(user));

    // Now add that to the overall objective function.
    overallObjective += function.Evaluate(parameters, currentFunction);
  }

  return overallObjective;
}
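
// How this specialization is typically reached (a sketch in the spirit of
// mlpack's RegularizedSVD class; the ens::StandardSGD constructor arguments
// shown — step size, batch size, maximum iterations — are assumptions here,
// not values prescribed by this file):
//
//   mlpack::svd::RegularizedSVDFunction<arma::mat> rSVDFunc(data, rank,
//       lambda);
//   ens::StandardSGD optimizer(/* stepSize */ 0.01, /* batchSize */ 1,
//       /* maxIterations */ iterations * data.n_cols);
//   arma::mat parameters = rSVDFunc.GetInitialPoint();
//   optimizer.Optimize(rSVDFunc, parameters);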

template <>
template <>
inline double ParallelSGD<ExponentialBackoff>::Optimize(
    mlpack::svd::RegularizedSVDFunction<arma::mat>& function,
    arma::mat& iterate)
{
  double overallObjective = DBL_MAX;
  double lastObjective;

  // The order in which the functions will be visited.
  arma::Col<size_t> visitationOrder = arma::linspace<arma::Col<size_t>>(0,
      (function.NumFunctions() - 1), function.NumFunctions());

  const arma::mat data = function.Dataset();

  // Iterate till the objective is within tolerance or the maximum number of
  // allowed iterations is reached. If maxIterations is 0, this will iterate
  // till convergence.
  for (size_t i = 1; i != maxIterations; ++i)
  {
    // Calculate the overall objective.
    lastObjective = overallObjective;
    overallObjective = 0;

    #pragma omp parallel for reduction(+:overallObjective)
    for (omp_size_t j = 0; j < (omp_size_t) function.NumFunctions(); ++j)
    {
      overallObjective += function.Evaluate(iterate, j);
    }

    // Output current objective function.
    mlpack::Log::Info << "Parallel SGD: iteration " << i << ", objective "
        << overallObjective << "." << std::endl;

    if (std::isnan(overallObjective) || std::isinf(overallObjective))
    {
      mlpack::Log::Warn << "Parallel SGD: converged to " << overallObjective
          << "; terminating with failure. Try a smaller step size?"
          << std::endl;
      return overallObjective;
    }

    if (std::abs(lastObjective - overallObjective) < tolerance)
    {
      mlpack::Log::Info << "SGD: minimized within tolerance " << tolerance
          << "; terminating optimization." << std::endl;
      return overallObjective;
    }

    // Get the step size for this iteration.
    double stepSize = decayPolicy.StepSize(i);

    if (shuffle) // Determine order of visitation.
      std::shuffle(visitationOrder.begin(), visitationOrder.end(),
          mlpack::math::randGen);

    #pragma omp parallel
    {
      // Each processor gets a subset of the instances.
      // Each subset is of size threadShareSize.
      size_t threadId = 0;
      #ifdef HAS_OPENMP
      threadId = omp_get_thread_num();
      #endif

      for (size_t j = threadId * threadShareSize;
          j < (threadId + 1) * threadShareSize && j < visitationOrder.n_elem;
          ++j)
      {
        const size_t numUsers = function.NumUsers();

        // Indices for accessing the correct parameter columns.
        const size_t user = data(0, visitationOrder[j]);
        const size_t item = data(1, visitationOrder[j]) + numUsers;

        // Prediction error for the example.
        const double rating = data(2, visitationOrder[j]);
        double ratingError = rating - arma::dot(iterate.col(user),
                                                iterate.col(item));

        double lambda = function.Lambda();

        arma::mat userUpdate = stepSize * (lambda * iterate.col(user) -
                                           ratingError * iterate.col(item));
        arma::mat itemUpdate = stepSize * (lambda * iterate.col(item) -
                                           ratingError * iterate.col(user));

        // Gradient is non-zero only for the parameter columns corresponding
        // to the example.  (The loop variable is 'k' to avoid shadowing the
        // outer iteration counter 'i'.)
        for (size_t k = 0; k < iterate.n_rows; ++k)
        {
          #pragma omp atomic
          iterate(k, user) -= userUpdate(k);
          #pragma omp atomic
          iterate(k, item) -= itemUpdate(k);
        }
      }
    }
  }

  mlpack::Log::Info << "\nParallel SGD terminated with objective: "
      << overallObjective << std::endl;

  return overallObjective;
}
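
// A hedged usage sketch for this specialization.  The constructor parameters
// for ens::ParallelSGD and ens::ExponentialBackoff follow ensmallen's
// documented interface, and the numeric values below are placeholders, not
// recommendations from this file:
//
//   mlpack::svd::RegularizedSVDFunction<arma::mat> rSVDFunc(data, rank,
//       lambda);
//   ens::ExponentialBackoff decay(/* epochInterval */ 100,
//       /* firstStepSize */ 0.01, /* backoff factor */ 1.05);
//   ens::ParallelSGD<ens::ExponentialBackoff> optimizer(
//       /* maxIterations */ 100000, /* threadShareSize */ 100,
//       /* tolerance */ 1e-5, /* shuffle */ true, decay);
//   arma::mat parameters = rSVDFunc.GetInitialPoint();
//   optimizer.Optimize(rSVDFunc, parameters);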

} // namespace ens

#endif