/**
 * @file methods/ann/rnn_impl.hpp
 *
 * Definition of the RNN class, which implements recurrent neural networks.
 *
 * mlpack is free software; you may redistribute it and/or modify it under the
 * terms of the 3-clause BSD license.  You should have received a copy of the
 * 3-clause BSD license along with mlpack.  If not, see
 * http://www.opensource.org/licenses/BSD-3-Clause for more information.
 */
#ifndef MLPACK_METHODS_ANN_RNN_IMPL_HPP
#define MLPACK_METHODS_ANN_RNN_IMPL_HPP

// In case it hasn't been included yet.
#include "rnn.hpp"

// Visitor and utility headers used below (paths assume mlpack's source
// layout).
#include "visitor/load_output_parameter_visitor.hpp"
#include "visitor/save_output_parameter_visitor.hpp"
#include "visitor/forward_visitor.hpp"
#include "visitor/backward_visitor.hpp"
#include "visitor/deterministic_set_visitor.hpp"
#include "visitor/gradient_set_visitor.hpp"
#include "visitor/gradient_visitor.hpp"
#include "visitor/reset_cell_visitor.hpp"
#include "visitor/weight_set_visitor.hpp"

#include "util/check_input_shape.hpp"
namespace mlpack {
namespace ann {

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::RNN(
    const size_t rho,
    const bool single,
    OutputLayerType outputLayer,
    InitializationRuleType initializeRule) :
    rho(rho),
    outputLayer(std::move(outputLayer)),
    initializeRule(std::move(initializeRule)),
    inputSize(0),
    outputSize(0),
    targetSize(0),
    reset(false),
    single(single),
    numFunctions(0),
    deterministic(true)
{
  /* Nothing to do here */
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::RNN(
    const RNN& network) :
    rho(network.rho),
    outputLayer(network.outputLayer),
    initializeRule(network.initializeRule),
    inputSize(network.inputSize),
    outputSize(network.outputSize),
    targetSize(network.targetSize),
    reset(network.reset),
    single(network.single),
    parameter(network.parameter),
    numFunctions(network.numFunctions),
    deterministic(network.deterministic)
{
  // Deep-copy the layers so that this network owns its own modules.
  for (size_t i = 0; i < network.network.size(); ++i)
  {
    this->network.push_back(boost::apply_visitor(copyVisitor,
        network.network[i]));
    boost::apply_visitor(resetVisitor, this->network.back());
  }
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::RNN(
    RNN&& network) :
    rho(std::move(network.rho)),
    outputLayer(std::move(network.outputLayer)),
    initializeRule(std::move(network.initializeRule)),
    inputSize(std::move(network.inputSize)),
    outputSize(std::move(network.outputSize)),
    targetSize(std::move(network.targetSize)),
    reset(std::move(network.reset)),
    single(std::move(network.single)),
    network(std::move(network.network)),
    parameter(std::move(network.parameter)),
    numFunctions(std::move(network.numFunctions)),
    deterministic(std::move(network.deterministic))
{
  // Nothing to do here.
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::~RNN()
{
  // The network owns its layers; free each one.
  for (LayerTypes<CustomLayers...>& layer : network)
  {
    boost::apply_visitor(deleteVisitor, layer);
  }
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename OptimizerType>
typename std::enable_if<
    HasMaxIterations<OptimizerType, size_t&(OptimizerType::*)()>
    ::value, void>::type
RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::
WarnMessageMaxIterations(OptimizerType& optimizer, size_t samples) const
{
  if (optimizer.MaxIterations() < samples &&
      optimizer.MaxIterations() != 0)
  {
    Log::Warn << "The optimizer's maximum number of iterations is less than "
        << "the size of the dataset; the optimizer will not pass over the "
        << "entire dataset. To fix this, modify the maximum number of "
        << "iterations to be at least equal to the number of points of your "
        << "dataset (" << samples << ")." << std::endl;
  }
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename OptimizerType>
typename std::enable_if<
    !HasMaxIterations<OptimizerType, size_t&(OptimizerType::*)()>
    ::value, void>::type
RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::
WarnMessageMaxIterations(OptimizerType& /* optimizer */,
                         size_t /* samples */) const
{
  // Nothing to do: this optimizer has no MaxIterations() to check.
}
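
// The two overloads of WarnMessageMaxIterations() above use SFINAE to
// dispatch on whether OptimizerType exposes a MaxIterations() member:
// optimizers that have one are checked against the dataset size, and all
// others fall through to the no-op overload.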

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename OptimizerType, typename... CallbackTypes>
double RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Train(
    arma::cube predictors,
    arma::cube responses,
    OptimizerType& optimizer,
    CallbackTypes&&... callbacks)
{
  CheckInputShape<std::vector<LayerTypes<CustomLayers...> > >(
      network, predictors.n_rows, "RNN<>::Train()");

  numFunctions = responses.n_cols;

  this->predictors = std::move(predictors);
  this->responses = std::move(responses);

  this->deterministic = true;
  ResetDeterministic();

  if (!reset)
  {
    ResetParameters();
  }

  WarnMessageMaxIterations<OptimizerType>(optimizer, this->predictors.n_cols);

  // Train the model.
  Timer::Start("rnn_optimization");
  const double out = optimizer.Optimize(*this, parameter, callbacks...);
  Timer::Stop("rnn_optimization");

  Log::Info << "RNN::Train(): final objective of trained model is " << out
      << "." << std::endl;
  return out;
}
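
// A minimal training sketch (illustrative only: the layer choice, sizes, and
// Adam hyperparameters below are assumptions, not part of this file):
//
//   RNN<NegativeLogLikelihood<> > model(rho);
//   model.Add<LSTM<> >(inputSize, hiddenSize, rho);
//   model.Add<Linear<> >(hiddenSize, outputSize);
//   model.Add<LogSoftMax<> >();
//
//   // predictors/responses are cubes of shape
//   // (dimensionality x sequences x rho), i.e. one slice per time step.
//   ens::Adam opt(0.01, 32);
//   model.Train(predictors, responses, opt);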

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType,
         CustomLayers...>::ResetCells()
{
  for (size_t i = 1; i < network.size(); ++i)
  {
    boost::apply_visitor(ResetCellVisitor(rho), network[i]);
  }
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename OptimizerType, typename... CallbackTypes>
double RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Train(
    arma::cube predictors,
    arma::cube responses,
    CallbackTypes&&... callbacks)
{
  CheckInputShape<std::vector<LayerTypes<CustomLayers...> > >(
      network, predictors.n_rows, "RNN<>::Train()");

  numFunctions = responses.n_cols;

  this->predictors = std::move(predictors);
  this->responses = std::move(responses);

  this->deterministic = true;
  ResetDeterministic();

  if (!reset)
  {
    ResetParameters();
  }

  // This overload constructs a default optimizer of the given type.
  OptimizerType optimizer;

  WarnMessageMaxIterations<OptimizerType>(optimizer, this->predictors.n_cols);

  // Train the model.
  Timer::Start("rnn_optimization");
  const double out = optimizer.Optimize(*this, parameter, callbacks...);
  Timer::Stop("rnn_optimization");

  Log::Info << "RNN::Train(): final objective of trained model is " << out
      << "." << std::endl;
  return out;
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Predict(
    arma::cube predictors, arma::cube& results, const size_t batchSize)
{
  CheckInputShape<std::vector<LayerTypes<CustomLayers...> > >(
      network, predictors.n_rows, "RNN<>::Predict()");

  ResetCells();

  if (parameter.is_empty())
  {
    ResetParameters();
  }

  if (!deterministic)
  {
    deterministic = true;
    ResetDeterministic();
  }

  // Run the first time step of the first batch to determine the output size.
  const size_t effectiveBatchSize = std::min(batchSize,
      size_t(predictors.n_cols));

  Forward(arma::mat(predictors.slice(0).colptr(0), predictors.n_rows,
      effectiveBatchSize, false, true));
  arma::mat resultsTemp = boost::apply_visitor(outputParameterVisitor,
      network.back());

  outputSize = resultsTemp.n_rows;
  results = arma::zeros<arma::cube>(outputSize, predictors.n_cols, rho);
  results.slice(0).submat(0, 0, results.n_rows - 1,
      effectiveBatchSize - 1) = resultsTemp;

  // Process in accordance with the given batch size.
  for (size_t begin = 0; begin < predictors.n_cols; begin += batchSize)
  {
    const size_t effectiveBatchSize = std::min(batchSize,
        size_t(predictors.n_cols - begin));
    // The first batch already ran its first time step above, so start at
    // seqNum = !begin (1 for the first batch, 0 for all later batches).
    for (size_t seqNum = !begin; seqNum < rho; ++seqNum)
    {
      Forward(arma::mat(predictors.slice(seqNum).colptr(begin),
          predictors.n_rows, effectiveBatchSize, false, true));

      results.slice(seqNum).submat(0, begin, results.n_rows - 1, begin +
          effectiveBatchSize - 1) = boost::apply_visitor(
          outputParameterVisitor, network.back());
    }
  }
}
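
// Prediction sketch (hypothetical names; `model` is a trained RNN):
//
//   arma::cube testData(inputSize, numSequences, rho);
//   arma::cube output;
//   model.Predict(testData, output);
//   // output has shape (outputSize x numSequences x rho).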

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
double RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Evaluate(
    const arma::mat& /* parameters */,
    const size_t begin,
    const size_t batchSize,
    const bool deterministic)
{
  if (parameter.is_empty())
  {
    ResetParameters();
  }

  if (deterministic != this->deterministic)
  {
    this->deterministic = deterministic;
    ResetDeterministic();
  }

  // Set the input and target dimensions from the data on the first call.
  if (!inputSize)
  {
    inputSize = predictors.n_rows;
    targetSize = responses.n_rows;
  }
  else if (targetSize == 0)
  {
    targetSize = responses.n_rows;
  }

  ResetCells();

  double performance = 0;
  size_t responseSeq = 0;

  for (size_t seqNum = 0; seqNum < rho; ++seqNum)
  {
    // Wrap a matrix around our data to avoid a copy.
    arma::mat stepData(predictors.slice(seqNum).colptr(begin),
        predictors.n_rows, batchSize, false, true);
    Forward(stepData);
    if (!single)
    {
      responseSeq = seqNum;
    }

    performance += outputLayer.Forward(boost::apply_visitor(
        outputParameterVisitor, network.back()),
        arma::mat(responses.slice(responseSeq).colptr(begin),
        responses.n_rows, batchSize, false, true));
  }

  if (outputSize == 0)
  {
    outputSize = boost::apply_visitor(outputParameterVisitor,
        network.back()).n_elem / batchSize;
  }

  return performance;
}
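
// Together with the three-argument overload below, Evaluate() implements the
// separable-objective interface used by ensmallen's SGD-family optimizers:
// it returns the loss of the batchSize sequences starting at column `begin`,
// summed over the time steps of each sequence.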

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
double RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Evaluate(
    const arma::mat& parameters,
    const size_t begin,
    const size_t batchSize)
{
  // By default, evaluate deterministically.
  return Evaluate(parameters, begin, batchSize, true);
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename GradType>
double RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::
EvaluateWithGradient(const arma::mat& /* parameters */,
                     const size_t begin,
                     GradType& gradient,
                     const size_t batchSize)
{
  // Initialize passed gradient.
  if (gradient.is_empty())
  {
    if (parameter.is_empty())
    {
      ResetParameters();
    }

    gradient = arma::zeros<arma::mat>(parameter.n_rows, parameter.n_cols);
  }
  else
  {
    gradient.zeros();
  }

  if (this->deterministic)
  {
    this->deterministic = false;
    ResetDeterministic();
  }

  // Set the input and target dimensions from the data on the first call.
  if (!inputSize)
  {
    inputSize = predictors.n_rows;
    targetSize = responses.n_rows;
  }
  else if (targetSize == 0)
  {
    targetSize = responses.n_rows;
  }

  ResetCells();

  double performance = 0;
  size_t responseSeq = 0;
  // Don't unroll past the number of time steps the responses actually hold.
  const size_t effectiveRho = std::min(rho, size_t(responses.n_slices));

  // Forward pass: step through the sequence, saving every layer's output at
  // each step so the backward pass can restore the per-step state.
  for (size_t seqNum = 0; seqNum < effectiveRho; ++seqNum)
  {
    // Wrap a matrix around our data to avoid a copy.
    arma::mat stepData(predictors.slice(seqNum).colptr(begin),
        predictors.n_rows, batchSize, false, true);
    Forward(stepData);
    if (!single)
    {
      responseSeq = seqNum;
    }

    for (size_t l = 0; l < network.size(); ++l)
    {
      boost::apply_visitor(SaveOutputParameterVisitor(moduleOutputParameter),
          network[l]);
    }

    performance += outputLayer.Forward(boost::apply_visitor(
        outputParameterVisitor, network.back()),
        arma::mat(responses.slice(responseSeq).colptr(begin),
        responses.n_rows, batchSize, false, true));
  }

  if (outputSize == 0)
  {
    outputSize = boost::apply_visitor(outputParameterVisitor,
        network.back()).n_elem / batchSize;
  }

  // Initialize current/working gradient.
  if (currentGradient.is_empty())
  {
    currentGradient = arma::zeros<arma::mat>(parameter.n_rows,
        parameter.n_cols);
  }

  ResetGradients(currentGradient);

  // Backward pass: replay the time steps in reverse, restoring the saved
  // layer outputs, and accumulate the per-step gradients.
  for (size_t seqNum = 0; seqNum < effectiveRho; ++seqNum)
  {
    currentGradient.zeros();
    for (size_t l = 0; l < network.size(); ++l)
    {
      boost::apply_visitor(LoadOutputParameterVisitor(moduleOutputParameter),
          network[network.size() - 1 - l]);
    }

    if (single && seqNum > 0)
    {
      // In single-response mode only the last time step carries an error.
      error.zeros();
    }
    else if (single && seqNum == 0)
    {
      outputLayer.Backward(boost::apply_visitor(
          outputParameterVisitor, network.back()),
          arma::mat(responses.slice(0).colptr(begin),
          responses.n_rows, batchSize, false, true), error);
    }
    else
    {
      outputLayer.Backward(boost::apply_visitor(
          outputParameterVisitor, network.back()),
          arma::mat(responses.slice(effectiveRho - seqNum - 1).colptr(begin),
          responses.n_rows, batchSize, false, true), error);
    }

    Backward();
    Gradient(
        arma::mat(predictors.slice(effectiveRho - seqNum - 1).colptr(begin),
        predictors.n_rows, batchSize, false, true));
    gradient += currentGradient;
  }

  return performance;
}
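
// EvaluateWithGradient() above performs truncated backpropagation through
// time: gradients are accumulated over at most rho (effectiveRho) steps, so
// dependencies longer than the unroll horizon do not contribute to the
// update.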

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Gradient(
    const arma::mat& parameters,
    const size_t begin,
    arma::mat& gradient,
    const size_t batchSize)
{
  this->EvaluateWithGradient(parameters, begin, gradient, batchSize);
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Shuffle()
{
  arma::cube newPredictors, newResponses;
  math::ShuffleData(predictors, responses, newPredictors, newResponses);

  predictors = std::move(newPredictors);
  responses = std::move(newResponses);
}
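
// Shuffle() is invoked by ensmallen optimizers between passes over the data
// when shuffling is enabled; it permutes whole sequences (cube columns) so
// that predictors and responses stay aligned.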

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType,
         CustomLayers...>::ResetParameters()
{
  ResetDeterministic();

  // Reset the network parameter with the given initialization rule.
  NetworkInitialization<InitializationRuleType,
      CustomLayers...> networkInit(initializeRule);
  networkInit.Initialize(network, parameter);

  reset = true;
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Reset()
{
  ResetParameters();
  ResetCells();
  currentGradient.zeros();
  ResetGradients(currentGradient);
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType,
         CustomLayers...>::ResetDeterministic()
{
  DeterministicSetVisitor deterministicSetVisitor(deterministic);
  std::for_each(network.begin(), network.end(),
      boost::apply_visitor(deterministicSetVisitor));
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType,
         CustomLayers...>::ResetGradients(
    arma::mat& gradient)
{
  size_t offset = 0;
  for (LayerTypes<CustomLayers...>& layer : network)
  {
    offset += boost::apply_visitor(GradientSetVisitor(gradient, offset),
        layer);
  }
}
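
// After ResetGradients(), each layer's gradient object is an alias into a
// contiguous region of `gradient`, so per-layer gradient updates write
// directly into the shared matrix.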

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename InputType>
void RNN<OutputLayerType, InitializationRuleType,
         CustomLayers...>::Forward(const InputType& input)
{
  boost::apply_visitor(ForwardVisitor(input,
      boost::apply_visitor(outputParameterVisitor, network.front())),
      network.front());

  for (size_t i = 1; i < network.size(); ++i)
  {
    boost::apply_visitor(ForwardVisitor(
        boost::apply_visitor(outputParameterVisitor, network[i - 1]),
        boost::apply_visitor(outputParameterVisitor, network[i])),
        network[i]);
  }
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
void RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::Backward()
{
  boost::apply_visitor(BackwardVisitor(
      boost::apply_visitor(outputParameterVisitor, network.back()),
      error, boost::apply_visitor(deltaVisitor,
      network.back())), network.back());

  for (size_t i = 2; i < network.size(); ++i)
  {
    boost::apply_visitor(BackwardVisitor(
        boost::apply_visitor(outputParameterVisitor,
        network[network.size() - i]), boost::apply_visitor(
        deltaVisitor, network[network.size() - i + 1]),
        boost::apply_visitor(deltaVisitor, network[network.size() - i])),
        network[network.size() - i]);
  }
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename InputType>
void RNN<OutputLayerType, InitializationRuleType,
         CustomLayers...>::Gradient(const InputType& input)
{
  boost::apply_visitor(GradientVisitor(input,
      boost::apply_visitor(deltaVisitor, network[1])), network.front());

  for (size_t i = 1; i < network.size() - 1; ++i)
  {
    boost::apply_visitor(GradientVisitor(
        boost::apply_visitor(outputParameterVisitor, network[i - 1]),
        boost::apply_visitor(deltaVisitor, network[i + 1])),
        network[i]);
  }
}

template<typename OutputLayerType, typename InitializationRuleType,
         typename... CustomLayers>
template<typename Archive>
void RNN<OutputLayerType, InitializationRuleType, CustomLayers...>::serialize(
    Archive& ar, const uint32_t /* version */)
{
  ar(CEREAL_NVP(parameter));
  ar(CEREAL_NVP(rho));
  ar(CEREAL_NVP(single));
  ar(CEREAL_NVP(inputSize));
  ar(CEREAL_NVP(outputSize));
  ar(CEREAL_NVP(targetSize));
  ar(CEREAL_NVP(reset));

  // If we are loading, delete any existing layers before deserializing.
  if (cereal::is_loading<Archive>())
  {
    std::for_each(network.begin(), network.end(),
        boost::apply_visitor(deleteVisitor));
    network.clear();
  }

  ar(CEREAL_VECTOR_VARIANT_POINTER(network));

  // If we are loading, we need to initialize the weights.
  if (cereal::is_loading<Archive>())
  {
    size_t offset = 0;
    for (LayerTypes<CustomLayers...>& layer : network)
    {
      offset += boost::apply_visitor(WeightSetVisitor(parameter, offset),
          layer);

      boost::apply_visitor(resetVisitor, layer);
    }

    deterministic = true;
    ResetDeterministic();
  }
}
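
// Serialization sketch (a hedged example; `model`, `model2`, and "model.bin"
// are placeholders, and data::Save()/data::Load() drive serialize() above):
//
//   mlpack::data::Save("model.bin", "rnn", model);
//
//   RNN<NegativeLogLikelihood<> > model2(rho);
//   mlpack::data::Load("model.bin", "rnn", model2);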

} // namespace ann
} // namespace mlpack

#endif