13 #ifndef MLPACK_METHODS_ANN_BRNN_IMPL_HPP 14 #define MLPACK_METHODS_ANN_BRNN_IMPL_HPP 32 template<
typename OutputLayerType,
typename MergeLayerType,
33 typename MergeOutputType,
typename InitializationRuleType,
34 typename... CustomLayers>
35 BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
36 InitializationRuleType, CustomLayers...>
::BRNN(
39 OutputLayerType outputLayer,
40 MergeLayerType* mergeLayer,
41 MergeOutputType* mergeOutput,
42 InitializationRuleType initializeRule) :
44 outputLayer(
std::move(outputLayer)),
45 mergeLayer(mergeLayer),
46 mergeOutput(mergeOutput),
47 initializeRule(
std::move(initializeRule)),
55 forwardRNN(rho, single, outputLayer, initializeRule),
56 backwardRNN(rho, single, outputLayer, initializeRule)
61 template<
typename OutputLayerType,
typename MergeLayerType,
62 typename MergeOutputType,
typename InitializationRuleType,
63 typename... CustomLayers>
64 BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
65 InitializationRuleType, CustomLayers...>::~BRNN()
70 forwardRNN.network.pop_back();
71 backwardRNN.network.pop_back();
78 template<
typename OutputLayerType,
typename MergeLayerType,
79 typename MergeOutputType,
typename InitializationRuleType,
80 typename... CustomLayers>
81 template<
typename OptimizerType>
82 typename std::enable_if<
83 HasMaxIterations<OptimizerType, size_t&(OptimizerType::*)()>
85 BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
87 (OptimizerType& optimizer,
size_t samples)
const 89 if (optimizer.MaxIterations() < samples &&
90 optimizer.MaxIterations() != 0)
92 Log::Warn <<
"The optimizer's maximum number of iterations " 93 <<
"is less than the size of the dataset; the " 94 <<
"optimizer will not pass over the entire " 95 <<
"dataset. To fix this, modify the maximum " 96 <<
"number of iterations to be at least equal " 97 <<
"to the number of points of your dataset " 98 <<
"(" << samples <<
")." << std::endl;
102 template<
typename OutputLayerType,
typename MergeLayerType,
103 typename MergeOutputType,
typename InitializationRuleType,
104 typename... CustomLayers>
105 template<
typename OptimizerType>
106 typename std::enable_if<
107 !HasMaxIterations<OptimizerType, size_t&(OptimizerType::*)()>
109 BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
111 (OptimizerType& ,
size_t )
const 116 template<
typename OutputLayerType,
typename MergeLayerType,
117 typename MergeOutputType,
typename InitializationRuleType,
118 typename... CustomLayers>
119 template<
typename OptimizerType>
120 double BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
121 InitializationRuleType, CustomLayers...>
::Train(
122 arma::cube predictors,
123 arma::cube responses,
124 OptimizerType& optimizer)
126 numFunctions = responses.n_cols;
128 this->predictors = std::move(predictors);
129 this->responses = std::move(responses);
131 this->deterministic =
true;
132 ResetDeterministic();
139 WarnMessageMaxIterations<OptimizerType>(optimizer, this->predictors.n_cols);
143 const double out = optimizer.Optimize(*
this, parameter);
146 Log::Info <<
"BRNN::BRNN(): final objective of trained model is " << out
151 template<
typename OutputLayerType,
typename MergeLayerType,
152 typename MergeOutputType,
typename InitializationRuleType,
153 typename... CustomLayers>
154 template<
typename OptimizerType>
155 double BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
156 InitializationRuleType, CustomLayers...>
::Train(
157 arma::cube predictors,
158 arma::cube responses)
160 numFunctions = responses.n_cols;
162 this->predictors = std::move(predictors);
163 this->responses = std::move(responses);
165 this->deterministic =
true;
166 ResetDeterministic();
173 OptimizerType optimizer;
175 WarnMessageMaxIterations<OptimizerType>(optimizer, this->predictors.n_cols);
178 const double out = optimizer.Optimize(*
this, parameter);
180 Log::Info <<
"BRNN::BRNN(): final objective of trained model is " << out
185 template<
typename OutputLayerType,
typename MergeLayerType,
186 typename MergeOutputType,
typename InitializationRuleType,
187 typename... CustomLayers>
188 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
190 arma::cube predictors, arma::cube& results,
const size_t batchSize)
192 forwardRNN.rho = backwardRNN.rho = rho;
194 forwardRNN.ResetCells();
195 backwardRNN.ResetCells();
199 deterministic =
true;
200 ResetDeterministic();
202 if (parameter.is_empty())
207 if (std::is_same<MergeLayerType,
Concat<>>::value)
209 results = arma::zeros<arma::cube>(outputSize * 2, predictors.n_cols, rho);
213 results = arma::zeros<arma::cube>(outputSize, predictors.n_cols, rho);
216 std::vector<arma::mat> results1, results2;
220 for (
size_t begin = 0; begin < predictors.n_cols; begin += batchSize)
222 const size_t effectiveBatchSize = std::min(batchSize,
223 size_t(predictors.n_cols - begin));
224 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
226 forwardRNN.Forward(arma::mat(
227 predictors.slice(seqNum).colptr(begin),
228 predictors.n_rows, effectiveBatchSize,
false,
true));
229 backwardRNN.Forward(std::move(arma::mat(
230 predictors.slice(rho - seqNum - 1).colptr(begin),
231 predictors.n_rows, effectiveBatchSize,
false,
true)));
234 forwardRNN.network.back());
236 backwardRNN.network.back());
238 reverse(results1.begin(), results1.end());
241 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
244 forwardRNN.network.back());
246 backwardRNN.network.back());
249 boost::apply_visitor(outputParameterVisitor, mergeLayer)),
252 boost::apply_visitor(outputParameterVisitor, mergeLayer),
253 boost::apply_visitor(outputParameterVisitor, mergeOutput)),
255 results.slice(seqNum).submat(0, begin, results.n_rows - 1, begin +
256 effectiveBatchSize - 1) =
257 boost::apply_visitor(outputParameterVisitor, mergeOutput);
262 template<
typename OutputLayerType,
typename MergeLayerType,
263 typename MergeOutputType,
typename InitializationRuleType,
264 typename... CustomLayers>
265 double BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
269 const size_t batchSize,
270 const bool deterministic)
272 forwardRNN.rho = backwardRNN.rho = rho;
273 if (parameter.is_empty())
278 if (deterministic != this->deterministic)
280 this->deterministic = deterministic;
281 ResetDeterministic();
286 inputSize = predictors.n_rows;
287 targetSize = responses.n_rows;
289 else if (targetSize == 0)
291 targetSize = responses.n_rows;
294 forwardRNN.ResetCells();
295 backwardRNN.ResetCells();
297 double performance = 0;
298 size_t responseSeq = 0;
300 std::vector<arma::mat> results1, results2;
301 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
303 forwardRNN.Forward(arma::mat(
304 predictors.slice(seqNum).colptr(begin),
305 predictors.n_rows, batchSize,
false,
true));
306 backwardRNN.Forward(arma::mat(
307 predictors.slice(rho - seqNum - 1).colptr(begin),
308 predictors.n_rows, batchSize,
false,
true));
311 forwardRNN.network.back());
313 backwardRNN.network.back());
317 outputSize = boost::apply_visitor(outputParameterVisitor,
318 forwardRNN.network.back()).n_elem / batchSize;
319 forwardRNN.outputSize = backwardRNN.outputSize = outputSize;
321 reverse(results1.begin(), results1.end());
325 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
329 responseSeq = seqNum;
332 forwardRNN.network.back());
334 backwardRNN.network.back());
337 boost::apply_visitor(outputParameterVisitor, mergeLayer)),
340 boost::apply_visitor(outputParameterVisitor, mergeLayer),
341 boost::apply_visitor(outputParameterVisitor, mergeOutput)),
343 performance += outputLayer.Forward(
344 boost::apply_visitor(outputParameterVisitor, mergeOutput),
345 arma::mat(responses.slice(responseSeq).colptr(begin),
346 responses.n_rows, batchSize,
false,
true));
351 template<
typename OutputLayerType,
typename MergeLayerType,
352 typename MergeOutputType,
typename InitializationRuleType,
353 typename... CustomLayers>
354 double BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
356 const arma::mat& parameters,
358 const size_t batchSize)
360 return Evaluate(parameters, begin, batchSize,
true);
363 template<
typename OutputLayerType,
typename MergeLayerType,
364 typename MergeOutputType,
typename InitializationRuleType,
365 typename... CustomLayers>
366 template<
typename GradType>
367 double BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
368 InitializationRuleType, CustomLayers...>
:: 372 const size_t batchSize)
374 forwardRNN.rho = backwardRNN.rho = rho;
375 if (gradient.is_empty())
377 if (parameter.is_empty())
381 gradient = arma::zeros<arma::mat>(parameter.n_rows, parameter.n_cols);
388 if (backwardGradient.is_empty())
390 backwardGradient = arma::zeros<arma::mat>(
393 forwardGradient = arma::zeros<arma::mat>(
397 if (this->deterministic)
399 this->deterministic =
false;
400 ResetDeterministic();
405 inputSize = predictors.n_rows;
406 targetSize = responses.n_rows;
408 else if (targetSize == 0)
410 targetSize = responses.n_rows;
413 forwardRNN.ResetCells();
414 backwardRNN.ResetCells();
415 size_t networkSize = backwardRNN.network.size();
418 std::vector<arma::mat> results1, results2;
419 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
421 forwardRNN.Forward(arma::mat(
422 predictors.slice(seqNum).colptr(begin),
423 predictors.n_rows, batchSize,
false,
true));
424 backwardRNN.Forward(arma::mat(
425 predictors.slice(rho - seqNum - 1).colptr(begin),
426 predictors.n_rows, batchSize,
false,
true));
428 for (
size_t l = 0; l < networkSize; ++l)
431 forwardRNNOutputParameter), forwardRNN.network[l]);
433 backwardRNNOutputParameter), backwardRNN.network[l]);
436 forwardRNN.network.back());
438 backwardRNN.network.back());
442 outputSize = boost::apply_visitor(outputParameterVisitor,
443 forwardRNN.network.back()).n_elem / batchSize;
444 forwardRNN.outputSize = backwardRNN.outputSize = outputSize;
448 if (std::is_same<MergeLayerType,
Concat<>>::value)
450 results = arma::zeros<arma::cube>(outputSize * 2, batchSize, rho);
454 results = arma::zeros<arma::cube>(outputSize, batchSize, rho);
457 double performance = 0;
458 size_t responseSeq = 0;
461 reverse(results1.begin(), results1.end());
463 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
467 responseSeq = seqNum;
470 results1), forwardRNN.network.back());
472 results2), backwardRNN.network.back());
474 boost::apply_visitor(outputParameterVisitor, mergeLayer)),
477 boost::apply_visitor(outputParameterVisitor, mergeLayer),
478 results.slice(seqNum)), mergeOutput);
479 performance += outputLayer.Forward(results.slice(seqNum),
480 arma::mat(responses.slice(responseSeq).colptr(begin),
481 responses.n_rows, batchSize,
false,
true));
486 std::vector<arma::mat> allDelta;
488 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
490 if (single && seqNum > 0)
494 else if (single && seqNum == 0)
496 outputLayer.Backward(results.slice(seqNum),
497 arma::mat(responses.slice(0).colptr(begin),
498 responses.n_rows, batchSize,
false,
true), error);
502 outputLayer.Backward(results.slice(seqNum),
503 arma::mat(responses.slice(seqNum).colptr(begin),
504 responses.n_rows, batchSize,
false,
true), error);
507 boost::apply_visitor(
BackwardVisitor(results.slice(seqNum), error, delta),
509 allDelta.push_back(arma::mat(delta));
513 totalGradient = arma::mat(gradient.memptr(),
514 parameter.n_elem / 2, 1,
false,
false);
516 forwardGradient.zeros();
517 forwardRNN.ResetGradients(forwardGradient);
518 backwardGradient.zeros();
519 backwardRNN.ResetGradients(backwardGradient);
521 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
523 forwardGradient.zeros();
524 for (
size_t l = 0; l < networkSize; ++l)
527 forwardRNNOutputParameter),
528 forwardRNN.network[networkSize - 1 - l]);
531 outputParameterVisitor, forwardRNN.network.back()),
532 allDelta[rho - seqNum - 1], delta, 0),
535 for (
size_t i = 2; i < networkSize; ++i)
538 boost::apply_visitor(outputParameterVisitor,
539 forwardRNN.network[networkSize - i]),
540 boost::apply_visitor(deltaVisitor,
541 forwardRNN.network[networkSize - i + 1]),
542 boost::apply_visitor(deltaVisitor,
543 forwardRNN.network[networkSize - i])),
544 forwardRNN.network[networkSize - i]);
547 arma::mat(predictors.slice(rho - seqNum - 1).colptr(begin),
548 predictors.n_rows, batchSize,
false,
true));
550 boost::apply_visitor(outputParameterVisitor,
551 forwardRNN.network[networkSize - 2]),
552 allDelta[rho - seqNum - 1], 0), mergeLayer);
553 totalGradient += forwardGradient;
557 totalGradient = arma::mat(gradient.memptr() + parameter.n_elem/2,
558 parameter.n_elem/2, 1,
false,
false);
560 for (
size_t seqNum = 0; seqNum < rho; ++seqNum)
562 backwardGradient.zeros();
563 for (
size_t l = 0; l < networkSize; ++l)
566 backwardRNNOutputParameter),
567 backwardRNN.network[networkSize - 1 - l]);
570 boost::apply_visitor(outputParameterVisitor,
571 backwardRNN.network.back()),
572 allDelta[seqNum], delta, 1), mergeLayer);
573 for (
size_t i = 2; i < networkSize; ++i)
576 boost::apply_visitor(outputParameterVisitor,
577 backwardRNN.network[networkSize - i]), boost::apply_visitor(
578 deltaVisitor, backwardRNN.network[networkSize - i + 1]),
579 boost::apply_visitor(deltaVisitor,
580 backwardRNN.network[networkSize - i])),
581 backwardRNN.network[networkSize - i]);
585 arma::mat(predictors.slice(seqNum).colptr(begin),
586 predictors.n_rows, batchSize,
false,
true));
588 std::move(boost::apply_visitor(outputParameterVisitor,
589 backwardRNN.network[networkSize - 2])),
590 allDelta[seqNum], 1), mergeLayer);
591 totalGradient += backwardGradient;
596 template<
typename OutputLayerType,
typename MergeLayerType,
597 typename MergeOutputType,
typename InitializationRuleType,
598 typename... CustomLayers>
599 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
601 const arma::mat& parameters,
604 const size_t batchSize)
609 template<
typename OutputLayerType,
typename MergeLayerType,
610 typename MergeOutputType,
typename InitializationRuleType,
611 typename... CustomLayers>
612 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
615 arma::cube newPredictors, newResponses;
618 predictors = std::move(newPredictors);
619 responses = std::move(newResponses);
622 template<
typename OutputLayerType,
typename MergeLayerType,
623 typename MergeOutputType,
typename InitializationRuleType,
624 typename... CustomLayers>
625 template <
class LayerType,
class... Args>
626 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
627 InitializationRuleType, CustomLayers...>
::Add(Args... args)
629 forwardRNN.network.push_back(
new LayerType(args...));
630 backwardRNN.network.push_back(
new LayerType(args...));
633 template<
typename OutputLayerType,
typename MergeLayerType,
634 typename MergeOutputType,
typename InitializationRuleType,
635 typename... CustomLayers>
636 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
637 InitializationRuleType, CustomLayers...>
:: 638 Add(LayerTypes<CustomLayers...> layer)
640 forwardRNN.network.push_back(layer);
641 backwardRNN.network.push_back(boost::apply_visitor(copyVisitor, layer));
644 template<
typename OutputLayerType,
typename MergeLayerType,
645 typename MergeOutputType,
typename InitializationRuleType,
646 typename... CustomLayers>
647 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
655 forwardRNN.network.back()), mergeLayer);
657 backwardRNN.network.back()), mergeLayer);
661 ResetDeterministic();
665 CustomLayers...> networkInit(initializeRule);
666 size_t rnnWeights = 0;
667 for (
size_t i = 0; i < forwardRNN.network.size(); ++i)
669 rnnWeights += boost::apply_visitor(weightSizeVisitor,
670 forwardRNN.network[i]);
673 parameter.set_size(2 * rnnWeights, 1);
675 forwardRNN.
Parameters() = arma::mat(parameter.memptr(),
676 rnnWeights, 1,
false,
false);
677 backwardRNN.
Parameters() = arma::mat(parameter.memptr() + rnnWeights,
678 rnnWeights, 1,
false,
false);
681 networkInit.Initialize(forwardRNN.network, parameter);
684 networkInit.Initialize(backwardRNN.network, parameter, rnnWeights);
686 reset = forwardRNN.reset = backwardRNN.reset =
true;
689 template<
typename OutputLayerType,
typename MergeLayerType,
690 typename MergeOutputType,
typename InitializationRuleType,
691 typename... CustomLayers>
692 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
693 InitializationRuleType, CustomLayers...>
::Reset()
696 forwardRNN.ResetCells();
697 backwardRNN.ResetCells();
698 forwardGradient.zeros();
699 forwardRNN.ResetGradients(forwardGradient);
700 backwardGradient.zeros();
701 backwardRNN.ResetGradients(backwardGradient);
704 template<
typename OutputLayerType,
typename MergeLayerType,
705 typename MergeOutputType,
typename InitializationRuleType,
706 typename... CustomLayers>
707 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
708 InitializationRuleType, CustomLayers...>::ResetDeterministic()
710 forwardRNN.deterministic = this->deterministic;
711 backwardRNN.deterministic = this->deterministic;
712 forwardRNN.ResetDeterministic();
713 backwardRNN.ResetDeterministic();
716 template<
typename OutputLayerType,
typename MergeLayerType,
717 typename MergeOutputType,
typename InitializationRuleType,
718 typename... CustomLayers>
719 template<
typename Archive>
720 void BRNN<OutputLayerType, MergeLayerType, MergeOutputType,
722 Archive& ar,
const uint32_t version)
724 ar(CEREAL_NVP(parameter));
725 ar(CEREAL_NVP(backwardRNN));
726 ar(CEREAL_NVP(forwardRNN));
void serialize(Archive &ar, const uint32_t)
Serialize the model.
Definition: brnn_impl.hpp:721
DeleteVisitor executes the destructor of the instantiated object.
Definition: delete_visitor.hpp:27
static void Start(const std::string &name)
Start the given timer.
Definition: timers.cpp:28
Implementation of the Add module class.
Definition: add.hpp:34
std::enable_if< HasMaxIterations< OptimizerType, size_t &(OptimizerType::*)()>::value, void >::type WarnMessageMaxIterations(OptimizerType &optimizer, size_t samples) const
Check if the optimizer has a MaxIterations() parameter; if it does, then check if its value is less than the number of samples in the dataset.
Definition: brnn_impl.hpp:87
RunSetVisitor set the run parameter given the run value.
Definition: run_set_visitor.hpp:28
BackwardVisitor executes the Backward() function given the input, error and delta parameter...
Definition: backward_visitor.hpp:28
double Train(arma::cube predictors, arma::cube responses, OptimizerType &optimizer)
Train the bidirectional recurrent neural network on the given input data using the given optimizer...
Definition: brnn_impl.hpp:121
Linear algebra utility functions, generally performed on matrices or vectors.
Definition: cv.hpp:1
void Gradient(const arma::mat &parameters, const size_t begin, arma::mat &gradient, const size_t batchSize)
Evaluate the gradient of the recurrent neural network with the given parameters, and with respect to ...
Definition: rnn_impl.hpp:474
Definition: pointer_wrapper.hpp:23
SaveOutputParameterVisitor saves the output parameter into the given parameter set.
Definition: save_output_parameter_visitor.hpp:27
void Gradient(const arma::mat &parameters, const size_t begin, arma::mat &gradient, const size_t batchSize)
Evaluate the gradient of the bidirectional recurrent neural network with the given parameters...
Definition: brnn_impl.hpp:600
Implementation of the Concat class.
Definition: concat.hpp:43
void Reset()
Reset the state of the network.
Definition: brnn_impl.hpp:693
static MLPACK_EXPORT util::PrefixedOutStream Warn
Prints warning messages prefixed with [WARN ].
Definition: log.hpp:87
ForwardVisitor executes the Forward() function given the input and output parameter.
Definition: forward_visitor.hpp:28
void Shuffle()
Shuffle the order of function visitation.
Definition: brnn_impl.hpp:613
void ResetParameters()
Reset the module information (weights/parameters).
Definition: brnn_impl.hpp:648
AddVisitor exposes the Add() method of the given module.
Definition: add_visitor.hpp:28
Implementation of a standard bidirectional recurrent neural network container.
Definition: brnn.hpp:48
double Evaluate(const arma::mat &parameters, const size_t begin, const size_t batchSize, const bool deterministic)
Evaluate the bidirectional recurrent neural network with the given parameters.
Definition: brnn_impl.hpp:266
static void Stop(const std::string &name)
Stop the given timer.
Definition: timers.cpp:36
SearchModeVisitor executes the Gradient() method of the given module using the input and delta parame...
Definition: gradient_visitor.hpp:28
double EvaluateWithGradient(const arma::mat &parameters, const size_t begin, GradType &gradient, const size_t batchSize)
Evaluate the bidirectional recurrent neural network with the given parameters.
Definition: brnn_impl.hpp:369
void ShuffleData(const MatType &inputPoints, const LabelsType &inputLabels, MatType &outputPoints, LabelsType &outputLabels, const std::enable_if_t<!arma::is_SpMat< MatType >::value > *=0, const std::enable_if_t<!arma::is_Cube< MatType >::value > *=0)
Shuffle a dataset and associated labels (or responses).
Definition: shuffle_data.hpp:28
void Predict(arma::cube predictors, arma::cube &results, const size_t batchSize=256)
Predict the responses to a given set of predictors.
Definition: brnn_impl.hpp:189
static MLPACK_EXPORT util::PrefixedOutStream Info
Prints informational messages if --verbose is specified, prefixed with [INFO ].
Definition: log.hpp:84
LoadOutputParameterVisitor restores the output parameter using the given parameter set...
Definition: load_output_parameter_visitor.hpp:28
This class is used to initialize the network with the given initialization rule.
Definition: network_init.hpp:33
const arma::mat & Parameters() const
Return the initial point for the optimization.
Definition: rnn.hpp:297