mlpack-git/doxygen/ann__test__tools_8hpp_source.html

 #ifndef MLPACK_TESTS_ANN_TEST_TOOLS_HPP
 #define MLPACK_TESTS_ANN_TEST_TOOLS_HPP

 #include <mlpack/core.hpp>

 using namespace mlpack;
 using namespace mlpack::ann;

 // Helper function which calls the Reset() member of the given module.
 //
 // This overload is enabled only when HasResetCheck<T, void(T::*)()>::value is
 // true.  The unnamed trailing pointer parameter exists solely to drive SFINAE
 // overload selection; callers are expected to leave it at its default.
 //
 // layer: the module whose Reset() member is invoked.
 template<class T>
 void ResetFunction(
     T& layer,
     typename std::enable_if<HasResetCheck<T, void(T::*)()>::value>::type* =
         nullptr)
 {
   layer.Reset();
 }

 // Fallback overload of ResetFunction(), enabled only when
 // HasResetCheck<T, void(T::*)()>::value is false.  It intentionally does
 // nothing, so ResetFunction() can be called on any module type.  The unnamed
 // trailing pointer parameter exists solely to drive SFINAE overload
 // selection.
 template<class T>
 void ResetFunction(
     T& /* layer */,
     typename std::enable_if<!HasResetCheck<T, void(T::*)()>::value>::type* =
         nullptr)
 {
   /* Nothing to do here */
 }

 // Approximate Jacobian and supposedly-true Jacobian, then compare them
 // similarly to before.
 template<typename ModuleType>
 double JacobianTest(ModuleType& module,
                   arma::mat& input,
                   const double minValue = -2,
                   const double maxValue = -1,
                   const double perturbation = 1e-6)
 {
   arma::mat output, outputA, outputB, jacobianA, jacobianB;

   // Initialize the input matrix.
   RandomInitialization init(minValue, maxValue);
   init.Initialize(input, input.n_rows, input.n_cols);

   // Initialize the module parameters.
   ResetFunction(module);

   // Initialize the jacobian matrix.
   module.Forward(std::move(input), std::move(output));
   jacobianA = arma::zeros(input.n_elem, output.n_elem);

   // Share the input paramter matrix.
   arma::mat sin = arma::mat(input.memptr(), input.n_rows, input.n_cols,
       false, false);

   for (size_t i = 0; i < input.n_elem; ++i)
   {
     double original = sin(i);
     sin(i) = original - perturbation;
     module.Forward(std::move(input), std::move(outputA));
     sin(i) = original + perturbation;
     module.Forward(std::move(input), std::move(outputB));
     sin(i) = original;

     outputB -= outputA;
     outputB /= 2 * perturbation;
     jacobianA.row(i) = outputB.t();
   }

   // Initialize the derivative parameter.
   arma::mat deriv = arma::zeros(output.n_rows, output.n_cols);

   // Share the derivative parameter.
   arma::mat derivTemp = arma::mat(deriv.memptr(), deriv.n_rows, deriv.n_cols,
       false, false);

   // Initialize the jacobian matrix.
   jacobianB = arma::zeros(input.n_elem, output.n_elem);

   for (size_t i = 0; i < derivTemp.n_elem; ++i)
   {
     deriv.zeros();
     derivTemp(i) = 1;

     arma::mat delta;
     module.Backward(std::move(input), std::move(deriv), std::move(delta));

     jacobianB.col(i) = delta;
   }

   return arma::max(arma::max(arma::abs(jacobianA - jacobianB)));
 }

 // Approximate Jacobian and supposedly-true Jacobian, then compare them
 // similarly to before.
 template<typename ModuleType>
 double JacobianPerformanceTest(ModuleType& module,
                                arma::mat& input,
                                arma::mat& target,
                                const double eps = 1e-6)
 {
   module.Forward(std::move(input), std::move(target));

   arma::mat delta;
   module.Backward(std::move(input), std::move(target), std::move(delta));

   arma::mat centralDifference = arma::zeros(delta.n_rows, delta.n_cols);
   arma::mat inputTemp = arma::mat(input.memptr(), input.n_rows, input.n_cols,
       false, false);

   arma::mat centralDifferenceTemp = arma::mat(centralDifference.memptr(),
       centralDifference.n_rows, centralDifference.n_cols, false, false);

   for (size_t i = 0; i < input.n_elem; ++i)
   {
     inputTemp(i) = inputTemp(i) + eps;
     double outputA = module.Forward(std::move(input), std::move(target));
     inputTemp(i) = inputTemp(i) - (2 * eps);
     double outputB = module.Forward(std::move(input), std::move(target));

     centralDifferenceTemp(i) = (outputA - outputB) / (2 * eps);
     inputTemp(i) = inputTemp(i) + eps;
   }

   return arma::max(arma::max(arma::abs(centralDifference - delta)));
 }

 // Numerical gradient check.
 //
 // The gradient reported by function.Gradient() is compared against a
 // central-difference estimate obtained by perturbing each entry of
 // function.Parameters() by +/- eps; the value returned by Gradient() is used
 // as the cost at the perturbed point.
 //
 // Returns norm(reported - estimated) / norm(reported + estimated).
 template<class FunctionType>
 double CheckGradient(FunctionType& function, const double eps = 1e-7)
 {
   // Gradient at the current, unperturbed parameters.
   arma::mat orgGradient;
   function.Gradient(orgGradient);

   arma::mat estGradient;
   estGradient.zeros(orgGradient.n_rows, orgGradient.n_cols);

   // Scratch gradient; only the cost returned alongside it is needed below.
   arma::mat gradient;

   const double step = 2 * eps;
   for (size_t i = 0; i < orgGradient.n_elem; ++i)
   {
     const double savedValue = function.Parameters()(i);

     // Cost with the parameter shifted upwards by eps.
     function.Parameters()(i) += eps;
     const double costAbove = function.Gradient(gradient);

     // Cost with the parameter shifted downwards by eps (relative to the
     // original value).
     function.Parameters()(i) -= step;
     const double costBelow = function.Gradient(gradient);

     // Put the original parameter value back.
     function.Parameters()(i) = savedValue;

     estGradient(i) = (costAbove - costBelow) / step;
   }

   // Relative error between the reported and the estimated gradient.
   const double errorNorm = arma::norm(orgGradient - estGradient);
   const double scaleNorm = arma::norm(orgGradient + estGradient);
   return errorNorm / scaleNorm;
 }

 // Numerical gradient check for regularizers.
 //
 // A random 10 x 10 weight matrix is generated, function.Gradient() is asked
 // for the gradient at that point, and the result is compared against a
 // central-difference estimate built from function.Output(weight, i, j) with
 // each weight perturbed by +/- eps.
 //
 // Returns norm(reported - estimated) / norm(reported + estimated).
 template<class FunctionType>
 double CheckRegularizerGradient(FunctionType& function, const double eps = 1e-7)
 {
   // Random weights, and a 100 x 1 column receiving the reported gradient.
   arma::mat weight = arma::randu(10, 10);
   arma::mat orgGradient = arma::zeros(10 * 10, 1);
   function.Gradient(weight, orgGradient);

   arma::mat estGradient;
   estGradient.zeros(weight.n_rows, weight.n_cols);

   const double step = 2 * eps;
   for (size_t row = 0; row < weight.n_rows; ++row)
   {
     for (size_t col = 0; col < weight.n_cols; ++col)
     {
       const double savedWeight = weight(row, col);

       weight(row, col) += eps;
       const double costAbove = function.Output(weight, row, col);

       weight(row, col) -= step;
       const double costBelow = function.Output(weight, row, col);

       // Put the original weight back before estimating the slope.
       weight(row, col) = savedWeight;
       estGradient(row, col) = (costAbove - costBelow) / step;
     }
   }

   // Flatten the estimate into a single column so it lines up with the
   // reported gradient.
   estGradient = arma::vectorise(estGradient);

   // Relative error between the reported and the estimated gradient.
   const double errorNorm = arma::norm(orgGradient - estGradient);
   const double scaleNorm = arma::norm(orgGradient + estGradient);
   return errorNorm / scaleNorm;
 }

 #endif
mlpack::ann
Artificial Neural Network.
Definition: gelu_function.hpp:19

mlpack
strip_type.hpp
Definition: add_to_po.hpp:21

CheckGradient
double CheckGradient(FunctionType &function, const double eps=1e-7)
Definition: ann_test_tools.hpp:137

mlpack::ann::RandomInitialization
This class is used to randomly initialize the weight matrix.
Definition: random_init.hpp:24

ResetFunction
void ResetFunction(T &layer, typename std::enable_if< HasResetCheck< T, void(T::*)()>::value >::type *=0)
Definition: ann_test_tools.hpp:22

mlpack::ann::RandomInitialization::Initialize
void Initialize(arma::Mat< eT > &W, const size_t rows, const size_t cols)
Randomly initialize the elements of the specified weight matrix.
Definition: random_init.hpp:56

JacobianPerformanceTest
double JacobianPerformanceTest(ModuleType &module, arma::mat &input, arma::mat &target, const double eps=1e-6)
Definition: ann_test_tools.hpp:104

JacobianTest
double JacobianTest(ModuleType &module, arma::mat &input, const double minValue=-2, const double maxValue=-1, const double perturbation=1e-6)
Definition: ann_test_tools.hpp:40

core.hpp
Include all of the base components required to write mlpack methods, and the main mlpack Doxygen documentation.

CheckRegularizerGradient
double CheckRegularizerGradient(FunctionType &function, const double eps=1e-7)
Definition: ann_test_tools.hpp:172