/** * @file methods/ann/layer/noisylinear_impl.hpp * @author Nishant Kumar * * Implementation of the NoisyLinear layer class. * * mlpack is free software; you may redistribute it and/or modify it under the * terms of the 3-clause BSD license. You should have received a copy of the * 3-clause BSD license along with mlpack. If not, see * http://www.opensource.org/licenses/BSD-3-Clause for more information. */ #ifndef MLPACK_METHODS_ANN_LAYER_NOISYLINEAR_IMPL_HPP #define MLPACK_METHODS_ANN_LAYER_NOISYLINEAR_IMPL_HPP // In case it hasn't yet been included. #include "noisylinear.hpp" namespace mlpack { namespace ann /** Artificial Neural Network. */ { template NoisyLinear::NoisyLinear() : inSize(0), outSize(0) { // Nothing to do here. } template NoisyLinear::NoisyLinear( const NoisyLinear& layer) : inSize(layer.inSize), outSize(layer.outSize), weights(layer.weights) { Reset(); } template NoisyLinear::NoisyLinear( const size_t inSize, const size_t outSize) : inSize(inSize), outSize(outSize) { weights.set_size((outSize * inSize + outSize) * 2, 1); weightEpsilon.set_size(outSize, inSize); biasEpsilon.set_size(outSize, 1); } template void NoisyLinear::Reset() { weightMu = arma::mat(weights.memptr(), outSize, inSize, false, false); biasMu = arma::mat(weights.memptr() + weightMu.n_elem, outSize, 1, false, false); weightSigma = arma::mat(weights.memptr() + weightMu.n_elem + biasMu.n_elem, outSize, inSize, false, false); biasSigma = arma::mat(weights.memptr() + weightMu.n_elem * 2 + biasMu.n_elem, outSize, 1, false, false); this->ResetNoise(); } template void NoisyLinear::ResetNoise() { arma::mat epsilonIn = arma::randn(inSize, 1); epsilonIn = arma::sign(epsilonIn) % arma::sqrt(arma::abs(epsilonIn)); arma::mat epsilonOut = arma::randn(outSize, 1); epsilonOut = arma::sign(epsilonOut) % arma::sqrt(arma::abs(epsilonOut)); weightEpsilon = epsilonOut * epsilonIn.t(); biasEpsilon = epsilonOut; } template void NoisyLinear::ResetParameters() { const double muRange = 1 / std::sqrt(inSize); weightMu.randu(); weightMu = muRange * (weightMu * 2 - 1); biasMu.randu(); biasMu = muRange * (biasMu * 2 - 1); weightSigma.fill(0.5 / std::sqrt(inSize)); biasSigma.fill(0.5 / std::sqrt(outSize)); } template template void NoisyLinear::Forward( const arma::Mat& input, arma::Mat& output) { weight = weightMu + weightSigma % weightEpsilon; bias = biasMu + biasSigma % biasEpsilon; output = weight * input; output.each_col() += bias; } template template void NoisyLinear::Backward( const arma::Mat& /* input */, const arma::Mat& gy, arma::Mat& g) { g = weight.t() * gy; } template template void NoisyLinear::Gradient( const arma::Mat& input, const arma::Mat& error, arma::Mat& gradient) { // Locally stored to prevent multiplication twice. arma::mat weightGrad = error * input.t(); // Gradients for mu values. gradient.rows(0, weight.n_elem - 1) = arma::vectorise(weightGrad); gradient.rows(weight.n_elem, weight.n_elem + bias.n_elem - 1) = arma::sum(error, 1); // Gradients for sigma values. gradient.rows(weight.n_elem + bias.n_elem, gradient.n_elem - bias.n_elem - 1) = arma::vectorise(weightGrad % weightEpsilon); gradient.rows(gradient.n_elem - bias.n_elem, gradient.n_elem - 1) = arma::sum(error, 1) % biasEpsilon; } template template void NoisyLinear::serialize( Archive& ar, const unsigned int /* version */) { ar & BOOST_SERIALIZATION_NVP(inSize); ar & BOOST_SERIALIZATION_NVP(outSize); // This is inefficient, but we have to allocate this memory so that // WeightSetVisitor gets the right size. if (Archive::is_loading::value) weights.set_size((outSize * inSize + outSize) * 2, 1); } } // namespace ann } // namespace mlpack #endif