/** * @file methods/ann/layer/max_pooling.hpp * @author Marcus Edel * @author Nilay Jain * * Definition of the MaxPooling class. * * mlpack is free software; you may redistribute it and/or modify it under the * terms of the 3-clause BSD license. You should have received a copy of the * 3-clause BSD license along with mlpack. If not, see * http://www.opensource.org/licenses/BSD-3-Clause for more information. */ #ifndef MLPACK_METHODS_ANN_LAYER_MAX_POOLING_HPP #define MLPACK_METHODS_ANN_LAYER_MAX_POOLING_HPP #include namespace mlpack { namespace ann /** Artificial Neural Network. */ { /* * The max pooling rule for convolution neural networks. Take the maximum value * within the receptive block. */ class MaxPoolingRule { public: /* * Return the maximum value within the receptive block. * * @param input Input used to perform the pooling operation. */ template size_t Pooling(const MatType& input) { return arma::as_scalar(arma::find(input.max() == input, 1)); } }; /** * Implementation of the MaxPooling layer. * * @tparam InputDataType Type of the input data (arma::colvec, arma::mat, * arma::sp_mat or arma::cube). * @tparam OutputDataType Type of the output data (arma::colvec, arma::mat, * arma::sp_mat or arma::cube). */ template < typename InputDataType = arma::mat, typename OutputDataType = arma::mat > class MaxPooling { public: //! Create the MaxPooling object. MaxPooling(); /** * Create the MaxPooling object using the specified number of units. * * @param kernelWidth Width of the pooling window. * @param kernelHeight Height of the pooling window. * @param strideWidth Width of the stride operation. * @param strideHeight Width of the stride operation. * @param floor Rounding operator (floor or ceil). */ MaxPooling(const size_t kernelWidth, const size_t kernelHeight, const size_t strideWidth = 1, const size_t strideHeight = 1, const bool floor = true); /** * Ordinary feed forward pass of a neural network, evaluating the function * f(x) by propagating the activity forward through f. * * @param input Input data used for evaluating the specified function. * @param output Resulting output activation. */ template void Forward(const arma::Mat& input, arma::Mat& output); /** * Ordinary feed backward pass of a neural network, using 3rd-order tensors as * input, calculating the function f(x) by propagating x backwards through f. * Using the results from the feed forward pass. * * @param * (input) The propagated input activation. * @param gy The backpropagated error. * @param g The calculated gradient. */ template void Backward(const arma::Mat& /* input */, const arma::Mat& gy, arma::Mat& g); //! Get the output parameter. const OutputDataType& OutputParameter() const { return outputParameter; } //! Modify the output parameter. OutputDataType& OutputParameter() { return outputParameter; } //! Get the delta. const OutputDataType& Delta() const { return delta; } //! Modify the delta. OutputDataType& Delta() { return delta; } //! Get the input width. size_t InputWidth() const { return inputWidth; } //! Modify the input width. size_t& InputWidth() { return inputWidth; } //! Get the input height. size_t InputHeight() const { return inputHeight; } //! Modify the input height. size_t& InputHeight() { return inputHeight; } //! Get the output width. size_t OutputWidth() const { return outputWidth; } //! Modify the output width. size_t& OutputWidth() { return outputWidth; } //! Get the output height. size_t OutputHeight() const { return outputHeight; } //! Modify the output height. size_t& OutputHeight() { return outputHeight; } //! Get the input size. size_t InputSize() const { return inSize; } //! Get the output size. size_t OutputSize() const { return outSize; } //! Get the kernel width. size_t KernelWidth() const { return kernelWidth; } //! Modify the kernel width. size_t& KernelWidth() { return kernelWidth; } //! Get the kernel height. size_t KernelHeight() const { return kernelHeight; } //! Modify the kernel height. size_t& KernelHeight() { return kernelHeight; } //! Get the stride width. size_t StrideWidth() const { return strideWidth; } //! Modify the stride width. size_t& StrideWidth() { return strideWidth; } //! Get the stride height. size_t StrideHeight() const { return strideHeight; } //! Modify the stride height. size_t& StrideHeight() { return strideHeight; } //! Get the value of the rounding operation. bool Floor() const { return floor; } //! Modify the value of the rounding operation. bool& Floor() { return floor; } //! Get the value of the deterministic parameter. bool Deterministic() const { return deterministic; } //! Modify the value of the deterministic parameter. bool& Deterministic() { return deterministic; } /** * Serialize the layer. */ template void serialize(Archive& ar, const unsigned int /* version */); private: /** * Apply pooling to the input and store the results. * * @param input The input to be apply the pooling rule. * @param output The pooled result. * @param poolingIndices The pooled indices. */ template void PoolingOperation(const arma::Mat& input, arma::Mat& output, arma::Mat& poolingIndices) { for (size_t j = 0, colidx = 0; j < output.n_cols; ++j, colidx += strideHeight) { for (size_t i = 0, rowidx = 0; i < output.n_rows; ++i, rowidx += strideWidth) { arma::mat subInput = input( arma::span(rowidx, rowidx + kernelWidth - 1 - offset), arma::span(colidx, colidx + kernelHeight - 1 - offset)); const size_t idx = pooling.Pooling(subInput); output(i, j) = subInput(idx); if (!deterministic) { arma::Mat subIndices = indices(arma::span(rowidx, rowidx + kernelWidth - 1 - offset), arma::span(colidx, colidx + kernelHeight - 1 - offset)); poolingIndices(i, j) = subIndices(idx); } } } } /** * Apply unpooling to the input and store the results. * * @param error The backward error. * @param output The pooled result. * @param poolingIndices The pooled indices. */ template void Unpooling(const arma::Mat& error, arma::Mat& output, arma::Mat& poolingIndices) { for (size_t i = 0; i < poolingIndices.n_elem; ++i) { output(poolingIndices(i)) += error(i); } } //! Locally-stored width of the pooling window. size_t kernelWidth; //! Locally-stored height of the pooling window. size_t kernelHeight; //! Locally-stored width of the stride operation. size_t strideWidth; //! Locally-stored height of the stride operation. size_t strideHeight; //! Rounding operation used. bool floor; //! Locally-stored number of input channels. size_t inSize; //! Locally-stored number of output channels. size_t outSize; //! Locally-stored reset parameter used to initialize the module once. bool reset; //! Locally-stored input width. size_t inputWidth; //! Locally-stored input height. size_t inputHeight; //! Locally-stored output width. size_t outputWidth; //! Locally-stored output height. size_t outputHeight; //! If true use maximum a posteriori during the forward pass. bool deterministic; //! Locally-stored stored rounding offset. size_t offset; //! Locally-stored number of input units. size_t batchSize; //! Locally-stored output parameter. arma::cube outputTemp; //! Locally-stored transformed input parameter. arma::cube inputTemp; //! Locally-stored transformed output parameter. arma::cube gTemp; //! Locally-stored pooling strategy. MaxPoolingRule pooling; //! Locally-stored delta object. OutputDataType delta; //! Locally-stored gradient object. OutputDataType gradient; //! Locally-stored output parameter object. OutputDataType outputParameter; //! Locally-stored indices matrix parameter. arma::Mat indices; //! Locally-stored indices column parameter. arma::Col indicesCol; //! Locally-stored pooling indicies. std::vector poolingIndices; }; // class MaxPooling } // namespace ann } // namespace mlpack // Include implementation. #include "max_pooling_impl.hpp" #endif