/** * @file methods/amf/update_rules/nmf_mult_div.hpp * @author Mohan Rajendran * * Update rules for the Non-negative Matrix Factorization. * * mlpack is free software; you may redistribute it and/or modify it under the * terms of the 3-clause BSD license. You should have received a copy of the * 3-clause BSD license along with mlpack. If not, see * http://www.opensource.org/licenses/BSD-3-Clause for more information. */ #ifndef MLPACK_METHODS_LMF_UPDATE_RULES_NMF_MULT_DIV_HPP #define MLPACK_METHODS_LMF_UPDATE_RULES_NMF_MULT_DIV_HPP #include namespace mlpack { namespace amf { /** * This follows a method described in the paper 'Algorithms for Non-negative * * @code * @inproceedings{lee2001algorithms, * title={Algorithms for non-negative matrix factorization}, * author={Lee, D.D. and Seung, H.S.}, * booktitle={Advances in Neural Information Processing Systems 13 * (NIPS 2000)}, * pages={556--562}, * year={2001} * } * @endcode * * This is a multiplicative rule that ensures that the Kullback–Leibler * divergence * * \f[ * \sum_i \sum_j (V_{ij} \log\frac{V_{ij}}{(W H)_{ij}} - V_{ij} + (W H)_{ij}) * \f] * * is non-increasing between subsequent iterations. Both of the update rules * for W and H are defined in this file. * * This set of update rules is not meant to work with sparse matrices. Using * sparse matrices often causes NaNs in the output, so other choices of update * rules are better in that situation. */ class NMFMultiplicativeDivergenceUpdate { public: // Empty constructor required for the WUpdateRule template. NMFMultiplicativeDivergenceUpdate() { } /** * Initialize the factorization. These rules don't store any state, so the * input values are ignore. */ template void Initialize(const MatType& /* dataset */, const size_t /* rank */) { // Nothing to do. } /** * The update rule for the basis matrix W. The formula used is * * \f[ * W_{ia} \leftarrow W_{ia} \frac{\sum_{\mu} H_{a\mu} V_{i\mu} / (W H)_{i\mu}} * {\sum_{\nu} H_{a\nu}} * \f] * * The function takes in all the matrices and only changes the value of the W * matrix. * * @param V Input matrix to be factorized. * @param W Basis matrix to be updated. * @param H Encoding matrix. */ template inline static void WUpdate(const MatType& V, arma::mat& W, const arma::mat& H) { // Simple implementation left in the header file. arma::mat t1; arma::rowvec t2; t1 = W * H; for (size_t i = 0; i < W.n_rows; ++i) { for (size_t j = 0; j < W.n_cols; ++j) { // Writing this as a single expression does not work as of Armadillo // 3.920. This should be fixed in a future release, and then the code // below can be fixed. // t2 = H.row(j) % V.row(i) / t1.row(i); t2.set_size(H.n_cols); for (size_t k = 0; k < t2.n_elem; ++k) { t2(k) = H(j, k) * V(i, k) / t1(i, k); } W(i, j) = W(i, j) * sum(t2) / sum(H.row(j)); } } } /** * The update rule for the encoding matrix H. The formula used is * * \f[ * H_{a\mu} \leftarrow H_{a\mu} \frac{\sum_{i} W_{ia} V_{i\mu}/(WH)_{i\mu}} * {\sum_{k} H_{ka}} * \f] * * The function takes in all the matrices and only changes the value of the H * matrix. * * @param V Input matrix to be factorized. * @param W Basis matrix. * @param H Encoding matrix to updated. */ template inline static void HUpdate(const MatType& V, const arma::mat& W, arma::mat& H) { // Simple implementation left in the header file. arma::mat t1; arma::colvec t2; t1 = W * H; for (size_t i = 0; i < H.n_rows; ++i) { for (size_t j = 0; j < H.n_cols; ++j) { // Writing this as a single expression does not work as of Armadillo // 3.920. This should be fixed in a future release, and then the code // below can be fixed. // t2 = W.col(i) % V.col(j) / t1.col(j); t2.set_size(W.n_rows); for (size_t k = 0; k < t2.n_elem; ++k) { t2(k) = W(k, i) * V(k, j) / t1(k, j); } H(i, j) = H(i, j) * sum(t2) / sum(W.col(i)); } } } //! Serialize the object (in this case, there is nothing to serialize). template void serialize(Archive& /* ar */, const unsigned int /* version */) { } }; } // namespace amf } // namespace mlpack #endif