PCA.h
//===========================================================================
/*!
 *
 * \brief      Principal Component Analysis
 *
 * \author     T. Glasmachers, C. Igel
 * \date       2010, 2011
 *
 *
 * \par Copyright 1995-2017 Shark Development Team
 *
 * <BR><HR>
 * This file is part of Shark.
 * <https://shark-ml.github.io/Shark/>
 *
 * Shark is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published
 * by the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * Shark is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with Shark. If not, see <http://www.gnu.org/licenses/>.
 *
 */
//===========================================================================


#ifndef SHARK_ALGORITHMS_TRAINER_PCA_H
#define SHARK_ALGORITHMS_TRAINER_PCA_H

#include <shark/Core/DLLSupport.h>
#include <shark/Models/LinearModel.h>
#include <shark/Algorithms/Trainers/AbstractTrainer.h>

namespace shark{

/// \brief Principal Component Analysis
///
/// Principal Component Analysis (PCA), also known as the
/// Karhunen-Loeve transformation, takes a symmetric
/// \f$ n \times n \f$ matrix \f$ A \f$ and uses its decomposition
///
/// \f$
/// A = \Gamma \Lambda \Gamma^T,
/// \f$
///
/// where \f$ \Lambda \f$ is the diagonal matrix of eigenvalues
/// of \f$ A \f$ and \f$ \Gamma \f$ is the orthogonal matrix
/// with the corresponding eigenvectors as columns.
/// \f$ \Gamma \f$ then defines a successive orthogonal rotation
/// that maximizes the variances of the coordinates, i.e., the
/// coordinate system is rotated in such a way that the correlation
/// between the new axes becomes zero. If there are \f$ p \f$ axes,
/// the first axis is chosen such that the points projected onto it
/// have maximum variance. The remaining \f$ p - 1 \f$ axes are then
/// rotated such that the next axis covers the largest part of the
/// variance not already covered by the first axis. After \f$ p - 1 \f$
/// axes have been fixed in this way, the direction of the last axis
/// \f$ p \f$ is determined. A typical application of PCA is
/// dimensionality reduction, achieved by dropping the components with
/// the smallest eigenvalues (variances). Furthermore, each component
/// may be rescaled to unit variance, resulting in a whitening of the data.
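///
/// In terms of this decomposition, the encoder produced by this trainer
/// maps an input \f$ x \f$ to
///
/// \f$
/// y = \Gamma_m^T (x - \bar x),
/// \f$
///
/// where \f$ \bar x \f$ is the data mean and \f$ \Gamma_m \f$ holds the
/// first \f$ m \f$ eigenvectors; with whitening enabled the code is
/// additionally scaled to \f$ y = \Lambda_m^{-1/2} \Gamma_m^T (x - \bar x) \f$,
/// so that every component of \f$ y \f$ has unit variance.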
/// \ingroup unsupervised_trainer
class PCA : public AbstractUnsupervisedTrainer<LinearModel<> >
{
public:
    /// Algorithm used to build the covariance matrix (see m_algorithm).
    enum PCAAlgorithm { STANDARD, SMALL_SAMPLE, AUTO };

    /// Constructor.
    /// The parameter defines whether the model should also
    /// whiten the data.
    PCA(bool whitening = false)
    : m_whitening(whitening){
        m_algorithm = AUTO;
    }

    /// Constructor.
    /// The parameter defines whether the model should also
    /// whiten the data.
    /// The eigendecomposition of the data is stored in the PCA object.
    PCA(UnlabeledData<RealVector> const& inputs, bool whitening = false)
    : m_whitening(whitening){
        m_algorithm = AUTO;
        setData(inputs);
    }

    /// \brief From INameable: return the class name.
    std::string name() const
    { return "PCA"; }

    /// If set to true, the encoded data has unit variance along
    /// the new coordinates.
    void setWhitening(bool whitening) {
        m_whitening = whitening;
    }

    /// Train the model to perform PCA. The model must be a
    /// LinearModel object with offset, and its output dimension
    /// defines the number of principal components
    /// represented. The model returned is the one given by the
    /// encoder() function (i.e., mapping from the original input
    /// space to the PCA coordinate system).
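    ///
    /// A minimal usage sketch (\c data stands for some
    /// UnlabeledData<RealVector> filled elsewhere; the LinearModel
    /// constructor taking input dimension, output dimension, and an
    /// offset flag is assumed here):
    /// \code
    /// PCA pca(true);                                    // PCA with whitening
    /// LinearModel<> enc(dataDimension(data), 3, true);  // request 3 principal components
    /// pca.train(enc, data);                             // computes the PCA and sets up enc
    /// Data<RealVector> encoded = enc(data);             // 3-dimensional, whitened codes
    /// \endcode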
    void train(LinearModel<>& model, UnlabeledData<RealVector> const& inputs) {
        std::size_t m = model.outputShape().numElements(); // reduced dimensionality
        setData(inputs);   // compute the principal components
        encoder(model, m); // define the model
    }


    //! Sets the input data and performs the PCA. This is a
    //! computationally costly operation. The eigendecomposition
    //! of the data is stored in the PCA object.
    SHARK_EXPORT_SYMBOL void setData(UnlabeledData<RealVector> const& inputs);

    //! Constructs (in \c model) a mapping from the original data to the
    //! m-dimensional PCA coordinate system.
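    //!
    //! For example (a sketch; \c data is an UnlabeledData<RealVector>
    //! placeholder):
    //! \code
    //! PCA pca(data);                      // eigendecomposition happens here
    //! LinearModel<> enc;
    //! pca.encoder(enc, 2);                // keep the two leading principal components
    //! Data<RealVector> low = enc(data);   // 2-dimensional codes
    //! \endcode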
    SHARK_EXPORT_SYMBOL void encoder(LinearModel<>& model, std::size_t m = 0);

    //! Constructs (in \c model) a mapping from the
    //! m-dimensional PCA coordinate system back to the
    //! n-dimensional original coordinate system.
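    //!
    //! For example, reconstructing (approximately) the original data from
    //! the two-dimensional codes of the sketch above:
    //! \code
    //! LinearModel<> dec;
    //! pca.decoder(dec, 2);
    //! Data<RealVector> reconstructed = dec(low);
    //! \endcode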
    SHARK_EXPORT_SYMBOL void decoder(LinearModel<>& model, std::size_t m = 0);

    /// Eigenvalues of last training. The number of eigenvalues
    /// is equal to the minimum of the input dimensions (i.e.,
    /// number of attributes) and the number of data points used
    /// for training the PCA.
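    ///
    /// The eigenvalues are the variances along the principal directions,
    /// so, for instance, the fraction of the total variance captured by the
    /// first \c m components of a trained object \c pca can be estimated
    /// as follows (sketch):
    /// \code
    /// double captured = 0.0;
    /// for(std::size_t i = 0; i != m; ++i) captured += pca.eigenvalue(i);
    /// double ratio = captured / sum(pca.eigenvalues());
    /// \endcode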
    RealVector const& eigenvalues() const {
        return m_eigenvalues;
    }

    /// Returns the i-th eigenvalue.
    double eigenvalue(std::size_t i) const {
        SIZE_CHECK( i < m_l );
        if( i < m_eigenvalues.size())
            return m_eigenvalues(i);
        return 0.;
    }

    //! Eigenvectors of last training. The number of eigenvectors
    //! is equal to the minimum of the input dimensions (i.e.,
    //! number of attributes) and the number of data points used
    //! for training the PCA.
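    //!
    //! Assuming the eigenvectors are stored as the columns of the returned
    //! matrix (matching \f$ \Gamma \f$ in the class description), the leading
    //! principal direction could be read off as:
    //! \code
    //! RealVector firstPC = column(pca.eigenvectors(), 0);
    //! \endcode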
    RealMatrix const& eigenvectors() const{
        return m_eigenvectors;
    }

    /// Mean of last training.
    RealVector const& mean() const{
        return m_mean;
    }

protected:
    bool m_whitening;          ///< normalize variance yes/no
    RealMatrix m_eigenvectors; ///< eigenvectors
    RealVector m_eigenvalues;  ///< eigenvalues
    RealVector m_mean;         ///< mean value

    std::size_t m_n;           ///< number of attributes
    std::size_t m_l;           ///< number of training data points

    PCAAlgorithm m_algorithm;  ///< whether to use the design matrix or its transpose for building the covariance matrix
};


} // namespace shark
#endif // SHARK_ALGORITHMS_TRAINER_PCA_H