KernelHelpers.h
Go to the documentation of this file.
1//===========================================================================
2/*!
3 *
4 *
5 * \brief Collection of functions dealing with typical tasks of kernels
6
7
8 *
9 *
10 * \author O. Krause
11 * \date 2007-2012
12 *
13 *
14 * \par Copyright 1995-2017 Shark Development Team
15 *
16 * <BR><HR>
17 * This file is part of Shark.
18 * <https://shark-ml.github.io/Shark/>
19 *
20 * Shark is free software: you can redistribute it and/or modify
21 * it under the terms of the GNU Lesser General Public License as published
22 * by the Free Software Foundation, either version 3 of the License, or
23 * (at your option) any later version.
24 *
25 * Shark is distributed in the hope that it will be useful,
26 * but WITHOUT ANY WARRANTY; without even the implied warranty of
27 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
28 * GNU Lesser General Public License for more details.
29 *
30 * You should have received a copy of the GNU Lesser General Public License
31 * along with Shark. If not, see <http://www.gnu.org/licenses/>.
32 *
33 */
34//===========================================================================
35
36#ifndef SHARK_MODELS_KERNELS_KERNELHELPERS_H
37#define SHARK_MODELS_KERNELS_KERNELHELPERS_H
38
40#include <shark/Data/Dataset.h>
41#include <shark/Core/OpenMP.h>
42namespace shark{
43
44/// \brief Calculates the regularized kernel gram matrix of the points stored inside a dataset.
45///
46/// Regularization is applied by adding the regularizer on the diagonal
47/// \param kernel the kernel for which to calculate the kernel gram matrix
48/// \param dataset the set of points used in the gram matrix
49/// \param matrix the target kernel matrix
50/// \param regularizer the regularizer of the matrix which is always >= 0. default is 0.
51/// \ingroup kernels
52template<class InputType, class M, class Device>
55 Data<InputType> const& dataset,
56 blas::matrix_expression<M, Device>& matrix,
57 double regularizer = 0
58){
59 SHARK_RUNTIME_CHECK(regularizer >= 0, "regularizer must be >=0");
60 std::size_t B = dataset.numberOfBatches();
61 //get start of all batches in the matrix
62 //also include the past the end position at the end
63 std::vector<std::size_t> batchStart(B+1,0);
64 for(std::size_t i = 1; i != B+1; ++i){
65 batchStart[i] = batchStart[i-1]+ batchSize(dataset.batch(i-1));
66 }
67 SIZE_CHECK(batchStart[B] == dataset.numberOfElements());
68 std::size_t N = batchStart[B];//number of elements
69 ensure_size(matrix,N,N);
70
71
72 for (std::size_t i=0; i<B; i++){
73 std::size_t startX = batchStart[i];
74 std::size_t endX = batchStart[i+1];
75 SHARK_PARALLEL_FOR(int j=0; j < (int)B; j++){
76 std::size_t startY = batchStart[j];
77 std::size_t endY = batchStart[j+1];
78 RealMatrix submatrix = kernel(dataset.batch(i), dataset.batch(j));
79 noalias(subrange(matrix(),startX,endX,startY,endY))=submatrix;
80 //~ if(i != j)
81 //~ noalias(subrange(matrix(),startY,endY,startX,endX))=trans(submatrix);
82 }
83 for(std::size_t k = startX; k != endX; ++k){
84 matrix()(k,k) += static_cast<typename M::value_type>(regularizer);
85 }
86 }
87}
88
89/// \brief Calculates the kernel gram matrix between two data sets.
90///
91/// \param kernel the kernel for which to calculate the kernel gram matrix
92/// \param dataset1 the set of points corresponding to rows of the Gram matrix
93/// \param dataset2 the set of points corresponding to columns of the Gram matrix
94/// \param matrix the target kernel matrix
95/// \ingroup kernels
96template<class InputType, class M, class Device>
99 Data<InputType> const& dataset1,
100 Data<InputType> const& dataset2,
101 blas::matrix_expression<M, Device>& matrix
102){
103 std::size_t B1 = dataset1.numberOfBatches();
104 std::size_t B2 = dataset2.numberOfBatches();
105 //get start of all batches in the matrix
106 //also include the past the end position at the end
107 std::vector<std::size_t> batchStart1(B1+1,0);
108 for(std::size_t i = 1; i != B1+1; ++i){
109 batchStart1[i] = batchStart1[i-1]+ batchSize(dataset1.batch(i-1));
110 }
111 std::vector<std::size_t> batchStart2(B2+1,0);
112 for(std::size_t i = 1; i != B2+1; ++i){
113 batchStart2[i] = batchStart2[i-1]+ batchSize(dataset2.batch(i-1));
114 }
115 SIZE_CHECK(batchStart1[B1] == dataset1.numberOfElements());
116 SIZE_CHECK(batchStart2[B2] == dataset2.numberOfElements());
117 std::size_t N1 = batchStart1[B1];//number of elements
118 std::size_t N2 = batchStart2[B2];//number of elements
119 ensure_size(matrix,N1,N2);
120
121 for (std::size_t i=0; i<B1; i++){
122 std::size_t startX = batchStart1[i];
123 std::size_t endX = batchStart1[i+1];
124 SHARK_PARALLEL_FOR(int j=0; j < (int)B2; j++){
125 std::size_t startY = batchStart2[j];
126 std::size_t endY = batchStart2[j+1];
127 RealMatrix submatrix = kernel(dataset1.batch(i), dataset2.batch(j));
128 noalias(subrange(matrix(),startX,endX,startY,endY))=submatrix;
129 //~ if(i != j)
130 //~ noalias(subrange(matrix(),startY,endY,startX,endX))=trans(submatrix);
131 }
132 }
133}
134
135/// \brief Calculates the regularized kernel gram matrix of the points stored inside a dataset.
136///
137/// Regularization is applied by adding the regularizer on the diagonal
138/// \param kernel the kernel for which to calculate the kernel gram matrix
139/// \param dataset the set of points used in the gram matrix
140/// \param regularizer the regularizer of the matrix which is always >= 0. default is 0.
141/// \return the kernel gram matrix
142/// \ingroup kernels
143template<class InputType>
146 Data<InputType> const& dataset,
147 double regularizer = 0
148){
149 SHARK_RUNTIME_CHECK(regularizer >= 0, "regularizer must be >=0");
150 RealMatrix M;
151 calculateRegularizedKernelMatrix(kernel,dataset,M,regularizer);
152 return M;
153}
154
155/// \brief Calculates the kernel gram matrix between two data sets.
156///
157/// \param kernel the kernel for which to calculate the kernel gram matrix
158/// \param dataset1 the set of points corresponding to rows of the Gram matrix
159/// \param dataset2 the set of points corresponding to columns of the Gram matrix
160/// \return the kernel gram matrix between the two datasets
161/// \ingroup kernels
162template<class InputType>
165 Data<InputType> const& dataset1,
166 Data<InputType> const& dataset2
167){
168 RealMatrix M;
169 calculateMixedKernelMatrix(kernel,dataset1,dataset2,M);
170 return M;
171}
172
173
174/// \brief Efficiently calculates the weighted derivative of a Kernel Gram Matrix w.r.t the Kernel Parameters
175///
176/// The formula is \f$ \sum_i \sum_j w_{ij} k(x_i,x_j)\f$ where w_ij are the weights of the gradient and x_i x_j are
177/// the datapoints defining the gram matrix and k is the kernel. For efficiency it is assumed that w_ij = w_ji.
178/// This method is only useful when the whole Kernel Gram Matrix needs to be computed to get the weights w_ij and
179/// only computing smaller blocks is not sufficient.
180/// \param kernel the kernel for which to calculate the kernel gram matrix
181/// \param dataset the set of points used in the gram matrix
182/// \param weights the weights of the derivative, they must be symmetric!
183/// \return the weighted derivative w.r.t the parameters.
184/// \ingroup kernels
185template<class InputType,class WeightMatrix>
188 Data<InputType> const& dataset,
189 WeightMatrix const& weights
190){
191 std::size_t kp = kernel.numberOfParameters();
192 RealMatrix block;//stores the kernel results of the block which we need to compute to get the State :(
193 RealVector kernelGradient(kp);//weighted gradient summed over the whole kernel matrix
194 kernelGradient.clear();
195
196 //calculate the gradint blockwise taking symmetry into account.
197 RealVector blockGradient(kp);//weighted gradient summed over the whole block
198 boost::shared_ptr<State> state = kernel.createState();
199 std::size_t startX = 0;
200 for (std::size_t i=0; i<dataset.numberOfBatches(); i++){
201 std::size_t sizeX= batchSize(dataset.batch(i));
202 std::size_t startY = 0;//start of the current batch in y-direction
203 for (std::size_t j=0; j <= i; j++){
204 std::size_t sizeY= batchSize(dataset.batch(j));
205 kernel.eval(dataset.batch(i), dataset.batch(j),block,*state);
207 dataset.batch(i), dataset.batch(j),//points
208 subrange(weights,startX,startX+sizeX,startY,startY+sizeY),//weights
209 *state,
210 blockGradient
211 );
212 if(i != j)
213 kernelGradient+=2*blockGradient;//Symmetry!
214 else
215 kernelGradient+=blockGradient;//middle blocks are symmetric
216 startY+= sizeY;
217 }
218 startX+=sizeX;
219 }
220 return kernelGradient;
221}
222
223}
224#endif