cn/current/MMDKernelSelectionComb_8cpp_source.html

 /*

  * This program is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 3 of the License, or

  * (at your option) any later version.

  *

  * Written (W) 2012-2013 Heiko Strathmann

  */


 #include <shogun/statistics/MMDKernelSelectionComb.h>

 #include <shogun/statistics/KernelTwoSampleTest.h>

 #include <shogun/kernel/CombinedKernel.h>


 using namespace shogun;


 /** Default constructor. Delegates to the default constructor of the
  * CMMDKernelSelection base class and then calls init() to set up the
  * optimisation parameters of this class. */
 CMMDKernelSelectionComb::CMMDKernelSelectionComb() : CMMDKernelSelection()
 {
     init();
 }


 /** Constructor taking the two-sample test to select a kernel for.
  *
  * @param mmd kernel two-sample test instance; forwarded unchanged to the
  * CMMDKernelSelection base-class constructor
  */
 CMMDKernelSelectionComb::CMMDKernelSelectionComb(CKernelTwoSampleTest* mmd)
     : CMMDKernelSelection(mmd)
 {
     init();
 }


 /** Destructor; intentionally empty. */
 CMMDKernelSelectionComb::~CMMDKernelSelectionComb() {}


 /** Shared initialisation used by both constructors: assigns default values
  * to the QP solver options and registers them via SG_ADD. */
 void CMMDKernelSelectionComb::init()
 {
     /* default solver settings; note that the literal 10E-15 denotes 1e-14
      * and 10E-7 denotes 1e-6 */
     m_opt_max_iterations=10000;
     m_opt_epsilon=10E-15;
     m_opt_low_cut=10E-7;

     /* register the three options, each flagged MS_NOT_AVAILABLE */
     SG_ADD(&m_opt_max_iterations, "opt_max_iterations",
             "Maximum number of iterations for qp solver", MS_NOT_AVAILABLE);
     SG_ADD(&m_opt_epsilon, "opt_epsilon",
             "Stopping criterion for qp solver", MS_NOT_AVAILABLE);
     SG_ADD(&m_opt_low_cut, "opt_low_cut",
             "Low cut value for optimization kernel weights",
             MS_NOT_AVAILABLE);
 }


 /** Selects a kernel by computing weights via compute_measures() and setting
  * them as subkernel weights on the estimator's kernel.
  *
  * @return the kernel obtained from m_estimator->get_kernel(), with its
  * subkernel weights replaced by the computed ones
  */
 CKernel* CMMDKernelSelectionComb::select_kernel()
 {
     /* The estimator's kernel is treated as a combined kernel. The downcast
      * is unchecked in this function; the original author's note states that
      * it is guarded by an assertion made at construction time. */
     CKernel* estimator_kernel=m_estimator->get_kernel();
     CCombinedKernel* combined_kernel=
             static_cast<CCombinedKernel*>(estimator_kernel);

     /* compute the kernel weights and hand them to the combined kernel */
     SGVector<float64_t> kernel_weights=compute_measures();
     combined_kernel->set_subkernel_weights(kernel_weights);

     /* per the original note, the getter above SG_REF's the kernel, so the
      * returned pointer is already referenced for the caller */
     return combined_kernel;
 }


 /* Definition of the static matrix m_Q that get_Q_col() reads from. It is
  * built with the bool ("static context") constructor of SGMatrix, passing
  * false so that no reference counting is used. */
 SGMatrix<float64_t> CMMDKernelSelectionComb::m_Q(false);


 /** Column accessor for the static matrix m_Q; its address is passed to the
  * libqp solver in solve_optimization().
  *
  * @param i index of the requested column
  * @return pointer to the element of m_Q at linear index num_rows*i, i.e.
  * the start of column i assuming column-major storage
  */
 const float64_t* CMMDKernelSelectionComb::get_Q_col(uint32_t i)
 {
     /* linear offset of the first element of the requested column */
     const uint32_t column_start=m_Q.num_rows*i;
     return &m_Q[column_start];
 }


 /** State callback passed to the libqp solver; writes the QP field of the
  * given state (labelled "primal") to the debug log.
  *
  * @param state solver state as supplied by libqp
  */
 void CMMDKernelSelectionComb::print_state(libqp_state_T state)
 {
     const float64_t primal=state.QP;
     SG_SDEBUG("libqp state: primal=%f\n", primal);
 }


 /** Solves the quadratic program that yields the kernel weights.
  *
  * The program handed to the libqp GSMO solver is
  *
  *   minimise    0.5*x'*Q*x + f'*x     (with f = 0)
  *   subject to  mmds'*x = 1
  *               0 <= x[i] <= INFTY    for all i
  *
  * where Q is read from the static member m_Q (through get_Q_col() and its
  * diagonal), so m_Q has to be filled by the caller before this method is
  * invoked. After optimisation, weights below m_opt_low_cut are set to zero
  * and the remaining weights are normalised to sum to one.
  *
  * Equally distributed weights 1/num_kernels are returned (with a warning)
  * if no MMD estimate is positive, or if no weight survives the low cut so
  * that normalisation would divide by zero.
  *
  * @param mmds vector of MMD estimates, one entry per kernel
  * @return vector of kernel weights with the same length as mmds
  */
 SGVector<float64_t> CMMDKernelSelectionComb::solve_optimization(
         SGVector<float64_t> mmds)
 {
     /* readability */
     index_t num_kernels=mmds.vlen;

     SGVector<float64_t> weights(num_kernels);

     /* There are two cases possible: i) at least one mmd is positive,
      * ii) no mmd is positive. While checking, accumulate the sum of all
      * mmds and the sum of the positive ones; both are used below to build a
      * feasible starting point for the convex program. */
     float64_t sum_mmds=0;
     float64_t sum_pos_mmds=0;
     bool one_pos=false;
     for (index_t i=0; i<num_kernels; ++i)
     {
         sum_mmds+=mmds[i];

         if (mmds[i]>0)
         {
             sum_pos_mmds+=mmds[i];
             one_pos=true;
         }
     }

     if (!one_pos)
     {
         /* also reached when estimates are exactly zero */
         SG_WARNING("All mmd estimates are negative. This is technically "
                 "possible, although extremely rare. Consider using different "
                 "kernels. This combination will lead to a bad two-sample "
                 "test. Since any combination is bad, will now just return "
                 "equally distributed kernel weights\n");

         /* if no element is positive, we can choose arbitrary weights since
          * the results will be bad anyway */
         weights.set_const(1.0/num_kernels);
         return weights;
     }

     SG_DEBUG("found at least one positive MMD\n")
     SG_DEBUG("one MMD entry is positive, performing optimisation\n")

     /* QP: 0.5*x'*Q*x + f'*x
      * subject to
      * mmds'*x = b
      * LB[i] <= x[i] <= UB[i]   for all i=1..n */
     SGVector<float64_t> Q_diag(num_kernels);
     SGVector<float64_t> f(num_kernels);
     SGVector<float64_t> lb(num_kernels);
     SGVector<float64_t> ub(num_kernels);

     /* The initial point has to be feasible, i.e. mmds'*x = 1 and x >= 0.
      * The constant vector 1/sum_mmds satisfies this only if sum_mmds is
      * positive. With mixed signs the sum may be zero or negative, which
      * would give infinite or negative start weights; in that case put the
      * constant 1/sum_pos_mmds on the positive entries and zero elsewhere,
      * which is feasible whenever at least one mmd is positive. */
     bool constant_start=sum_mmds>0;

     for (index_t i=0; i<num_kernels; ++i)
     {
         Q_diag[i]=m_Q(i,i);
         f[i]=0;
         lb[i]=0;
         ub[i]=CMath::INFTY;

         if (constant_start)
             weights[i]=1.0/sum_mmds;
         else
             weights[i]=mmds[i]>0 ? 1.0/sum_pos_mmds : 0;
     }

     /* start libqp solver with desired parameters; the right hand side of
      * the equality constraint is 1 since at least one mmd is positive */
     SG_DEBUG("starting libqp optimization\n")
     libqp_state_T qp_exitflag=libqp_gsmo_solver(&get_Q_col, Q_diag.vector,
             f.vector, mmds.vector,
             1,
             lb.vector, ub.vector,
             weights.vector, num_kernels, m_opt_max_iterations,
             m_opt_epsilon, &(CMMDKernelSelectionComb::print_state));

     SG_DEBUG("libqp returns: nIts=%d, exit_flag: %d\n", qp_exitflag.nIter,
             qp_exitflag.exitflag);

     /* set really small entries to zero and sum up for normalization */
     float64_t sum_weights=0;
     for (index_t i=0; i<weights.vlen; ++i)
     {
         if (weights[i]<m_opt_low_cut)
         {
             SG_DEBUG("lowcut: weight[%i]=%f<%f setting to zero\n", i,
                     weights[i], m_opt_low_cut);
             weights[i]=0;
         }

         sum_weights+=weights[i];
     }

     /* guard the normalisation: if nothing survived the low cut (or the sum
      * is not a number), dividing would produce invalid weights */
     if (!(sum_weights>0))
     {
         SG_WARNING("No kernel weight is above the low cut value %f after "
                 "optimisation, will now just return equally distributed "
                 "kernel weights\n", m_opt_low_cut);
         weights.set_const(1.0/num_kernels);
         return weights;
     }

     /* normalize (allowed since problem is scale invariant) */
     for (index_t i=0; i<weights.vlen; ++i)
         weights[i]/=sum_weights;

     return weights;
 }

shogun::CMMDKernelSelectionComb::select_kernel
virtual CKernel * select_kernel()
Definition: MMDKernelSelectionComb.cpp:47

shogun::CCombinedKernel::set_subkernel_weights
virtual void set_subkernel_weights(SGVector< float64_t > weights)
Definition: CombinedKernel.cpp:694

shogun::CKernelTwoSampleTest::get_kernel
virtual CKernel * get_kernel()
Definition: KernelTwoSampleTest.h:86

shogun::CMMDKernelSelectionComb::m_Q
static SGMatrix< float64_t > m_Q
Definition: MMDKernelSelectionComb.h:86

index_t
int32_t index_t
Definition: common.h:62

shogun::CMath::INFTY
static const float64_t INFTY
infinity
Definition: Math.h:2048

shogun::CMMDKernelSelectionComb::solve_optimization
virtual SGVector< float64_t > solve_optimization(SGVector< float64_t > mmds)
Definition: MMDKernelSelectionComb.cpp:74

shogun::CMMDKernelSelection
Base class for kernel selection for MMD-based two-sample test statistic implementations. Provides abstract methods for selecting kernels and computing criteria or kernel weights for the implemented method. In order to implement new methods for kernel selection, simply write a new implementation of this class.
Definition: MMDKernelSelection.h:57

shogun::CMMDKernelSelectionComb::m_opt_max_iterations
index_t m_opt_max_iterations
Definition: MMDKernelSelectionComb.h:77

CombinedKernel.h

shogun::CKernelTwoSampleTest
Kernel two sample test base class. Provides an interface for performing a two-sample test using a ker...
Definition: KernelTwoSampleTest.h:38

shogun::CMMDKernelSelectionComb::print_state
static void print_state(libqp_state_T state)
Definition: MMDKernelSelectionComb.cpp:69

shogun::SGMatrix::num_rows
index_t num_rows
Definition: SGMatrix.h:376

shogun::SGMatrix< float64_t >

shogun::MS_NOT_AVAILABLE
Definition: SGObject.h:89

shogun::CMMDKernelSelectionComb::CMMDKernelSelectionComb
CMMDKernelSelectionComb()
Definition: MMDKernelSelectionComb.cpp:16

shogun::SGVector::vlen
index_t vlen
Definition: SGVector.h:494

shogun::SGVector::vector
T * vector
Definition: SGVector.h:492

shogun::SGVector< float64_t >

shogun::CMMDKernelSelectionComb::m_opt_low_cut
float64_t m_opt_low_cut
Definition: MMDKernelSelectionComb.h:83

float64_t
double float64_t
Definition: common.h:50

shogun::CCombinedKernel
The Combined kernel is used to combine a number of kernels into a single CombinedKernel object by lin...
Definition: CombinedKernel.h:49

shogun::CMMDKernelSelection::compute_measures
virtual SGVector< float64_t > compute_measures()=0

shogun::CMMDKernelSelectionComb::get_Q_col
static const float64_t * get_Q_col(uint32_t i)
Definition: MMDKernelSelectionComb.cpp:63

MMDKernelSelectionComb.h

shogun::CKernelSelection::m_estimator
CKernelTwoSampleTest * m_estimator
Definition: KernelSelection.h:99

SG_DEBUG
#define SG_DEBUG(...)
Definition: SGIO.h:107

shogun
all classes and functions are contained in the shogun namespace
Definition: class_list.h:18

SG_SDEBUG
#define SG_SDEBUG(...)
Definition: SGIO.h:168

shogun::CMMDKernelSelectionComb::m_opt_epsilon
float64_t m_opt_epsilon
Definition: MMDKernelSelectionComb.h:80

KernelTwoSampleTest.h

shogun::CKernel
The Kernel base class.
Definition: Kernel.h:158

SG_WARNING
#define SG_WARNING(...)
Definition: SGIO.h:128

SG_ADD
#define SG_ADD(...)
Definition: SGObject.h:81

shogun::CMMDKernelSelectionComb::~CMMDKernelSelectionComb
virtual ~CMMDKernelSelectionComb()
Definition: MMDKernelSelectionComb.cpp:28

shogun::SGVector::set_const
void set_const(T const_elem)
Definition: SGVector.cpp:152