en/latest/Max_8h_source.html

 /*

  * Copyright (c) The Shogun Machine Learning Toolbox

  * Written (w) 2014 Khaled Nasr

  * All rights reserved.

  *

  * Redistribution and use in source and binary forms, with or without

  * modification, are permitted provided that the following conditions are met:

  *

  * 1. Redistributions of source code must retain the above copyright notice, this

  *    list of conditions and the following disclaimer.

  * 2. Redistributions in binary form must reproduce the above copyright notice,

  *    this list of conditions and the following disclaimer in the documentation

  *    and/or other materials provided with the distribution.

  *

  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR

  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

  *

  * The views and conclusions contained in the software and documentation are those

  * of the authors and should not be interpreted as representing official policies,

  * either expressed or implied, of the Shogun Development Team.

  */


 #ifndef MAX_IMPL_H_

 #define MAX_IMPL_H_


 #include <shogun/lib/config.h>

 #include <shogun/lib/SGMatrix.h>

 #include <shogun/lib/SGVector.h>

 #include <shogun/mathematics/Math.h>


 #include <shogun/mathematics/eigen3.h>


 #ifdef HAVE_VIENNACL

 #include <shogun/mathematics/linalg/internal/opencl_util.h>

 #include <shogun/lib/GPUMatrix.h>

 #include <shogun/lib/GPUVector.h>

 #endif


 #include <string>


 namespace shogun

 {


 namespace linalg

 {


 namespace implementation

 {


 /**
  * Generic max-reduction functor. This primary template only declares the
  * interface; the actual work is done by the per-backend partial
  * specializations.
  *
  * The first template argument selects the backend, the second (Matrix) is
  * the container type and must expose a nested Scalar type.
  */
 template <enum Backend, class Matrix>
 struct max
 {
     /** Element type of the container */
     using T = typename Matrix::Scalar;

     /**
      * Largest element of the container.
      *
      * @param m container to reduce
      * @return maximum element of m
      */
     static T compute(Matrix m);
 };


 template <class Matrix>

 struct max<Backend::EIGEN3,Matrix>

 {

     typedef typename Matrix::Scalar T;


     typedef Eigen::Matrix<T,Eigen::Dynamic,Eigen::Dynamic> MatrixXt;


     typedef Eigen::Matrix<T,Eigen::Dynamic,1> VectorXt;


     static T compute(SGMatrix<T> mat)

     {

         Eigen::Map<MatrixXt> m = mat;


         return m.maxCoeff();

     }


     static T compute(SGVector<T> vec)

     {

         Eigen::Map<VectorXt> v = vec;


         return v.maxCoeff();

     }

 };


 #ifdef HAVE_VIENNACL


 /**
  * ViennaCL (OpenCL) backend of the max reduction. Operates on CGPUMatrix
  * and CGPUVector by enqueueing a reduction kernel and returning element 0
  * of a one-element result vector.
  */
 template <class Matrix>

 struct max<Backend::VIENNACL,Matrix>

 {

     /** Element type of the container */
     typedef typename Matrix::Scalar T;


     /**
      * Returns the OpenCL kernel used for the max reduction of element type T,
      * building and compiling it on first use.
      *
      * The kernel is looked up under the name "max_" followed by the type
      * string of T; if a kernel with that name already exists it is returned
      * as is. Otherwise the source is assembled, compiled, and its local and
      * global work sizes (dimension 0) are both set to OCL_WORK_GROUP_SIZE_1D,
      * i.e. exactly one work-group is launched.
      *
      * NOTE(review): the template parameter T of this member template hides
      * the class-level typedef T inside this function; both call sites pass
      * the class-level T explicitly.
      *
      * @return reference to the compiled (or previously compiled) kernel
      */
     template <class T>

     static viennacl::ocl::kernel& generate_kernel()

     {

         std::string kernel_name = "max_" + ocl::get_type_string<T>();


         // Reuse the kernel if it has been registered before.
         if (ocl::kernel_exists(kernel_name))

             return ocl::get_kernel(kernel_name);


         // Presumably defines KERNEL_NAME, DATATYPE and WORK_GROUP_SIZE_1D for
         // the kernel body below -- TODO confirm against opencl_util.h.
         std::string source = ocl::generate_kernel_preamble<T>(kernel_name);


         // Kernel outline (arguments: vec, size, offset, result):
         //  1. Each work-item scans vec[offset + i] for i = local_id,
         //     local_id + WORK_GROUP_SIZE_1D, ... while i < size, keeping a
         //     private running maximum seeded with -INFINITY.
         //  2. The per-item maxima are stored in a __local buffer and combined
         //     by repeatedly halving the active range (j = size/2, size/4, ...),
         //     with a local-memory barrier before every step.
         //  3. After a final barrier, the work-item with global id 0 writes
         //     buffer[0] to *result.
         // NOTE(review): with size == 0 the result is the -INFINITY seed.
         // NOTE(review): -INFINITY is a floating-point constant; behaviour for
         // integer DATATYPE looks questionable -- confirm which types are used.
         // NOTE(review): the halving loop appears to assume WORK_GROUP_SIZE_1D
         // is a power of two -- confirm.
         source.append(

             R"(

                 __kernel void KERNEL_NAME(

                     __global DATATYPE* vec, int size, int offset,

                     __global DATATYPE* result)

                 {

                     __local DATATYPE buffer[WORK_GROUP_SIZE_1D];


                     int local_id = get_local_id(0);


                     DATATYPE thread_max = -INFINITY;

                     for (int i=local_id; i<size; i+=WORK_GROUP_SIZE_1D)

                     {

                         DATATYPE v = vec[i+offset];

                         thread_max = max(v, thread_max);

                     }


                     buffer[local_id] = thread_max;


                     for (int j = WORK_GROUP_SIZE_1D/2; j > 0; j = j>>1)

                     {

                         barrier(CLK_LOCAL_MEM_FENCE);

                         if (local_id < j)

                             buffer[local_id] = max(buffer[local_id], buffer[local_id + j]);

                     }


                     barrier(CLK_LOCAL_MEM_FENCE);


                     if (get_global_id(0)==0)

                         *result = buffer[0];

                 }

             )"

         );


         viennacl::ocl::kernel& kernel = ocl::compile_kernel(kernel_name, source);


         // Local size == global size: the whole reduction runs in one
         // work-group, which is what the __local buffer reduction relies on.
         kernel.local_work_size(0, OCL_WORK_GROUP_SIZE_1D);

         kernel.global_work_size(0, OCL_WORK_GROUP_SIZE_1D);


         return kernel;

     }


     /**
      * Largest element of a GPU matrix.
      *
      * The matrix is handed to the kernel as a flat buffer of
      * num_rows*num_cols elements starting at mat.offset.
      *
      * @param mat matrix to reduce
      * @return element 0 of the one-element result vector written by the kernel
      */
     static T compute(CGPUMatrix<T> mat)

     {

         viennacl::ocl::kernel& kernel = generate_kernel<T>();


         // One-element vector that receives the kernel's output.
         CGPUVector<T> result(1);


         viennacl::ocl::enqueue(kernel(mat.vcl_matrix(),

             cl_int(mat.num_rows*mat.num_cols), cl_int(mat.offset),

             result.vcl_vector()));


         return result[0];

     }


     /**
      * Largest element of a GPU vector.
      *
      * The kernel is given vec.vlen as the element count and vec.offset as
      * the start offset.
      *
      * @param vec vector to reduce
      * @return element 0 of the one-element result vector written by the kernel
      */
     static T compute(CGPUVector<T> vec)

     {

         viennacl::ocl::kernel& kernel = generate_kernel<T>();


         // One-element vector that receives the kernel's output.
         CGPUVector<T> result(1);


         viennacl::ocl::enqueue(kernel(vec.vcl_vector(),

             cl_int(vec.vlen), cl_int(vec.offset),

             result.vcl_vector()));


         return result[0];

     }

 };

 #endif // HAVE_VIENNACL


 }


 }


 }

 #endif // MAX_IMPL_H_

GPUVector.h

Math.h

eigen3.h

Eigen::Map
Definition: SGMatrix.h:24

config.h

SGMatrix.h

shogun::SGMatrix
shogun matrix
Definition: base/Parameter.h:26

shogun::SGVector
shogun vector
Definition: base/Parameter.h:28

shogun::linalg::implementation::max
Generic class which is specialized for different backends to perform the max operation.
Definition: Max.h:63

shogun::linalg::implementation::max::compute
static T compute(Matrix m)

shogun::linalg::implementation::max< Backend::EIGEN3, Matrix >::T
Matrix::Scalar T
Definition: Max.h:83

shogun::linalg::implementation::max< Backend::EIGEN3, Matrix >::VectorXt
Eigen::Matrix< T, Eigen::Dynamic, 1 > VectorXt
Definition: Max.h:89

shogun::linalg::implementation::max::T
Matrix::Scalar T
Definition: Max.h:66

shogun
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18

opencl_util.h

Eigen::Matrix
Definition: SGMatrix.h:22

shogun::linalg::implementation::max< Backend::EIGEN3, Matrix >::compute
static T compute(SGMatrix< T > mat)
Definition: Max.h:96

shogun::linalg::implementation::max< Backend::EIGEN3, Matrix >::compute
static T compute(SGVector< T > vec)
Definition: Max.h:108

GPUMatrix.h

shogun::linalg::max
Matrix::Scalar max(Matrix m)
Definition: Redux.h:68

shogun::linalg::implementation::max< Backend::EIGEN3, Matrix >::MatrixXt
Eigen::Matrix< T, Eigen::Dynamic, Eigen::Dynamic > MatrixXt
Definition: Max.h:86

SGVector.h