TASMANIAN/rolling/tsgGpuWrappers_8hpp_source.html

 /*

  * Copyright (c) 2017, Miroslav Stoyanov

  *

  * This file is part of

  * Toolkit for Adaptive Stochastic Modeling And Non-Intrusive ApproximatioN: TASMANIAN

  *

  * Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:

  *

  * 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.

  *

  * 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions

  *    and the following disclaimer in the documentation and/or other materials provided with the distribution.

  *

  * 3. Neither the name of the copyright holder nor the names of its contributors may be used to endorse

  *    or promote products derived from this software without specific prior written permission.

  *

  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,

  * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.

  * IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY,

  * OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA,

  * OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,

  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

  *

  * UT-BATTELLE, LLC AND THE UNITED STATES GOVERNMENT MAKE NO REPRESENTATIONS AND DISCLAIM ALL WARRANTIES, BOTH EXPRESSED AND IMPLIED.

  * THERE ARE NO EXPRESS OR IMPLIED WARRANTIES OF MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE, OR THAT THE USE OF THE SOFTWARE WILL NOT INFRINGE ANY PATENT,

  * COPYRIGHT, TRADEMARK, OR OTHER PROPRIETARY RIGHTS, OR THAT THE SOFTWARE WILL ACCOMPLISH THE INTENDED RESULTS OR THAT THE SOFTWARE OR ITS USE WILL NOT RESULT IN INJURY OR DAMAGE.

  * THE USER ASSUMES RESPONSIBILITY FOR ALL LIABILITIES, PENALTIES, FINES, CLAIMS, CAUSES OF ACTION, AND COSTS AND EXPENSES, CAUSED BY, RESULTING FROM OR ARISING OUT OF,

  * IN WHOLE OR IN PART THE USE, STORAGE OR DISPOSAL OF THE SOFTWARE.

  */


 #ifndef __TASMANIAN_GPU_WRAPPERS_HPP

 #define __TASMANIAN_GPU_WRAPPERS_HPP


 #include "tsgAcceleratedDataStructures.hpp"


 namespace TasGrid{

 namespace TasGpu{


 /*!
  * \brief Least squares solver with data sitting on the gpu device.
  *
  * Only the declaration is given in this header.
  * NOTE(review): the meaning of n, m and nrhs and the storage layout of A and B
  * are not stated here; confirm them against the implementation.
  */
 template<typename scalar_type>

 void solveLSmultiGPU(AccelerationContext const *acceleration, int n, int m, scalar_type A[], int nrhs, scalar_type B[]);


 /*!
  * \brief Variant of solveLSmultiGPU() with the same parameter list.
  *
  * Only the declaration is given in this header.
  * NOTE(review): the project documentation summary describes this as the version where the
  * arrays are on the CPU and a MAGMA out-of-core implementation is used; confirm against the implementation.
  */
 template<typename scalar_type>

 void solveLSmultiOOC(AccelerationContext const *acceleration, int n, int m, scalar_type A[], int nrhs, scalar_type B[]);


 /*!
  * \brief Front end for solveLSmultiGPU() that accepts the arrays A and B as plain pointers.
  *
  * Temporary GpuVector objects are built from A (with sizes m, n) and B (with sizes nrhs, n),
  * solveLSmultiGPU() is called on the pointers returned by their data() methods,
  * and afterwards only the B vector is unloaded back into the B pointer.
  * The A array is never copied back.
  *
  * \param acceleration context handed to the GpuVector constructors, the solver and unload()
  * \param n, m, nrhs sizes forwarded unchanged to solveLSmultiGPU()
  * \param A source for the first temporary GpuVector
  * \param B source for the second temporary GpuVector and destination of the unload
  */
 template<typename scalar_type>
 void solveLSmulti(AccelerationContext const *acceleration, int n, int m, scalar_type A[], int nrhs, scalar_type B[]){
     // temporary copies of the two input arrays
     GpuVector<scalar_type> device_matrix(acceleration, m, n, A);
     GpuVector<scalar_type> device_rhs(acceleration, nrhs, n, B);

     // the solver works directly on the raw arrays held by the temporaries
     scalar_type *matrix_ptr = device_matrix.data();
     scalar_type *rhs_ptr = device_rhs.data();
     solveLSmultiGPU(acceleration, n, m, matrix_ptr, nrhs, rhs_ptr);

     // bring the right-hand-side array back to the caller
     device_rhs.unload(acceleration, B);
 }


 /*!
  * \brief PLU factorization of A; per the project documentation the arrays are on the GPU.
  *
  * Both A and ipiv are non-const, i.e., both may be written by the call.
  * NOTE(review): presumably A is n by n and ipiv receives the pivots; confirm against the implementation.
  */
 void factorizePLU(AccelerationContext const *acceleration, int n, double A[], int_gpu_lapack ipiv[]);

 /*!
  * \brief Solve A x = b using a PLU factorization.
  *
  * A and ipiv are read-only inputs, b is the only writable array.
  * NOTE(review): presumably A and ipiv come from factorizePLU() and trans selects
  * the transposed or non-transposed system; confirm against the implementation.
  */
 void solvePLU(AccelerationContext const *acceleration, char trans, int n, double const A[], int_gpu_lapack const ipiv[], double b[]);

 /*!
  * \brief Overload of solvePLU() that takes an additional nrhs count and a writable array B.
  *
  * NOTE(review): presumably solves for nrhs right-hand sides stored in B; confirm against the implementation.
  */
 void solvePLU(AccelerationContext const *acceleration, char trans, int n, double const A[], int_gpu_lapack const ipiv[], int nrhs, double B[]);


 /*!
  * \brief Wrapper to GPU BLAS that multiplies dense matrices (e.g., cuBlas, MAGMA).
  *
  * A and B are passed as read-only GpuVector objects, C is a writable raw array.
  * The scalars alpha and beta use the value_type of the GpuVector.
  * Only the declaration is given in this header.
  * NOTE(review): presumably computes C = beta C + alpha A B with M, N, K as the matrix sizes,
  * following the BLAS gemm convention; confirm against the implementation.
  */
 template<typename scalar_type>

 void denseMultiply(AccelerationContext const *acceleration, int M, int N, int K,

                    typename GpuVector<scalar_type>::value_type alpha, GpuVector<scalar_type> const &A,

                    GpuVector<scalar_type> const &B, typename GpuVector<scalar_type>::value_type beta, scalar_type C[]);


 /*!
  * \brief Calls denseMultiply() for the case where B and C are plain arrays while A is already a GpuVector.
  *
  * B is copied into a temporary GpuVector (sizes K, N), denseMultiply() is called with a temporary
  * result GpuVector (sizes M, N), and the result is unloaded into C.
  *
  * The scalar beta is forwarded to denseMultiply() together with the temporary result vector.
  * If beta is non-zero, the temporary therefore has to start from the caller's C,
  * otherwise the beta-scaled term would not be based on the caller's data.
  * If beta is zero, the temporary is created without data and the extra copy of C is skipped.
  *
  * \param acceleration context handed to the GpuVector constructors, denseMultiply() and unload()
  * \param M, N, K sizes forwarded unchanged to denseMultiply()
  * \param alpha scalar forwarded unchanged to denseMultiply()
  * \param A read-only GpuVector forwarded unchanged to denseMultiply()
  * \param B array copied into a temporary GpuVector
  * \param beta scalar forwarded unchanged to denseMultiply(); also decides whether C is uploaded
  * \param C destination of the result; read as an input only when beta is non-zero
  */
 template<typename scalar_type>
 void denseMultiplyMixed(AccelerationContext const *acceleration, int M, int N, int K, typename GpuVector<scalar_type>::value_type alpha,
                         GpuVector<scalar_type> const &A, scalar_type const B[],
                         typename GpuVector<scalar_type>::value_type beta, scalar_type C[]){
     using value_type = typename GpuVector<scalar_type>::value_type;

     GpuVector<scalar_type> gpuB(acceleration, K, N, B);

     // common tail of both branches: multiply into the temporary and copy the result back into C
     auto multiply_and_unload = [&](GpuVector<scalar_type> &gpuC)->void{
         denseMultiply(acceleration, M, N, K, alpha, A, gpuB, beta, gpuC.data());
         gpuC.unload(acceleration, C);
     };

     if (beta == static_cast<value_type>(0)){
         // the old content of C does not contribute, no need to transfer it
         GpuVector<scalar_type> gpuC(acceleration, M, N);
         multiply_and_unload(gpuC);
     }else{
         // the beta term needs the caller's C, so the temporary starts as a copy of it
         GpuVector<scalar_type> gpuC(acceleration, M, N, C);
         multiply_and_unload(gpuC);
     }
 }


 /*!
  * \brief Wrapper to GPU methods that multiplies a sparse and a dense matrix.
  *
  * A, pntr, indx and vals are passed as read-only GpuVector objects, C is a writable raw array.
  * There is no beta parameter in this signature.
  * Only the declaration is given in this header.
  * NOTE(review): presumably pntr, indx and vals describe the sparse matrix in a compressed
  * format and A is the dense matrix; confirm against the implementation.
  */
 template<typename scalar_type>

 void sparseMultiply(AccelerationContext const *acceleration, int M, int N, int K, typename GpuVector<scalar_type>::value_type alpha,

                     const GpuVector<scalar_type> &A, const GpuVector<int> &pntr, const GpuVector<int> &indx,

                     const GpuVector<scalar_type> &vals, scalar_type C[]);


 /*!
  * \brief Calls sparseMultiply() for the case where pntr, indx and vals are std::vector objects and C is a plain array.
  *
  * Each of the three std::vector inputs is copied into a temporary GpuVector,
  * sparseMultiply() writes into a temporary result GpuVector (sizes M, N),
  * and the result is then unloaded into C.
  *
  * \param acceleration context handed to the GpuVector constructors, sparseMultiply() and unload()
  * \param M, N, K sizes forwarded unchanged to sparseMultiply()
  * \param alpha scalar forwarded unchanged to sparseMultiply()
  * \param A read-only GpuVector forwarded unchanged to sparseMultiply()
  * \param pntr, indx, vals vectors copied into temporary GpuVector objects
  * \param C destination of the unloaded result
  */
 template<typename T>
 void sparseMultiplyMixed(AccelerationContext const *acceleration, int M, int N, int K, typename GpuVector<T>::value_type alpha, const GpuVector<T> &A,
                          const std::vector<int> &pntr, const std::vector<int> &indx, const std::vector<T> &vals, T C[]){
     // temporary copies of the three input vectors
     GpuVector<int> device_pntr(acceleration, pntr);
     GpuVector<int> device_indx(acceleration, indx);
     GpuVector<T> device_vals(acceleration, vals);

     // temporary that receives the product
     GpuVector<T> device_result(acceleration, M, N);

     T *result_ptr = device_result.data();
     sparseMultiply(acceleration, M, N, K, alpha, A, device_pntr, device_indx, device_vals, result_ptr);

     // copy the product back to the caller
     device_result.unload(acceleration, C);
 }


 }

 }


 #endif

TasGrid::GpuVector
Template class that wraps around a single GPU array, providing functionality that mimics std::vector.
Definition: tsgAcceleratedDataStructures.hpp:95

TasGrid::GpuVector::unload
void unload(AccelerationContext const *acc, std::vector< T > &cpu_data) const
Copy the data from the GPU array to cpu_data, the cpu_data will be resized and overwritten.
Definition: tsgAcceleratedDataStructures.hpp:196

TasGrid::GpuVector::data
T * data()
Get a reference to the GPU array, which can be used as input to GPU libraries and kernels.
Definition: tsgAcceleratedDataStructures.hpp:145

TasGrid::GpuVector::value_type
T value_type
The data-type of the vector entries.
Definition: tsgAcceleratedDataStructures.hpp:220

TasGrid::TasGpu::solveLSmultiOOC
void solveLSmultiOOC(AccelerationContext const *acceleration, int n, int m, scalar_type A[], int nrhs, scalar_type B[])
Identical to TasGpu::solveLSmultiGPU() but the arrays are on the CPU and the MAGMA out-of-core implem...

TasGrid::TasGpu::sparseMultiplyMixed
void sparseMultiplyMixed(AccelerationContext const *acceleration, int M, int N, int K, typename GpuVector< T >::value_type alpha, const GpuVector< T > &A, const std::vector< int > &pntr, const std::vector< int > &indx, const std::vector< T > &vals, T C[])
Identical to TasGpu::sparseMultiply() but the sparse matrix and the result C are in CPU memory.
Definition: tsgGpuWrappers.hpp:120

TasGrid::TasGpu::solveLSmultiGPU
void solveLSmultiGPU(AccelerationContext const *acceleration, int n, int m, scalar_type A[], int nrhs, scalar_type B[])
Least squares solver with data sitting on the gpu device.

TasGrid::TasGpu::solvePLU
void solvePLU(AccelerationContext const *acceleration, char trans, int n, double const A[], int_gpu_lapack const ipiv[], double b[])
Solve A x = b using a PLU factorization.

TasGrid::TasGpu::sparseMultiply
void sparseMultiply(AccelerationContext const *acceleration, int M, int N, int K, typename GpuVector< scalar_type >::value_type alpha, const GpuVector< scalar_type > &A, const GpuVector< int > &pntr, const GpuVector< int > &indx, const GpuVector< scalar_type > &vals, scalar_type C[])
Wrapper to GPU methods that multiplies a sparse and a dense matrix.

TasGrid::TasGpu::factorizePLU
void factorizePLU(AccelerationContext const *acceleration, int n, double A[], int_gpu_lapack ipiv[])
Factorize $A = P L U$, arrays are on the GPU.

TasGrid::TasGpu::denseMultiplyMixed
void denseMultiplyMixed(AccelerationContext const *acceleration, int M, int N, int K, typename GpuVector< scalar_type >::value_type alpha, GpuVector< scalar_type > const &A, scalar_type const B[], typename GpuVector< scalar_type >::value_type beta, scalar_type C[])
Identical to TasGpu::denseMultiply() but both B and C are arrays in CPU memory.
Definition: tsgGpuWrappers.hpp:99

TasGrid::TasGpu::denseMultiply
void denseMultiply(AccelerationContext const *acceleration, int M, int N, int K, typename GpuVector< scalar_type >::value_type alpha, GpuVector< scalar_type > const &A, GpuVector< scalar_type > const &B, typename GpuVector< scalar_type >::value_type beta, scalar_type C[])
Wrapper to GPU BLAS that multiplies dense matrices (e.g., cuBlas, MAGMA).

TasGrid::TasGpu::solveLSmulti
void solveLSmulti(AccelerationContext const *acceleration, int n, int m, scalar_type A[], int nrhs, scalar_type B[])
Identical to TasGpu::solveLSmultiGPU() but the data starts with the CPU and gets uploaded to the GPU ...
Definition: tsgGpuWrappers.hpp:70

TasGrid
Encapsulates the Tasmanian Sparse Grid module.
Definition: TasmanianSparseGrid.hpp:68

TasGrid::int_gpu_lapack
int int_gpu_lapack
Defines the integer used by the LAPACK methods, usually int but DPC++ uses int64_t.
Definition: tsgEnumerates.hpp:97

TasGrid::AccelerationContext
Wrapper class around GPU device ID, acceleration type and GpuEngine.
Definition: tsgAcceleratedDataStructures.hpp:576

tsgAcceleratedDataStructures.hpp
Data structures for interacting with CUDA and MAGMA environments.