PARALUTION 1.0.0
PARALUTION
cuda_kernels_ell.hpp File Reference

Go to the source code of this file.

Namespaces

 paralution
 

Functions

template<typename ValueType, typename IndexType>
__global__ void paralution::kernel_ell_spmv (const IndexType num_rows, const IndexType num_cols, const IndexType num_cols_per_row, const IndexType *Acol, const ValueType *Aval, const ValueType *x, ValueType *y)
 
template<typename ValueType, typename IndexType>
__global__ void paralution::kernel_ell_add_spmv (const IndexType num_rows, const IndexType num_cols, const IndexType num_cols_per_row, const IndexType *Acol, const ValueType *Aval, const ValueType scalar, const ValueType *x, ValueType *y)
 
template<typename ValueType, typename IndexType, unsigned int BLOCK_SIZE>
__global__ void paralution::kernel_ell_max_row (const IndexType nrow, const ValueType *data, ValueType *out, const IndexType GROUP_SIZE, const IndexType LOCAL_SIZE)
 
template<typename ValueType, typename IndexType>
__global__ void paralution::kernel_ell_csr_to_ell (const IndexType nrow, const IndexType max_row, const IndexType *src_row_offset, const IndexType *src_col, const ValueType *src_val, IndexType *ell_col, ValueType *ell_val)