Implementation for inc/dense/cuda_transpose.h
More...
#include "inc/dense/cuda_transpose.h"
#include "inc/dense/dense_transpose_r2.h"
#include "inc/util/cublas_support.h"
Namespaces | |
namespace | syten |
Syten namespace. | |
namespace | syten::CudaDenseTensorImpl |
Implementation namespace for CUDA dense tensors. | |
Functions | |
void | syten::CudaDenseTensorImpl::cuda_transpose_r2 (CudaConstSpan< double > inp, CudaMutSpan< double > out, Index inp_rows, Index inp_cols, Conj const conj=Conj::n()) |
Transposes a rank-2 CUDA matrix, stored in row-major format with inp_rows rows and inp_cols columns, from range inp into range out. More... | |
void | syten::CudaDenseTensorImpl::cuda_transpose_r2 (CudaConstSpan< float > inp, CudaMutSpan< float > out, Index inp_rows, Index inp_cols, Conj const conj=Conj::n()) |
Transposes a rank-2 CUDA matrix, stored in row-major format with inp_rows rows and inp_cols columns, from range inp into range out. More... | |
void | syten::CudaDenseTensorImpl::cuda_transpose_r2 (CudaConstSpan< std::complex< double > > inp, CudaMutSpan< std::complex< double > > out, Index inp_rows, Index inp_cols, Conj const conj=Conj::n()) |
Transposes a rank-2 CUDA matrix, stored in row-major format with inp_rows rows and inp_cols columns, from range inp into range out. More... | |
void | syten::CudaDenseTensorImpl::cuda_transpose_r2 (CudaConstSpan< std::complex< float > > inp, CudaMutSpan< std::complex< float > > out, Index inp_rows, Index inp_cols, Conj const conj=Conj::n()) |
Transposes a rank-2 CUDA matrix, stored in row-major format with inp_rows rows and inp_cols columns, from range inp into range out. More... | |
Implementation for inc/dense/cuda_transpose.h