|
void | syten::CudaDenseTensorImpl::cuda_transpose_kernel_impl (std::uint32_t rank, std::size_t sz, const double *inp, double *out, cukrn_transpose_array const &old_dim, cukrn_transpose_array const &new_dim, cukrn_transpose_array const &ar_perm, void *str, bool do_conj) |
| Launcher for the CUDA tensor transposition kernel, double version.
|
|
void | syten::CudaDenseTensorImpl::cuda_transpose_kernel_impl (std::uint32_t rank, std::size_t sz, const float *inp, float *out, cukrn_transpose_array const &old_dim, cukrn_transpose_array const &new_dim, cukrn_transpose_array const &ar_perm, void *str, bool do_conj) |
| Launcher for the CUDA tensor transposition kernel, float version.
|
|
void | syten::CudaDenseTensorImpl::cuda_transpose_kernel_impl (std::uint32_t rank, std::size_t sz, const std::complex< double > *inp, std::complex< double > *out, cukrn_transpose_array const &old_dim, cukrn_transpose_array const &new_dim, cukrn_transpose_array const &ar_perm, void *str, bool do_conj) |
| Launcher for the CUDA tensor transposition kernel, std::complex<double> version.
|
|
void | syten::CudaDenseTensorImpl::cuda_transpose_kernel_impl (std::uint32_t rank, std::size_t sz, const std::complex< float > *inp, std::complex< float > *out, cukrn_transpose_array const &old_dim, cukrn_transpose_array const &new_dim, cukrn_transpose_array const &ar_perm, void *str, bool do_conj) |
| Launcher for the CUDA tensor transposition kernel, std::complex<float> version.
|
|
CUDA transposition kernel implementation header.