void syten::CudaDenseTensorImpl::cuda_transpose_impl(
    CudaConstSpan< Scalar > inp,
    CudaMutSpan< Scalar > out,
    ConstSpan< Index > in_perm,
    ConstSpan< Index > in_dim,
    Conj do_conj = Conj::n(),
    bool do_checks = true,
    std::index_sequence< Ranks... > = {}
)
Implementation of the CUDA tensor transposition routines, to be called only from cuda_transpose().