void syten::CudaDenseTensorImpl::cuda_transpose_impl(
    CudaConstSpan< Scalar > inp,
    CudaMutSpan< Scalar > out,
    ConstSpan< Index > in_perm,
    ConstSpan< Index > in_dim,
    Conj do_conj = Conj::n(),
    bool do_checks = true,
    std::index_sequence< Ranks... > = {}
)

Implementation of the CUDA tensor transposition routines, to be called only from cuda_transpose().