void syten::CudaDenseTensorImpl::cuda_mm_cm(
    CudaPtr< const float > at,
    CudaPtr< const float > bt,
    CudaPtr< float > rt,
    Size const dx,
    Size const dy,
    Size const dz
)
Matrix-matrix multiplication of real single-precision (float) matrices on CUDA.
References syten::Cuda::CudaPtr< T >::get(), syten::Cuda::get_handle(), syten::Cuda::handle_error(), syten::Cuda::host_device(), syten::DenseProduct::mm_cm(), and SYTEN_ASSERT_MSG.