Highly Efficient FFT for Exascale: HeFFTe v2.4
GPU version of the transpose packer.
#include <heffte_backend_cuda.h>
Public Member Functions
template<typename scalar_type, typename index>
void pack (cudaStream_t stream, pack_plan_3d< index > const &plan, scalar_type const data[], scalar_type buffer[]) const
Execute the planned pack operation.
template<typename scalar_type, typename index>
void unpack (cudaStream_t stream, pack_plan_3d< index > const &plan, scalar_type const buffer[], scalar_type data[]) const
Execute the planned transpose-unpack operation.
template<typename scalar_type, typename index>
void pack (sycl::queue &stream, pack_plan_3d< index > const &plan, scalar_type const data[], scalar_type buffer[]) const
Execute the planned pack operation.
template<typename scalar_type, typename index>
void unpack (sycl::queue &stream, pack_plan_3d< index > const &plan, scalar_type const buffer[], scalar_type data[]) const
Execute the planned transpose-unpack operation.
template<typename scalar_type, typename index>
void pack (hipStream_t stream, pack_plan_3d< index > const &plan, scalar_type const data[], scalar_type buffer[]) const
Execute the planned pack operation.
template<typename scalar_type, typename index>
void unpack (hipStream_t stream, pack_plan_3d< index > const &plan, scalar_type const buffer[], scalar_type data[]) const
Execute the planned transpose-unpack operation.
GPU version of the transpose packer.