Backend-portable SHAFFT C++ example using FFTND.
#include <shafft/shafft.hpp>
#include <cstdio>
#include <mpi.h>
#include <vector>
int main(int argc, char** argv) {
MPI_Init(&argc, &argv);
int rank = 0;
MPI_Comm_rank(MPI_COMM_WORLD, &rank);
[[maybe_unused]] int rc;
constexpr int ndim = 3;
constexpr int printCount = 4;
std::vector<size_t> dims = {64, 64, 32};
std::vector<int> commDims(ndim, 0);
std::vector<size_t> subsize(ndim), offset(ndim);
int nda = 0, commSize;
commDims,
nda,
subsize,
offset,
commSize,
0,
MPI_COMM_WORLD);
size_t localElems = subsize[0] * subsize[1] * subsize[2];
std::vector<shafft::complexf> host(allocSize, {0.0f, 0.0f});
if (rank == 0 && localElems > 0)
host[0] = {1.0f, 0.0f};
std::vector<shafft::complexf> spectrum(allocSize);
if (rank == 0) {
std::printf("Spectrum[0..%d] =", printCount - 1);
for (int i = 0; i < printCount; ++i)
std::printf(" (%g,%g)", spectrum[i].real(), spectrum[i].imag());
std::printf("\n");
}
std::vector<shafft::complexf> result(allocSize);
if (rank == 0) {
std::printf("Result[0..%d] =", printCount - 1);
for (int i = 0; i < printCount; ++i)
std::printf(" (%g,%g)", result[i].real(), result[i].imag());
std::printf("\n");
}
MPI_Finalize();
return 0;
}
N-dimensional distributed FFT plan with RAII semantics.
Definition shafft.hpp:51
int init(const std::vector< int > &commDims, const std::vector< size_t > &dimensions, FFTType type, MPI_Comm comm, TransformLayout output=TransformLayout::REDISTRIBUTED) noexcept
Initialize plan with Cartesian process grid.
int normalize() noexcept override
Apply symmetric normalization (1/sqrt(N) per transform).
int plan() noexcept override
Create backend FFT plans.
int execute(FFTDirection direction) noexcept override
Execute the FFT.
size_t allocSize() const noexcept override
Get required buffer size in complex elements.
int getBuffers(complexf **data, complexf **work) noexcept
Retrieve current buffer pointers.
void release() noexcept override
Release all internal resources.
int setBuffers(complexf *data, complexf *work) noexcept
Attach data and work buffers.
int freeBuffer(complexf *buf) noexcept
Free buffer allocated with allocBuffer().
int copyToBuffer(complexf *dst, const complexf *src, size_t count) noexcept
Copy from host to SHAFFT buffer.
int allocBuffer(size_t count, complexf **buf) noexcept
Allocate buffer for the current backend.
int copyFromBuffer(complexf *dst, const complexf *src, size_t count) noexcept
Copy from SHAFFT buffer to host.
std::complex< float > complexf
Single-precision complex type (std::complex<float>).
Definition shafft_types.hpp:71
int configurationND(const std::vector< size_t > &size, FFTType precision, std::vector< int > &commDims, int &nda, std::vector< size_t > &subsize, std::vector< size_t > &offset, int &commSize, DecompositionStrategy strategy, size_t memLimit, MPI_Comm comm)
Compute process grid and local layout for N-D distributed FFT.
FFTType::C2C
Single-precision complex-to-complex (float).
DecompositionStrategy::MINIMIZE_NDA
Minimize distributed axes.
FFTDirection::BACKWARD
Backward/inverse transform (frequency to time domain).
FFTDirection::FORWARD
Forward transform (time to frequency domain).