SHAFFT 1.1.0-alpha
A Scalable High-dimensional Accelerated FFT Library
Loading...
Searching...
No Matches
example_portable.cpp

Backend-portable SHAFFT C++ example using FFTND.

#include <shafft/shafft.hpp>
#include <cstdio>
#include <mpi.h>
#include <vector>
int main(int argc, char** argv) {
MPI_Init(&argc, &argv);
// MPI setup
int rank = 0;
MPI_Comm_rank(MPI_COMM_WORLD, &rank);
[[maybe_unused]] int rc;
constexpr int ndim = 3;
constexpr int printCount = 4;
std::vector<size_t> dims = {64, 64, 32};
// Get configuration
std::vector<int> commDims(ndim, 0);
std::vector<size_t> subsize(ndim), offset(ndim);
int nda = 0, commSize;
commDims,
nda,
subsize,
offset,
commSize,
0,
MPI_COMM_WORLD);
// Create and plan FFT
rc = fft.init(commDims, dims, shafft::FFTType::C2C, MPI_COMM_WORLD);
rc = fft.plan();
size_t allocSize = fft.allocSize();
size_t localElems = subsize[0] * subsize[1] * subsize[2];
// Allocate buffers
shafft::complexf *data = nullptr, *work = nullptr;
rc = shafft::allocBuffer(allocSize, &data);
rc = shafft::allocBuffer(allocSize, &work);
// Initialize: delta function at origin (rank 0, index 0)
std::vector<shafft::complexf> host(allocSize, {0.0f, 0.0f});
if (rank == 0 && localElems > 0)
host[0] = {1.0f, 0.0f};
rc = shafft::copyToBuffer(data, host.data(), allocSize);
rc = fft.setBuffers(data, work);
// Forward FFT
rc = fft.normalize();
// Retrieve spectrum
shafft::complexf *curData, *curWork;
rc = fft.getBuffers(&curData, &curWork);
std::vector<shafft::complexf> spectrum(allocSize);
rc = shafft::copyFromBuffer(spectrum.data(), curData, allocSize);
if (rank == 0) {
std::printf("Spectrum[0..%d] =", printCount - 1);
for (int i = 0; i < printCount; ++i)
std::printf(" (%g,%g)", spectrum[i].real(), spectrum[i].imag());
std::printf("\n");
}
// Backward FFT
rc = fft.normalize();
// Retrieve result
rc = fft.getBuffers(&curData, &curWork);
std::vector<shafft::complexf> result(allocSize);
rc = shafft::copyFromBuffer(result.data(), curData, allocSize);
if (rank == 0) {
std::printf("Result[0..%d] =", printCount - 1);
for (int i = 0; i < printCount; ++i)
std::printf(" (%g,%g)", result[i].real(), result[i].imag());
std::printf("\n");
}
// Cleanup
rc = shafft::freeBuffer(data);
rc = shafft::freeBuffer(work);
fft.release();
MPI_Finalize();
return 0;
}
N-dimensional distributed FFT plan with RAII semantics.
Definition shafft.hpp:51
int init(const std::vector< int > &commDims, const std::vector< size_t > &dimensions, FFTType type, MPI_Comm comm, TransformLayout output=TransformLayout::REDISTRIBUTED) noexcept
Initialize plan with Cartesian process grid.
int normalize() noexcept override
Apply symmetric normalization (1/sqrt(N) per transform).
int plan() noexcept override
Create backend FFT plans.
int execute(FFTDirection direction) noexcept override
Execute the FFT.
size_t allocSize() const noexcept override
Get required buffer size in complex elements.
int getBuffers(complexf **data, complexf **work) noexcept
Retrieve current buffer pointers.
void release() noexcept override
Release all internal resources.
int setBuffers(complexf *data, complexf *work) noexcept
Attach data and work buffers.
int freeBuffer(complexf *buf) noexcept
Free buffer allocated with allocBuffer().
int copyToBuffer(complexf *dst, const complexf *src, size_t count) noexcept
Copy from host to SHAFFT buffer.
int allocBuffer(size_t count, complexf **buf) noexcept
Allocate buffer for the current backend.
int copyFromBuffer(complexf *dst, const complexf *src, size_t count) noexcept
Copy from SHAFFT buffer to host.
std::complex< float > complexf
Single-precision complex type (std::complex<float>).
Definition shafft_types.hpp:71
int configurationND(const std::vector< size_t > &size, FFTType precision, std::vector< int > &commDims, int &nda, std::vector< size_t > &subsize, std::vector< size_t > &offset, int &commSize, DecompositionStrategy strategy, size_t memLimit, MPI_Comm comm)
Compute process grid and local layout for N-D distributed FFT.
@ C2C
Single-precision complex-to-complex (float).
@ MINIMIZE_NDA
Minimize distributed axes.
@ BACKWARD
Backward/inverse transform (frequency to time domain).
@ FORWARD
Forward transform (time to frequency domain).