mirror of
https://github.com/paboyle/Grid.git
synced 2026-06-12 23:23:10 +01:00
FFT: use host stack buffer in PlanCreate, not deviceVector
Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
@@ -275,8 +275,10 @@ public:
|
|||||||
|
|
||||||
// GPU backends (cuFFT/hipFFT) ignore the buffer pointer at plan creation.
|
// GPU backends (cuFFT/hipFFT) ignore the buffer pointer at plan creation.
|
||||||
// CPU FFTW with FFTW_ESTIMATE inspects only alignment and never touches data.
|
// CPU FFTW with FFTW_ESTIMATE inspects only alignment and never touches data.
|
||||||
deviceVector<scalar> dummy(2);
|
// Use a host stack buffer: a device allocation here triggers a rocFFT runtime-compilation (RTC)
|
||||||
FFTW_scalar *buf = (FFTW_scalar *)&dummy[0];
|
// bug on ROCm 7 that causes plan creation to fail for small transform sizes.
|
||||||
|
scalar stack_dummy[2] = {};
|
||||||
|
FFTW_scalar *buf = (FFTW_scalar *)stack_dummy;
|
||||||
|
|
||||||
{
|
{
|
||||||
FFTW_plan p = FFTW<scalar>::fftw_plan_many_dft(
|
FFTW_plan p = FFTW<scalar>::fftw_plan_many_dft(
|
||||||
|
|||||||
Reference in New Issue
Block a user