Workaround for Intel CPU OpenCL 2025.3 (#5137)

98173c60 · Evan Pretti · GitHub · 2fbed592 · 98173c60 · 98173c60
Unverified Commit 98173c60 authored Nov 13, 2025 by Evan Pretti Committed by GitHub Nov 13, 2025
Hide whitespace changes
Inline Side-by-side

Showing with 8 additions and 0 deletions

platforms/opencl/src/OpenCLFFT3D.cpp platforms/opencl/src/OpenCLFFT3D.cpp +2 -0

platforms/opencl/tests/TestOpenCLFFT.cpp platforms/opencl/tests/TestOpenCLFFT.cpp +6 -0

No files found.
--- a/platforms/opencl/src/OpenCLFFT3D.cpp
+++ b/platforms/opencl/src/OpenCLFFT3D.cpp
@@ -59,6 +59,8 @@ OpenCLFFT3D::OpenCLFFT3D(OpenCLContext& context, int xsize, int ysize, int zsize
    if (platformVendor.size() >= 5 && platformVendor.substr(0, 5) == "Intel") {
        // Intel's OpenCL uses low accuracy trig functions, so tell VkFFT to use lookup tables instead.
        config.useLUT = 1;
+        // Version 2025.3 of Intel's OpenCL generates incorrect results when Y and Z sizes are 33 or 39; this is a workaround.
+        config.fixMinRaderPrimeMult = 11;
    }
    VkFFTResult result = initializeVkFFT(&app, config);
    if (result != VKFFT_SUCCESS)

--- a/platforms/opencl/tests/TestOpenCLFFT.cpp
+++ b/platforms/opencl/tests/TestOpenCLFFT.cpp
@@ -122,6 +122,9 @@ int main(int argc, char* argv[]) {
            testTransform<mm_double2>(true, 25, 28, 25);
            testTransform<mm_double2>(true, 25, 25, 28);
            testTransform<mm_double2>(true, 21, 25, 27);
+            testTransform<mm_double2>(true, 32, 33, 33);
+            testTransform<mm_double2>(true, 32, 33, 39);
+            testTransform<mm_double2>(true, 32, 39, 39);
        }
        else {
            testTransform<mm_float2>(false, 28, 25, 30);
@@ -129,6 +132,9 @@ int main(int argc, char* argv[]) {
            testTransform<mm_float2>(true, 25, 28, 25);
            testTransform<mm_float2>(true, 25, 25, 28);
            testTransform<mm_float2>(true, 21, 25, 27);
+            testTransform<mm_float2>(true, 32, 33, 33);
+            testTransform<mm_float2>(true, 32, 33, 39);
+            testTransform<mm_float2>(true, 32, 39, 39);
        }
    }
    catch(const exception& e) {