Commit bf7efca6 authored by peastman
Browse files

Merge pull request #1051 from peastman/ffterror

Fixed potential compilation error in CUDA FFT
parents 5b074f80 3fd5e2c5
...@@ -169,7 +169,7 @@ static int getSmallestRadix(int size) { ...@@ -169,7 +169,7 @@ static int getSmallestRadix(int size) {
} }
CUfunction CudaFFT3D::createKernel(int xsize, int ysize, int zsize, int& threads, int axis, bool forward, bool inputIsReal) { CUfunction CudaFFT3D::createKernel(int xsize, int ysize, int zsize, int& threads, int axis, bool forward, bool inputIsReal) {
int maxThreads = 256; int maxThreads = (context.getUseDoublePrecision() ? 128 : 256);
// while (maxThreads > 128 && maxThreads-64 >= zsize) // while (maxThreads > 128 && maxThreads-64 >= zsize)
// maxThreads -= 64; // maxThreads -= 64;
int threadsPerBlock = zsize/getSmallestRadix(zsize); int threadsPerBlock = zsize/getSmallestRadix(zsize);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment