Commit 3fd5e2c5 authored by Peter Eastman
Browse files

Fixed potential compilation error in CUDA FFT

parent 363406d1
...@@ -169,7 +169,7 @@ static int getSmallestRadix(int size) { ...@@ -169,7 +169,7 @@ static int getSmallestRadix(int size) {
} }
CUfunction CudaFFT3D::createKernel(int xsize, int ysize, int zsize, int& threads, int axis, bool forward, bool inputIsReal) { CUfunction CudaFFT3D::createKernel(int xsize, int ysize, int zsize, int& threads, int axis, bool forward, bool inputIsReal) {
int maxThreads = 256; int maxThreads = (context.getUseDoublePrecision() ? 128 : 256);
// while (maxThreads > 128 && maxThreads-64 >= zsize) // while (maxThreads > 128 && maxThreads-64 >= zsize)
// maxThreads -= 64; // maxThreads -= 64;
int threadsPerBlock = zsize/getSmallestRadix(zsize); int threadsPerBlock = zsize/getSmallestRadix(zsize);
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment