Commit 2bce659f authored by Peter Eastman
Browse files

Increased block sizes on Fermi

parent 75f74def
......@@ -784,7 +784,7 @@ void cudaComputeAmoebaElectrostatic( amoebaGpuContext amoebaGpu )
if( threadsPerBlock == 0 ){
unsigned int maxThreads;
if (gpu->sm_version >= SM_20)
-maxThreads = 256;
+maxThreads = 384;
else if (gpu->sm_version >= SM_12)
maxThreads = 128;
else
......
......@@ -28,7 +28,7 @@
__global__
#if (__CUDA_ARCH__ >= 200)
-__launch_bounds__(256, 1)
+__launch_bounds__(384, 1)
#elif (__CUDA_ARCH__ >= 130)
__launch_bounds__(128, 1)
#else
......
......@@ -1886,7 +1886,7 @@ void kCalculateAmoebaKirkwood( amoebaGpuContext amoebaGpu )
if( threadsPerBlock == 0 ){
unsigned int maxThreads;
if (gpu->sm_version >= SM_20)
-maxThreads = 256;
+maxThreads = 512;
else if (gpu->sm_version >= SM_12)
maxThreads = 128;
else
......
......@@ -28,7 +28,7 @@
__global__
#if (__CUDA_ARCH__ >= 200)
-__launch_bounds__(256, 1)
+__launch_bounds__(512, 1)
#elif (__CUDA_ARCH__ >= 130)
__launch_bounds__(128, 1)
#else
......
......@@ -1054,7 +1054,7 @@ void kCalculateAmoebaKirkwoodEDiff( amoebaGpuContext amoebaGpu )
if( threadsPerBlock == 0 ){
unsigned int maxThreads;
if (gpu->sm_version >= SM_20)
-maxThreads = 192;
+maxThreads = 384;
else if (gpu->sm_version >= SM_12)
maxThreads = 96;
else
......
......@@ -28,7 +28,7 @@
__global__
#if (__CUDA_ARCH__ >= 200)
-__launch_bounds__(192, 1)
+__launch_bounds__(384, 1)
#elif (__CUDA_ARCH__ >= 130)
__launch_bounds__(96, 1)
#else
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment