"csrc/gfx93/decode/sparse_fp8/splitkv_mla.cuh" did not exist on "620f8769a112358b4fb4be170901d55687d26388"
Commit 16f10eff authored by one
Browse files

tune computeNonbonded launch params

parent 9c6732f0
...@@ -65,16 +65,15 @@ HipNonbondedUtilities::HipNonbondedUtilities(HipContext& context) : context(cont ...@@ -65,16 +65,15 @@ HipNonbondedUtilities::HipNonbondedUtilities(HipContext& context) : context(cont
string errorMessage = "Error initializing nonbonded utilities"; string errorMessage = "Error initializing nonbonded utilities";
CHECK_RESULT(hipEventCreateWithFlags(&downloadCountEvent, context.getEventFlags())); CHECK_RESULT(hipEventCreateWithFlags(&downloadCountEvent, context.getEventFlags()));
CHECK_RESULT(hipHostMalloc((void**) &pinnedCountBuffer, 2*sizeof(unsigned int), context.getHostMallocFlags())); CHECK_RESULT(hipHostMalloc((void**) &pinnedCountBuffer, 2*sizeof(unsigned int), context.getHostMallocFlags()));
numForceThreadBlocks = 5*4*context.getMultiprocessors(); numForceThreadBlocks = 16*4*context.getMultiprocessors();
forceThreadBlockSize = 64; forceThreadBlockSize = 256;
findInteractingBlocksThreadBlockSize = context.getSIMDWidth(); findInteractingBlocksThreadBlockSize = 128;
// When building the neighbor list, we can optionally use large blocks (32 * warpSize atoms) to // When building the neighbor list, we can optionally use large blocks (32 * warpSize atoms) to
// accelerate the process. This makes building the neighbor list faster, but it prevents // accelerate the process. This makes building the neighbor list faster, but it prevents
// us from sorting atom blocks by size, which leads to a slightly less efficient neighbor // us from sorting atom blocks by size, which leads to a slightly less efficient neighbor
// list. We guess based on system size which will be faster. // list. We guess based on system size which will be faster.
useLargeBlocks = false;
useLargeBlocks = (context.getNumAtoms() > 90000);
setKernelSource(HipKernelSources::nonbonded); setKernelSource(HipKernelSources::nonbonded);
} }
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment