/* -------------------------------------------------------------------------- * * OpenMM * * -------------------------------------------------------------------------- * * This is part of the OpenMM molecular simulation toolkit originating from * * Simbios, the NIH National Center for Physics-Based Simulation of * * Biological Structures at Stanford, funded under the NIH Roadmap for * * Medical Research, grant U54 GM072970. See https://simtk.org. * * * * Portions copyright (c) 2011-2012 Stanford University and the Authors. * * Authors: Peter Eastman * * Contributors: * * * * This program is free software: you can redistribute it and/or modify * * it under the terms of the GNU Lesser General Public License as published * * by the Free Software Foundation, either version 3 of the License, or * * (at your option) any later version. * * * * This program is distributed in the hope that it will be useful, * * but WITHOUT ANY WARRANTY; without even the implied warranty of * * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * * GNU Lesser General Public License for more details. * * * * You should have received a copy of the GNU Lesser General Public License * * along with this program. If not, see . * * -------------------------------------------------------------------------- */ #include "CudaBondedUtilities.h" #include "CudaExpressionUtilities.h" #include "CudaKernelSources.h" #include "openmm/OpenMMException.h" #include "CudaNonbondedUtilities.h" #include using namespace OpenMM; using namespace std; CudaBondedUtilities::CudaBondedUtilities(CudaContext& context) : context(context), numForceBuffers(0), maxBonds(0), hasInitializedKernels(false) { } CudaBondedUtilities::~CudaBondedUtilities() { for (int i = 0; i < (int) atomIndices.size(); i++) for (int j = 0; j < (int) atomIndices[i].size(); j++) delete atomIndices[i][j]; } void CudaBondedUtilities::addInteraction(const vector >& atoms, const string& source, int group) { if (atoms.size() > 0) { forceAtoms.push_back(atoms); forceSource.push_back(source); forceGroup.push_back(group); } } std::string CudaBondedUtilities::addArgument(CUdeviceptr data, const string& type) { arguments.push_back(data); argTypes.push_back(type); return "customArg"+context.intToString(arguments.size()); } void CudaBondedUtilities::addPrefixCode(const string& source) { for (int i = 0; i < (int) prefixCode.size(); i++) if (prefixCode[i] == source) return; prefixCode.push_back(source); } void CudaBondedUtilities::initialize(const System& system) { int numForces = forceAtoms.size(); hasInteractions = (numForces > 0); if (!hasInteractions) return; // Build the lists of atom indices. atomIndices.resize(numForces); for (int i = 0; i < numForces; i++) { int numBonds = forceAtoms[i].size(); int numAtoms = forceAtoms[i][0].size(); int startAtom = 0; while (startAtom < numAtoms) { int width = min(numAtoms-startAtom, 4); int paddedWidth = (width == 3 ? 4 : width); vector indexVec(paddedWidth*numBonds); for (int bond = 0; bond < numBonds; bond++) { for (int atom = 0; atom < width; atom++) indexVec[bond*paddedWidth+atom] = forceAtoms[i][bond][startAtom+atom]; } CudaArray* indices = new CudaArray(context, numBonds, 4*paddedWidth, "bondedIndices"); indices->upload(&indexVec[0]); atomIndices[i].push_back(indices); startAtom += width; } } // Create the kernel. stringstream s; s<getElementSize()/4; string indexType = "uint"+context.intToString(indexWidth); s<<", const "< defines; defines["PADDED_NUM_ATOMS"] = context.intToString(context.getPaddedNumAtoms()); CUmodule module = context.createModule(s.str(), defines); kernel = context.getKernel(module, "computeBondedForces"); forceAtoms.clear(); forceSource.clear(); } string CudaBondedUtilities::createForceSource(int forceIndex, int numBonds, int numAtoms, int group, const string& computeForce) { maxBonds = max(maxBonds, numBonds); string suffix[] = {".x", ".y", ".z", ".w"}; stringstream s; s<<"if ((groups&"<<(1<getElementSize()/4; string indexType = "uint"+context.intToString(indexWidth); s<<" "<((long long) (force"<<(i+1)<<".x*0xFFFFFFFF)));\n"; s<<" atomicAdd(&forceBuffer[atom"<<(i+1)<<"+PADDED_NUM_ATOMS], static_cast((long long) (force"<<(i+1)<<".y*0xFFFFFFFF)));\n"; s<<" atomicAdd(&forceBuffer[atom"<<(i+1)<<"+PADDED_NUM_ATOMS*2], static_cast((long long) (force"<<(i+1)<<".z*0xFFFFFFFF)));\n"; s<<" __threadfence_block();\n"; } s<<"}\n"; return s.str(); } void CudaBondedUtilities::computeInteractions(int groups) { if (!hasInitializedKernels) { hasInitializedKernels = true; kernelArgs.push_back(&context.getForce().getDevicePointer()); kernelArgs.push_back(&context.getEnergyBuffer().getDevicePointer()); kernelArgs.push_back(&context.getPosq().getDevicePointer()); kernelArgs.push_back(NULL); for (int i = 0; i < (int) atomIndices.size(); i++) for (int j = 0; j < (int) atomIndices[i].size(); j++) kernelArgs.push_back(&atomIndices[i][j]->getDevicePointer()); for (int i = 0; i < (int) arguments.size(); i++) kernelArgs.push_back(&arguments[i]); } if (!hasInteractions) return; kernelArgs[3] = &groups; context.executeKernel(kernel, &kernelArgs[0], maxBonds); }