/* -------------------------------------------------------------------------- * * OpenMM * * -------------------------------------------------------------------------- * * This is part of the OpenMM molecular simulation toolkit originating from * * Simbios, the NIH National Center for Physics-Based Simulation of * * Biological Structures at Stanford, funded under the NIH Roadmap for * * Medical Research, grant U54 GM072970. See https://simtk.org. * * * * Portions copyright (c) 2008-2024 Stanford University and the Authors. * * Authors: Peter Eastman * * Contributors: * * * * This program is free software: you can redistribute it and/or modify * * it under the terms of the GNU Lesser General Public License as published * * by the Free Software Foundation, either version 3 of the License, or * * (at your option) any later version. * * * * This program is distributed in the hope that it will be useful, * * but WITHOUT ANY WARRANTY; without even the implied warranty of * * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * * GNU Lesser General Public License for more details. * * * * You should have received a copy of the GNU Lesser General Public License * * along with this program. If not, see <http://www.gnu.org/licenses/>. 
* * -------------------------------------------------------------------------- */ #include "openmm/common/CommonKernels.h" #include "openmm/common/ContextSelector.h" #include "openmm/common/ExpressionUtilities.h" #include "openmm/Context.h" #include "openmm/internal/AndersenThermostatImpl.h" #include "openmm/internal/CMAPTorsionForceImpl.h" #include "openmm/internal/ContextImpl.h" #include "openmm/internal/CustomCentroidBondForceImpl.h" #include "openmm/internal/CustomCompoundBondForceImpl.h" #include "openmm/internal/CustomHbondForceImpl.h" #include "openmm/internal/CustomManyParticleForceImpl.h" #include "openmm/internal/timer.h" #include "CommonKernelSources.h" #include "lepton/CustomFunction.h" #include "lepton/ExpressionTreeNode.h" #include "lepton/Operation.h" #include "lepton/Parser.h" #include "lepton/ParsedExpression.h" #include "ReferenceTabulatedFunction.h" #include "SimTKOpenMMRealType.h" #include "SimTKOpenMMUtilities.h" #include "jama_eig.h" #include #include #include #include using namespace OpenMM; using namespace std; using namespace Lepton; static void setPeriodicBoxArgs(ComputeContext& cc, ComputeKernel kernel, int index) { Vec3 a, b, c; cc.getPeriodicBoxVectors(a, b, c); if (cc.getUseDoublePrecision()) { kernel->setArg(index++, mm_double4(a[0], b[1], c[2], 0.0)); kernel->setArg(index++, mm_double4(1.0/a[0], 1.0/b[1], 1.0/c[2], 0.0)); kernel->setArg(index++, mm_double4(a[0], a[1], a[2], 0.0)); kernel->setArg(index++, mm_double4(b[0], b[1], b[2], 0.0)); kernel->setArg(index, mm_double4(c[0], c[1], c[2], 0.0)); } else { kernel->setArg(index++, mm_float4((float) a[0], (float) b[1], (float) c[2], 0.0f)); kernel->setArg(index++, mm_float4(1.0f/(float) a[0], 1.0f/(float) b[1], 1.0f/(float) c[2], 0.0f)); kernel->setArg(index++, mm_float4((float) a[0], (float) a[1], (float) a[2], 0.0f)); kernel->setArg(index++, mm_float4((float) b[0], (float) b[1], (float) b[2], 0.0f)); kernel->setArg(index, mm_float4((float) c[0], (float) c[1], (float) c[2], 0.0f)); } } 
static bool isZeroExpression(const Lepton::ParsedExpression& expression) { const Lepton::Operation& op = expression.getRootNode().getOperation(); if (op.getId() != Lepton::Operation::CONSTANT) return false; return (dynamic_cast(op).getValue() == 0.0); } static bool usesVariable(const Lepton::ExpressionTreeNode& node, const string& variable) { const Lepton::Operation& op = node.getOperation(); if (op.getId() == Lepton::Operation::VARIABLE && op.getName() == variable) return true; for (auto& child : node.getChildren()) if (usesVariable(child, variable)) return true; return false; } static bool usesVariable(const Lepton::ParsedExpression& expression, const string& variable) { return usesVariable(expression.getRootNode(), variable); } static pair makeVariable(const string& name, const string& value) { return make_pair(ExpressionTreeNode(new Operation::Variable(name)), value); } static void flushPeriodically(ComputeContext& cc) { #ifdef WIN32 // When running on Windows, we periodically flush the queue to keep the UI responsive. 
static double lastTime = getCurrentTime(); double currentTime = getCurrentTime(); if (currentTime-lastTime > 0.025) { cc.flushQueue(); lastTime = currentTime; } #endif } void CommonUpdateStateDataKernel::initialize(const System& system) { } double CommonUpdateStateDataKernel::getTime(const ContextImpl& context) const { return cc.getTime(); } void CommonUpdateStateDataKernel::setTime(ContextImpl& context, double time) { for (auto ctx : cc.getAllContexts()) ctx->setTime(time); } long long CommonUpdateStateDataKernel::getStepCount(const ContextImpl& context) const { return cc.getStepCount(); } void CommonUpdateStateDataKernel::setStepCount(const ContextImpl& context, long long count) { for (auto ctx : cc.getAllContexts()) ctx->setStepCount(count); } void CommonUpdateStateDataKernel::getPositions(ContextImpl& context, vector& positions) { ContextSelector selector(cc); int numParticles = context.getSystem().getNumParticles(); positions.resize(numParticles); vector posCorrection; if (cc.getUseDoublePrecision()) { mm_double4* posq = (mm_double4*) cc.getPinnedBuffer(); cc.getPosq().download(posq); } else if (cc.getUseMixedPrecision()) { mm_float4* posq = (mm_float4*) cc.getPinnedBuffer(); cc.getPosq().download(posq, false); posCorrection.resize(numParticles); cc.getPosqCorrection().download(posCorrection); } else { mm_float4* posq = (mm_float4*) cc.getPinnedBuffer(); cc.getPosq().download(posq); } // Filling in the output array is done in parallel for speed. cc.getThreadPool().execute([&] (ThreadPool& threads, int threadIndex) { // Compute the position of each particle to return to the user. This is done in parallel for speed. 
const vector& order = cc.getAtomIndex(); int numParticles = cc.getNumAtoms(); Vec3 boxVectors[3]; cc.getPeriodicBoxVectors(boxVectors[0], boxVectors[1], boxVectors[2]); int numThreads = threads.getNumThreads(); int start = threadIndex*numParticles/numThreads; int end = (threadIndex+1)*numParticles/numThreads; if (cc.getUseDoublePrecision()) { mm_double4* posq = (mm_double4*) cc.getPinnedBuffer(); for (int i = start; i < end; ++i) { mm_double4 pos = posq[i]; mm_int4 offset = cc.getPosCellOffsets()[i]; positions[order[i]] = Vec3(pos.x, pos.y, pos.z)-boxVectors[0]*offset.x-boxVectors[1]*offset.y-boxVectors[2]*offset.z; } } else if (cc.getUseMixedPrecision()) { mm_float4* posq = (mm_float4*) cc.getPinnedBuffer(); for (int i = start; i < end; ++i) { mm_float4 pos1 = posq[i]; mm_float4 pos2 = posCorrection[i]; mm_int4 offset = cc.getPosCellOffsets()[i]; positions[order[i]] = Vec3((double)pos1.x+(double)pos2.x, (double)pos1.y+(double)pos2.y, (double)pos1.z+(double)pos2.z)-boxVectors[0]*offset.x-boxVectors[1]*offset.y-boxVectors[2]*offset.z; } } else { mm_float4* posq = (mm_float4*) cc.getPinnedBuffer(); for (int i = start; i < end; ++i) { mm_float4 pos = posq[i]; mm_int4 offset = cc.getPosCellOffsets()[i]; positions[order[i]] = Vec3(pos.x, pos.y, pos.z)-boxVectors[0]*offset.x-boxVectors[1]*offset.y-boxVectors[2]*offset.z; } } }); cc.getThreadPool().waitForThreads(); } void CommonUpdateStateDataKernel::setPositions(ContextImpl& context, const vector& positions) { ContextSelector selector(cc); const vector& order = cc.getAtomIndex(); int numParticles = context.getSystem().getNumParticles(); if (cc.getUseDoublePrecision()) { mm_double4* posq = (mm_double4*) cc.getPinnedBuffer(); cc.getPosq().download(posq); for (int i = 0; i < numParticles; ++i) { mm_double4& pos = posq[i]; const Vec3& p = positions[order[i]]; pos.x = p[0]; pos.y = p[1]; pos.z = p[2]; } for (int i = numParticles; i < cc.getPaddedNumAtoms(); i++) posq[i] = mm_double4(0.0, 0.0, 0.0, 0.0); 
cc.getPosq().upload(posq); } else { mm_float4* posq = (mm_float4*) cc.getPinnedBuffer(); cc.getPosq().download(posq); for (int i = 0; i < numParticles; ++i) { mm_float4& pos = posq[i]; const Vec3& p = positions[order[i]]; pos.x = (float) p[0]; pos.y = (float) p[1]; pos.z = (float) p[2]; } for (int i = numParticles; i < cc.getPaddedNumAtoms(); i++) posq[i] = mm_float4(0.0f, 0.0f, 0.0f, 0.0f); cc.getPosq().upload(posq); } if (cc.getUseMixedPrecision()) { mm_float4* posCorrection = (mm_float4*) cc.getPinnedBuffer(); for (int i = 0; i < numParticles; ++i) { mm_float4& c = posCorrection[i]; const Vec3& p = positions[order[i]]; c.x = (float) (p[0]-(float)p[0]); c.y = (float) (p[1]-(float)p[1]); c.z = (float) (p[2]-(float)p[2]); c.w = 0; } for (int i = numParticles; i < cc.getPaddedNumAtoms(); i++) posCorrection[i] = mm_float4(0.0f, 0.0f, 0.0f, 0.0f); cc.getPosqCorrection().upload(posCorrection); } for (auto& offset : cc.getPosCellOffsets()) offset = mm_int4(0, 0, 0, 0); cc.reorderAtoms(); } void CommonUpdateStateDataKernel::getVelocities(ContextImpl& context, vector& velocities) { ContextSelector selector(cc); const vector& order = cc.getAtomIndex(); int numParticles = context.getSystem().getNumParticles(); velocities.resize(numParticles); if (cc.getUseDoublePrecision() || cc.getUseMixedPrecision()) { mm_double4* velm = (mm_double4*) cc.getPinnedBuffer(); cc.getVelm().download(velm); for (int i = 0; i < numParticles; ++i) { mm_double4 vel = velm[i]; velocities[order[i]] = Vec3(vel.x, vel.y, vel.z); } } else { mm_float4* velm = (mm_float4*) cc.getPinnedBuffer(); cc.getVelm().download(velm); for (int i = 0; i < numParticles; ++i) { mm_float4 vel = velm[i]; velocities[order[i]] = Vec3(vel.x, vel.y, vel.z); } } } void CommonUpdateStateDataKernel::setVelocities(ContextImpl& context, const vector& velocities) { ContextSelector selector(cc); const vector& order = cc.getAtomIndex(); int numParticles = context.getSystem().getNumParticles(); if (cc.getUseDoublePrecision() || 
cc.getUseMixedPrecision()) { mm_double4* velm = (mm_double4*) cc.getPinnedBuffer(); cc.getVelm().download(velm); for (int i = 0; i < numParticles; ++i) { mm_double4& vel = velm[i]; const Vec3& p = velocities[order[i]]; vel.x = p[0]; vel.y = p[1]; vel.z = p[2]; } for (int i = numParticles; i < cc.getPaddedNumAtoms(); i++) velm[i] = mm_double4(0.0, 0.0, 0.0, 0.0); cc.getVelm().upload(velm); } else { mm_float4* velm = (mm_float4*) cc.getPinnedBuffer(); cc.getVelm().download(velm); for (int i = 0; i < numParticles; ++i) { mm_float4& vel = velm[i]; const Vec3& p = velocities[order[i]]; vel.x = p[0]; vel.y = p[1]; vel.z = p[2]; } for (int i = numParticles; i < cc.getPaddedNumAtoms(); i++) velm[i] = mm_float4(0.0f, 0.0f, 0.0f, 0.0f); cc.getVelm().upload(velm); } } void CommonUpdateStateDataKernel::computeShiftedVelocities(ContextImpl& context, double timeShift, vector& velocities) { cc.getIntegrationUtilities().computeShiftedVelocities(timeShift, velocities); } void CommonUpdateStateDataKernel::getForces(ContextImpl& context, vector& forces) { ContextSelector selector(cc); long long* force = (long long*) cc.getPinnedBuffer(); cc.getLongForceBuffer().download(force); const vector& order = cc.getAtomIndex(); int numParticles = context.getSystem().getNumParticles(); int paddedNumParticles = cc.getPaddedNumAtoms(); forces.resize(numParticles); double scale = 1.0/(double) 0x100000000LL; for (int i = 0; i < numParticles; ++i) forces[order[i]] = Vec3(scale*force[i], scale*force[i+paddedNumParticles], scale*force[i+paddedNumParticles*2]); } void CommonUpdateStateDataKernel::getEnergyParameterDerivatives(ContextImpl& context, map& derivs) { ContextSelector selector(cc); const vector& paramDerivNames = cc.getEnergyParamDerivNames(); int numDerivs = paramDerivNames.size(); if (numDerivs == 0) return; derivs = cc.getEnergyParamDerivWorkspace(); ArrayInterface& derivArray = cc.getEnergyParamDerivBuffer(); if (cc.getUseDoublePrecision() || cc.getUseMixedPrecision()) { vector 
derivBuffers; derivArray.download(derivBuffers); for (int i = numDerivs; i < derivArray.getSize(); i += numDerivs) for (int j = 0; j < numDerivs; j++) derivBuffers[j] += derivBuffers[i+j]; for (int i = 0; i < numDerivs; i++) derivs[paramDerivNames[i]] += derivBuffers[i]; } else { vector derivBuffers; derivArray.download(derivBuffers); for (int i = numDerivs; i < derivArray.getSize(); i += numDerivs) for (int j = 0; j < numDerivs; j++) derivBuffers[j] += derivBuffers[i+j]; for (int i = 0; i < numDerivs; i++) derivs[paramDerivNames[i]] += derivBuffers[i]; } } void CommonUpdateStateDataKernel::getPeriodicBoxVectors(ContextImpl& context, Vec3& a, Vec3& b, Vec3& c) const { cc.getPeriodicBoxVectors(a, b, c); } void CommonUpdateStateDataKernel::setPeriodicBoxVectors(ContextImpl& context, const Vec3& a, const Vec3& b, const Vec3& c) { // If any particles have been wrapped to the first periodic box, we need to unwrap them // to avoid changing their positions. vector positions; for (auto offset : cc.getPosCellOffsets()) { if (offset.x != 0 || offset.y != 0 || offset.z != 0) { getPositions(context, positions); break; } } // Update the vectors. for (auto ctx : cc.getAllContexts()) ctx->setPeriodicBoxVectors(a, b, c); if (positions.size() > 0) setPositions(context, positions); } void CommonUpdateStateDataKernel::createCheckpoint(ContextImpl& context, ostream& stream) { ContextSelector selector(cc); int version = 3; stream.write((char*) &version, sizeof(int)); int precision = (cc.getUseDoublePrecision() ? 2 : cc.getUseMixedPrecision() ? 
1 : 0); stream.write((char*) &precision, sizeof(int)); double time = cc.getTime(); stream.write((char*) &time, sizeof(double)); long long stepCount = cc.getStepCount(); stream.write((char*) &stepCount, sizeof(long long)); int stepsSinceReorder = cc.getStepsSinceReorder(); stream.write((char*) &stepsSinceReorder, sizeof(int)); char* buffer = (char*) cc.getPinnedBuffer(); cc.getPosq().download(buffer); stream.write(buffer, cc.getPosq().getSize()*cc.getPosq().getElementSize()); if (cc.getUseMixedPrecision()) { cc.getPosqCorrection().download(buffer); stream.write(buffer, cc.getPosqCorrection().getSize()*cc.getPosqCorrection().getElementSize()); } cc.getVelm().download(buffer); stream.write(buffer, cc.getVelm().getSize()*cc.getVelm().getElementSize()); stream.write((char*) &cc.getAtomIndex()[0], sizeof(int)*cc.getAtomIndex().size()); stream.write((char*) &cc.getPosCellOffsets()[0], sizeof(mm_int4)*cc.getPosCellOffsets().size()); Vec3 boxVectors[3]; cc.getPeriodicBoxVectors(boxVectors[0], boxVectors[1], boxVectors[2]); stream.write((char*) boxVectors, 3*sizeof(Vec3)); cc.getIntegrationUtilities().createCheckpoint(stream); SimTKOpenMMUtilities::createCheckpoint(stream); } void CommonUpdateStateDataKernel::loadCheckpoint(ContextImpl& context, istream& stream) { ContextSelector selector(cc); int version; stream.read((char*) &version, sizeof(int)); if (version != 3) throw OpenMMException("Checkpoint was created with a different version of OpenMM"); int precision; stream.read((char*) &precision, sizeof(int)); int expectedPrecision = (cc.getUseDoublePrecision() ? 2 : cc.getUseMixedPrecision() ? 
1 : 0); if (precision != expectedPrecision) throw OpenMMException("Checkpoint was created with a different numeric precision"); double time; stream.read((char*) &time, sizeof(double)); long long stepCount; stream.read((char*) &stepCount, sizeof(long long)); int stepsSinceReorder; stream.read((char*) &stepsSinceReorder, sizeof(int)); vector contexts = cc.getAllContexts(); for (auto ctx : contexts) { ctx->setTime(time); ctx->setStepCount(stepCount); ctx->setStepsSinceReorder(stepsSinceReorder); } char* buffer = (char*) cc.getPinnedBuffer(); stream.read(buffer, cc.getPosq().getSize()*cc.getPosq().getElementSize()); cc.getPosq().upload(buffer); if (cc.getUseMixedPrecision()) { stream.read(buffer, cc.getPosqCorrection().getSize()*cc.getPosqCorrection().getElementSize()); cc.getPosqCorrection().upload(buffer); } stream.read(buffer, cc.getVelm().getSize()*cc.getVelm().getElementSize()); cc.getVelm().upload(buffer); stream.read((char*) &cc.getAtomIndex()[0], sizeof(int)*cc.getAtomIndex().size()); cc.getAtomIndexArray().upload(cc.getAtomIndex()); stream.read((char*) &cc.getPosCellOffsets()[0], sizeof(mm_int4)*cc.getPosCellOffsets().size()); Vec3 boxVectors[3]; stream.read((char*) &boxVectors, 3*sizeof(Vec3)); for (auto ctx : contexts) ctx->setPeriodicBoxVectors(boxVectors[0], boxVectors[1], boxVectors[2]); cc.getIntegrationUtilities().loadCheckpoint(stream); SimTKOpenMMUtilities::loadCheckpoint(stream); for (auto listener : cc.getReorderListeners()) listener->execute(); cc.validateAtomOrder(); } void CommonApplyConstraintsKernel::initialize(const System& system) { } void CommonApplyConstraintsKernel::apply(ContextImpl& context, double tol) { ContextSelector selector(cc); if (!hasInitializedKernel) { hasInitializedKernel = true; map defines; ComputeProgram program = cc.compileProgram(CommonKernelSources::constraints, defines); applyDeltasKernel = program->createKernel("applyPositionDeltas"); applyDeltasKernel->addArg(cc.getNumAtoms()); 
applyDeltasKernel->addArg(cc.getPosq()); applyDeltasKernel->addArg(cc.getIntegrationUtilities().getPosDelta()); if (cc.getUseMixedPrecision()) applyDeltasKernel->addArg(cc.getPosqCorrection()); } IntegrationUtilities& integration = cc.getIntegrationUtilities(); cc.clearBuffer(integration.getPosDelta()); integration.applyConstraints(tol); applyDeltasKernel->execute(cc.getNumAtoms()); integration.computeVirtualSites(); } void CommonApplyConstraintsKernel::applyToVelocities(ContextImpl& context, double tol) { cc.getIntegrationUtilities().applyVelocityConstraints(tol); } void CommonVirtualSitesKernel::initialize(const System& system) { } void CommonVirtualSitesKernel::computePositions(ContextImpl& context) { cc.getIntegrationUtilities().computeVirtualSites(); } class CommonCalcHarmonicBondForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const HarmonicBondForce& force) : force(force) { } int getNumParticleGroups() { return force.getNumBonds(); } void getParticlesInGroup(int index, vector& particles) { int particle1, particle2; double length, k; force.getBondParameters(index, particle1, particle2, length, k); particles.resize(2); particles[0] = particle1; particles[1] = particle2; } bool areGroupsIdentical(int group1, int group2) { int particle1, particle2; double length1, length2, k1, k2; force.getBondParameters(group1, particle1, particle2, length1, k1); force.getBondParameters(group2, particle1, particle2, length2, k2); return (length1 == length2 && k1 == k2); } private: const HarmonicBondForce& force; }; void CommonCalcHarmonicBondForceKernel::initialize(const System& system, const HarmonicBondForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumBonds()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumBonds()/numContexts; numBonds = endIndex-startIndex; if (numBonds == 0) return; vector > atoms(numBonds, vector(2)); params.initialize(cc, numBonds, 
"bondParams"); vector paramVector(numBonds); for (int i = 0; i < numBonds; i++) { double length, k; force.getBondParameters(startIndex+i, atoms[i][0], atoms[i][1], length, k); paramVector[i] = mm_float2((float) length, (float) k); } params.upload(paramVector); map replacements; replacements["APPLY_PERIODIC"] = (force.usesPeriodicBoundaryConditions() ? "1" : "0"); replacements["COMPUTE_FORCE"] = CommonKernelSources::harmonicBondForce; replacements["PARAMS"] = cc.getBondedUtilities().addArgument(params, "float2"); cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::bondForce, replacements), force.getForceGroup()); info = new ForceInfo(force); cc.addForce(info); } double CommonCalcHarmonicBondForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { return 0.0; } void CommonCalcHarmonicBondForceKernel::copyParametersToContext(ContextImpl& context, const HarmonicBondForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumBonds()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumBonds()/numContexts; if (numBonds != endIndex-startIndex) throw OpenMMException("updateParametersInContext: The number of bonds has changed"); if (numBonds == 0) return; // Record the per-bond parameters. vector paramVector(numBonds); for (int i = 0; i < numBonds; i++) { int atom1, atom2; double length, k; force.getBondParameters(startIndex+i, atom1, atom2, length, k); paramVector[i] = mm_float2((float) length, (float) k); } params.upload(paramVector); // Mark that the current reordering may be invalid. 
cc.invalidateMolecules(info); } class CommonCalcCustomBondForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const CustomBondForce& force) : force(force) { } int getNumParticleGroups() { return force.getNumBonds(); } void getParticlesInGroup(int index, vector& particles) { int particle1, particle2; thread_local static vector parameters; force.getBondParameters(index, particle1, particle2, parameters); particles.resize(2); particles[0] = particle1; particles[1] = particle2; } bool areGroupsIdentical(int group1, int group2) { int particle1, particle2; thread_local static vector parameters1, parameters2; force.getBondParameters(group1, particle1, particle2, parameters1); force.getBondParameters(group2, particle1, particle2, parameters2); for (int i = 0; i < (int) parameters1.size(); i++) if (parameters1[i] != parameters2[i]) return false; return true; } private: const CustomBondForce& force; }; CommonCalcCustomBondForceKernel::~CommonCalcCustomBondForceKernel() { ContextSelector selector(cc); if (params != NULL) delete params; } void CommonCalcCustomBondForceKernel::initialize(const System& system, const CustomBondForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumBonds()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumBonds()/numContexts; numBonds = endIndex-startIndex; if (numBonds == 0) return; vector > atoms(numBonds, vector(2)); params = new ComputeParameterSet(cc, force.getNumPerBondParameters(), numBonds, "customBondParams"); vector > paramVector(numBonds); for (int i = 0; i < numBonds; i++) force.getBondParameters(startIndex+i, atoms[i][0], atoms[i][1], paramVector[i]); params->setParameterValues(paramVector, true); info = new ForceInfo(force); cc.addForce(info); // Record information for the expressions. 
globalParamNames.resize(force.getNumGlobalParameters()); globalParamValues.resize(force.getNumGlobalParameters()); for (int i = 0; i < force.getNumGlobalParameters(); i++) { globalParamNames[i] = force.getGlobalParameterName(i); globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i); } Lepton::ParsedExpression energyExpression = Lepton::Parser::parse(force.getEnergyFunction()).optimize(); Lepton::ParsedExpression forceExpression = energyExpression.differentiate("r").optimize(); map expressions; expressions["energy += "] = energyExpression; expressions["real dEdR = "] = forceExpression; // Create the kernels. map variables; variables["r"] = "r"; for (int i = 0; i < force.getNumPerBondParameters(); i++) { const string& name = force.getPerBondParameterName(i); variables[name] = "bondParams"+params->getParameterSuffix(i); } if (force.getNumGlobalParameters() > 0) { globals.initialize(cc, force.getNumGlobalParameters(), "customBondGlobals"); globals.upload(globalParamValues); string argName = cc.getBondedUtilities().addArgument(globals, "float"); for (int i = 0; i < force.getNumGlobalParameters(); i++) { const string& name = force.getGlobalParameterName(i); string value = argName+"["+cc.intToString(i)+"]"; variables[name] = value; } } for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { string paramName = force.getEnergyParameterDerivativeName(i); string derivVariable = cc.getBondedUtilities().addEnergyParameterDerivative(paramName); Lepton::ParsedExpression derivExpression = energyExpression.differentiate(paramName).optimize(); expressions[derivVariable+" += "] = derivExpression; } stringstream compute; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& parameter = params->getParameterInfos()[i]; string argName = cc.getBondedUtilities().addArgument(parameter.getArray(), parameter.getType()); compute< functions; vector > functionNames; compute << 
cc.getExpressionUtilities().createExpressions(expressions, variables, functions, functionNames, "temp"); map replacements; replacements["APPLY_PERIODIC"] = (force.usesPeriodicBoundaryConditions() ? "1" : "0"); replacements["COMPUTE_FORCE"] = compute.str(); cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::bondForce, replacements), force.getForceGroup()); } double CommonCalcCustomBondForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { ContextSelector selector(cc); if (globals.isInitialized()) { bool changed = false; for (int i = 0; i < (int) globalParamNames.size(); i++) { float value = (float) context.getParameter(globalParamNames[i]); if (value != globalParamValues[i]) changed = true; globalParamValues[i] = value; } if (changed) globals.upload(globalParamValues); } return 0.0; } void CommonCalcCustomBondForceKernel::copyParametersToContext(ContextImpl& context, const CustomBondForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumBonds()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumBonds()/numContexts; if (numBonds != endIndex-startIndex) throw OpenMMException("updateParametersInContext: The number of bonds has changed"); if (numBonds == 0) return; // Record the per-bond parameters. vector > paramVector(numBonds); int atom1, atom2; for (int i = 0; i < numBonds; i++) force.getBondParameters(startIndex+i, atom1, atom2, paramVector[i]); params->setParameterValues(paramVector, true); // Mark that the current reordering may be invalid. 
cc.invalidateMolecules(info); } class CommonCalcHarmonicAngleForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const HarmonicAngleForce& force) : force(force) { } int getNumParticleGroups() { return force.getNumAngles(); } void getParticlesInGroup(int index, vector& particles) { int particle1, particle2, particle3; double angle, k; force.getAngleParameters(index, particle1, particle2, particle3, angle, k); particles.resize(3); particles[0] = particle1; particles[1] = particle2; particles[2] = particle3; } bool areGroupsIdentical(int group1, int group2) { int particle1, particle2, particle3; double angle1, angle2, k1, k2; force.getAngleParameters(group1, particle1, particle2, particle3, angle1, k1); force.getAngleParameters(group2, particle1, particle2, particle3, angle2, k2); return (angle1 == angle2 && k1 == k2); } private: const HarmonicAngleForce& force; }; void CommonCalcHarmonicAngleForceKernel::initialize(const System& system, const HarmonicAngleForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumAngles()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumAngles()/numContexts; numAngles = endIndex-startIndex; if (numAngles == 0) return; vector > atoms(numAngles, vector(3)); params.initialize(cc, numAngles, "angleParams"); vector paramVector(numAngles); for (int i = 0; i < numAngles; i++) { double angle, k; force.getAngleParameters(startIndex+i, atoms[i][0], atoms[i][1], atoms[i][2], angle, k); paramVector[i] = mm_float2((float) angle, (float) k); } params.upload(paramVector); map replacements; replacements["APPLY_PERIODIC"] = (force.usesPeriodicBoundaryConditions() ? 
"1" : "0"); replacements["COMPUTE_FORCE"] = CommonKernelSources::harmonicAngleForce; replacements["PARAMS"] = cc.getBondedUtilities().addArgument(params, "float2"); cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::angleForce, replacements), force.getForceGroup()); info = new ForceInfo(force); cc.addForce(info); } double CommonCalcHarmonicAngleForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { return 0.0; } void CommonCalcHarmonicAngleForceKernel::copyParametersToContext(ContextImpl& context, const HarmonicAngleForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumAngles()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumAngles()/numContexts; if (numAngles != endIndex-startIndex) throw OpenMMException("updateParametersInContext: The number of angles has changed"); if (numAngles == 0) return; // Record the per-angle parameters. vector paramVector(numAngles); for (int i = 0; i < numAngles; i++) { int atom1, atom2, atom3; double angle, k; force.getAngleParameters(startIndex+i, atom1, atom2, atom3, angle, k); paramVector[i] = mm_float2((float) angle, (float) k); } params.upload(paramVector); // Mark that the current reordering may be invalid. 
cc.invalidateMolecules(); } class CommonCalcCustomAngleForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const CustomAngleForce& force) : force(force) { } int getNumParticleGroups() { return force.getNumAngles(); } void getParticlesInGroup(int index, vector& particles) { int particle1, particle2, particle3; thread_local static vector parameters; force.getAngleParameters(index, particle1, particle2, particle3, parameters); particles.resize(3); particles[0] = particle1; particles[1] = particle2; particles[2] = particle3; } bool areGroupsIdentical(int group1, int group2) { int particle1, particle2, particle3; thread_local static vector parameters1, parameters2; force.getAngleParameters(group1, particle1, particle2, particle3, parameters1); force.getAngleParameters(group2, particle1, particle2, particle3, parameters2); for (int i = 0; i < (int) parameters1.size(); i++) if (parameters1[i] != parameters2[i]) return false; return true; } private: const CustomAngleForce& force; }; CommonCalcCustomAngleForceKernel::~CommonCalcCustomAngleForceKernel() { ContextSelector selector(cc); if (params != NULL) delete params; } void CommonCalcCustomAngleForceKernel::initialize(const System& system, const CustomAngleForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumAngles()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumAngles()/numContexts; numAngles = endIndex-startIndex; if (numAngles == 0) return; vector > atoms(numAngles, vector(3)); params = new ComputeParameterSet(cc, force.getNumPerAngleParameters(), numAngles, "customAngleParams"); vector > paramVector(numAngles); for (int i = 0; i < numAngles; i++) force.getAngleParameters(startIndex+i, atoms[i][0], atoms[i][1], atoms[i][2], paramVector[i]); params->setParameterValues(paramVector, true); info = new ForceInfo(force); cc.addForce(info); // Record information for the expressions. 
globalParamNames.resize(force.getNumGlobalParameters()); globalParamValues.resize(force.getNumGlobalParameters()); for (int i = 0; i < force.getNumGlobalParameters(); i++) { globalParamNames[i] = force.getGlobalParameterName(i); globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i); } Lepton::ParsedExpression energyExpression = Lepton::Parser::parse(force.getEnergyFunction()).optimize(); Lepton::ParsedExpression forceExpression = energyExpression.differentiate("theta").optimize(); map expressions; expressions["energy += "] = energyExpression; expressions["real dEdAngle = "] = forceExpression; // Create the kernels. map variables; variables["theta"] = "theta"; for (int i = 0; i < force.getNumPerAngleParameters(); i++) { const string& name = force.getPerAngleParameterName(i); variables[name] = "angleParams"+params->getParameterSuffix(i); } if (force.getNumGlobalParameters() > 0) { globals.initialize(cc, force.getNumGlobalParameters(), "customAngleGlobals"); globals.upload(globalParamValues); string argName = cc.getBondedUtilities().addArgument(globals, "float"); for (int i = 0; i < force.getNumGlobalParameters(); i++) { const string& name = force.getGlobalParameterName(i); string value = argName+"["+cc.intToString(i)+"]"; variables[name] = value; } } for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { string paramName = force.getEnergyParameterDerivativeName(i); string derivVariable = cc.getBondedUtilities().addEnergyParameterDerivative(paramName); Lepton::ParsedExpression derivExpression = energyExpression.differentiate(paramName).optimize(); expressions[derivVariable+" += "] = derivExpression; } stringstream compute; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& parameter = params->getParameterInfos()[i]; string argName = cc.getBondedUtilities().addArgument(parameter.getArray(), parameter.getType()); compute< functions; vector > functionNames; compute << 
// Continuation of the "compute <<" statement at the end of CommonCalcCustomAngleForceKernel::initialize().
        cc.getExpressionUtilities().createExpressions(expressions, variables, functions, functionNames, "temp");
    // Substitute the generated code into the angle force template and register the interaction.
    map replacements;
    replacements["APPLY_PERIODIC"] = (force.usesPeriodicBoundaryConditions() ? "1" : "0");
    replacements["COMPUTE_FORCE"] = compute.str();
    cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::angleForce, replacements), force.getForceGroup());
}

// Refreshes the device copy of the global parameters when any value differs from the cached one.
// Always returns 0.0 (presumably the energy is accumulated by the interaction registered in
// initialize() -- confirm).
double CommonCalcCustomAngleForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    ContextSelector selector(cc);
    // globals is only initialized when the force defines global parameters.
    if (globals.isInitialized()) {
        bool changed = false;
        for (int i = 0; i < (int) globalParamNames.size(); i++) {
            // Compared as floats, matching the precision of the cached values.
            float value = (float) context.getParameter(globalParamNames[i]);
            if (value != globalParamValues[i])
                changed = true;
            globalParamValues[i] = value;
        }
        if (changed)
            globals.upload(globalParamValues);
    }
    return 0.0;
}

// Re-reads the per-angle parameters of this context's slice of angles from `force`.
// Throws OpenMMException if the slice size differs from the one seen in initialize().
void CommonCalcCustomAngleForceKernel::copyParametersToContext(ContextImpl& context, const CustomAngleForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumAngles()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumAngles()/numContexts;
    if (numAngles != endIndex-startIndex)
        throw OpenMMException("updateParametersInContext: The number of angles has changed");
    if (numAngles == 0)
        return;

    // Record the per-angle parameters.

    vector > paramVector(numAngles);
    // The particle indices are fetched but discarded; only the parameter values are updated.
    int atom1, atom2, atom3;
    for (int i = 0; i < numAngles; i++)
        force.getAngleParameters(startIndex+i, atom1, atom2, atom3, paramVector[i]);
    params->setParameterValues(paramVector, true);

    // Mark that the current reordering may be invalid.
// Final statement of CommonCalcCustomAngleForceKernel::copyParametersToContext().
    cc.invalidateMolecules(info);
}

// Describes the torsions of a PeriodicTorsionForce as particle groups of four particles.
// Two groups compare as identical when periodicity, phase and k are all equal.
class CommonCalcPeriodicTorsionForceKernel::ForceInfo : public ComputeForceInfo {
public:
    ForceInfo(const PeriodicTorsionForce& force) : force(force) {
    }
    // Number of groups equals the number of torsions in the force.
    int getNumParticleGroups() {
        return force.getNumTorsions();
    }
    // Writes the four particle indices of torsion `index` into `particles` (resized to 4).
    void getParticlesInGroup(int index, vector& particles) {
        int particle1, particle2, particle3, particle4, periodicity;
        double phase, k;
        force.getTorsionParameters(index, particle1, particle2, particle3, particle4, periodicity, phase, k);
        particles.resize(4);
        particles[0] = particle1;
        particles[1] = particle2;
        particles[2] = particle3;
        particles[3] = particle4;
    }
    // Compares only the torsion parameters; the particle indices are fetched but ignored.
    bool areGroupsIdentical(int group1, int group2) {
        int particle1, particle2, particle3, particle4, periodicity1, periodicity2;
        double phase1, phase2, k1, k2;
        force.getTorsionParameters(group1, particle1, particle2, particle3, particle4, periodicity1, phase1, k1);
        force.getTorsionParameters(group2, particle1, particle2, particle3, particle4, periodicity2, phase2, k2);
        return (periodicity1 == periodicity2 && phase1 == phase2 && k1 == k2);
    }
private:
    const PeriodicTorsionForce& force;
};

// Sets up the kernel for the slice [startIndex, endIndex) of torsions assigned to this context.
void CommonCalcPeriodicTorsionForceKernel::initialize(const System& system, const PeriodicTorsionForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts;
    numTorsions = endIndex-startIndex;
    // Nothing is created when this context has no torsions.
    if (numTorsions == 0)
        return;
    vector > atoms(numTorsions, vector(4));
    params.initialize(cc, numTorsions, "periodicTorsionParams");
    vector paramVector(numTorsions);
    for (int i = 0; i < numTorsions; i++) {
        int periodicity;
        double phase, k;
        force.getTorsionParameters(startIndex+i, atoms[i][0], atoms[i][1], atoms[i][2], atoms[i][3], periodicity, phase, k);
        // Packed per torsion as (k, phase, periodicity, unused), all converted to float.
        paramVector[i] = mm_float4((float) k, (float) phase, (float) periodicity, 0.0f);
    }
    params.upload(paramVector);
    map replacements;
    // The right-hand side of this assignment is on the next source line.
    replacements["APPLY_PERIODIC"] =
// Continuation of CommonCalcPeriodicTorsionForceKernel::initialize(): right-hand side of the
// replacements["APPLY_PERIODIC"] assignment.
        (force.usesPeriodicBoundaryConditions() ? "1" : "0");
    replacements["COMPUTE_FORCE"] = CommonKernelSources::periodicTorsionForce;
    replacements["PARAMS"] = cc.getBondedUtilities().addArgument(params, "float4");
    cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::torsionForce, replacements), force.getForceGroup());
    info = new ForceInfo(force);
    cc.addForce(info);
}

// Does no work of its own and always returns 0.0 (presumably the interaction registered in
// initialize() is evaluated elsewhere -- confirm).
double CommonCalcPeriodicTorsionForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    return 0.0;
}

// Re-reads (k, phase, periodicity) for this context's slice of torsions and uploads them.
// Throws OpenMMException if the slice size differs from the one seen in initialize().
void CommonCalcPeriodicTorsionForceKernel::copyParametersToContext(ContextImpl& context, const PeriodicTorsionForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts;
    if (numTorsions != endIndex-startIndex)
        throw OpenMMException("updateParametersInContext: The number of torsions has changed");
    if (numTorsions == 0)
        return;

    // Record the per-torsion parameters.

    vector paramVector(numTorsions);
    for (int i = 0; i < numTorsions; i++) {
        // The particle indices are fetched but discarded.
        int atom1, atom2, atom3, atom4, periodicity;
        double phase, k;
        force.getTorsionParameters(startIndex+i, atom1, atom2, atom3, atom4, periodicity, phase, k);
        // Same packing as in initialize(): (k, phase, periodicity, unused).
        paramVector[i] = mm_float4((float) k, (float) phase, (float) periodicity, 0.0f);
    }
    params.upload(paramVector);

    // Mark that the current reordering may be invalid.
// Final statement of CommonCalcPeriodicTorsionForceKernel::copyParametersToContext().
    cc.invalidateMolecules();
}

// Describes the torsions of an RBTorsionForce as particle groups of four particles.
// Two groups compare as identical when all six coefficients c0..c5 are equal.
class CommonCalcRBTorsionForceKernel::ForceInfo : public ComputeForceInfo {
public:
    ForceInfo(const RBTorsionForce& force) : force(force) {
    }
    // Number of groups equals the number of torsions in the force.
    int getNumParticleGroups() {
        return force.getNumTorsions();
    }
    // Writes the four particle indices of torsion `index` into `particles` (resized to 4).
    void getParticlesInGroup(int index, vector& particles) {
        int particle1, particle2, particle3, particle4;
        double c0, c1, c2, c3, c4, c5;
        force.getTorsionParameters(index, particle1, particle2, particle3, particle4, c0, c1, c2, c3, c4, c5);
        particles.resize(4);
        particles[0] = particle1;
        particles[1] = particle2;
        particles[2] = particle3;
        particles[3] = particle4;
    }
    // Compares only the coefficients; the particle indices are fetched but ignored.
    bool areGroupsIdentical(int group1, int group2) {
        int particle1, particle2, particle3, particle4;
        double c0a, c0b, c1a, c1b, c2a, c2b, c3a, c3b, c4a, c4b, c5a, c5b;
        force.getTorsionParameters(group1, particle1, particle2, particle3, particle4, c0a, c1a, c2a, c3a, c4a, c5a);
        force.getTorsionParameters(group2, particle1, particle2, particle3, particle4, c0b, c1b, c2b, c3b, c4b, c5b);
        return (c0a == c0b && c1a == c1b && c2a == c2b && c3a == c3b && c4a == c4b && c5a == c5b);
    }
private:
    const RBTorsionForce& force;
};

// Sets up the kernel for the slice [startIndex, endIndex) of torsions assigned to this context.
void CommonCalcRBTorsionForceKernel::initialize(const System& system, const RBTorsionForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts;
    numTorsions = endIndex-startIndex;
    // Nothing is created when this context has no torsions.
    if (numTorsions == 0)
        return;
    vector > atoms(numTorsions, vector(4));
    // The six coefficients are split over two arrays: c0..c3 in params1, c4..c5 in params2.
    params1.initialize(cc, numTorsions, "rbTorsionParams1");
    params2.initialize(cc, numTorsions, "rbTorsionParams2");
    vector paramVector1(numTorsions);
    vector paramVector2(numTorsions);
    for (int i = 0; i < numTorsions; i++) {
        double c0, c1, c2, c3, c4, c5;
        force.getTorsionParameters(startIndex+i, atoms[i][0], atoms[i][1], atoms[i][2], atoms[i][3], c0, c1, c2, c3, c4, c5);
        // The loop body continues on the next source line.
        paramVector1[i] = mm_float4((float) c0, (float) c1, (float) c2, (float) c3);
// Continuation of the parameter loop in CommonCalcRBTorsionForceKernel::initialize().
        paramVector2[i] = mm_float2((float) c4, (float) c5);
    }
    params1.upload(paramVector1);
    params2.upload(paramVector2);
    // Substitute the RB torsion code into the torsion force template and register the interaction.
    map replacements;
    replacements["APPLY_PERIODIC"] = (force.usesPeriodicBoundaryConditions() ? "1" : "0");
    replacements["COMPUTE_FORCE"] = CommonKernelSources::rbTorsionForce;
    replacements["PARAMS1"] = cc.getBondedUtilities().addArgument(params1, "float4");
    replacements["PARAMS2"] = cc.getBondedUtilities().addArgument(params2, "float2");
    cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::torsionForce, replacements), force.getForceGroup());
    info = new ForceInfo(force);
    cc.addForce(info);
}

// Does no work of its own and always returns 0.0 (presumably the interaction registered in
// initialize() is evaluated elsewhere -- confirm).
double CommonCalcRBTorsionForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    return 0.0;
}

// Re-reads c0..c5 for this context's slice of torsions and uploads them to params1/params2.
// Throws OpenMMException if the slice size differs from the one seen in initialize().
void CommonCalcRBTorsionForceKernel::copyParametersToContext(ContextImpl& context, const RBTorsionForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts;
    if (numTorsions != endIndex-startIndex)
        throw OpenMMException("updateParametersInContext: The number of torsions has changed");
    if (numTorsions == 0)
        return;

    // Record the per-torsion parameters.

    vector paramVector1(numTorsions);
    vector paramVector2(numTorsions);
    for (int i = 0; i < numTorsions; i++) {
        // The particle indices are fetched but discarded.
        int atom1, atom2, atom3, atom4;
        double c0, c1, c2, c3, c4, c5;
        force.getTorsionParameters(startIndex+i, atom1, atom2, atom3, atom4, c0, c1, c2, c3, c4, c5);
        paramVector1[i] = mm_float4((float) c0, (float) c1, (float) c2, (float) c3);
        paramVector2[i] = mm_float2((float) c4, (float) c5);
    }
    params1.upload(paramVector1);
    params2.upload(paramVector2);

    // Mark that the current reordering may be invalid.
cc.invalidateMolecules(); } class CommonCalcCustomTorsionForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const CustomTorsionForce& force) : force(force) { } int getNumParticleGroups() { return force.getNumTorsions(); } void getParticlesInGroup(int index, vector& particles) { int particle1, particle2, particle3, particle4; thread_local static vector parameters; force.getTorsionParameters(index, particle1, particle2, particle3, particle4, parameters); particles.resize(4); particles[0] = particle1; particles[1] = particle2; particles[2] = particle3; particles[3] = particle4; } bool areGroupsIdentical(int group1, int group2) { int particle1, particle2, particle3, particle4; thread_local static vector parameters1, parameters2; force.getTorsionParameters(group1, particle1, particle2, particle3, particle4, parameters1); force.getTorsionParameters(group2, particle1, particle2, particle3, particle4, parameters2); for (int i = 0; i < (int) parameters1.size(); i++) if (parameters1[i] != parameters2[i]) return false; return true; } private: const CustomTorsionForce& force; }; CommonCalcCustomTorsionForceKernel::~CommonCalcCustomTorsionForceKernel() { if (params != NULL) delete params; } void CommonCalcCustomTorsionForceKernel::initialize(const System& system, const CustomTorsionForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts; numTorsions = endIndex-startIndex; if (numTorsions == 0) return; vector > atoms(numTorsions, vector(4)); params = new ComputeParameterSet(cc, force.getNumPerTorsionParameters(), numTorsions, "customTorsionParams"); vector > paramVector(numTorsions); for (int i = 0; i < numTorsions; i++) force.getTorsionParameters(startIndex+i, atoms[i][0], atoms[i][1], atoms[i][2], atoms[i][3], paramVector[i]); params->setParameterValues(paramVector, true); info = new 
// Continuation of CommonCalcCustomTorsionForceKernel::initialize(): right-hand side of "info = new".
        ForceInfo(force);
    cc.addForce(info);

    // Record information for the expressions.

    // Cache the global parameter names and their default values (stored as floats).
    globalParamNames.resize(force.getNumGlobalParameters());
    globalParamValues.resize(force.getNumGlobalParameters());
    for (int i = 0; i < force.getNumGlobalParameters(); i++) {
        globalParamNames[i] = force.getGlobalParameterName(i);
        globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i);
    }
    // Parse the energy expression and differentiate it with respect to the angle variable.
    Lepton::ParsedExpression energyExpression = Lepton::Parser::parse(force.getEnergyFunction()).optimize();
    Lepton::ParsedExpression forceExpression = energyExpression.differentiate("theta").optimize();
    // Keys are the code prefixes that receive each expression's value in the generated source.
    map expressions;
    expressions["energy += "] = energyExpression;
    expressions["real dEdAngle = "] = forceExpression;

    // Create the kernels.

    // Map each expression variable name to the kernel-side identifier that holds its value.
    map variables;
    variables["theta"] = "theta";
    for (int i = 0; i < force.getNumPerTorsionParameters(); i++) {
        const string& name = force.getPerTorsionParameterName(i);
        variables[name] = "torsionParams"+params->getParameterSuffix(i);
    }
    if (force.getNumGlobalParameters() > 0) {
        // Global parameters live in one float array, indexed by parameter position.
        globals.initialize(cc, force.getNumGlobalParameters(), "customTorsionGlobals");
        globals.upload(globalParamValues);
        string argName = cc.getBondedUtilities().addArgument(globals, "float");
        for (int i = 0; i < force.getNumGlobalParameters(); i++) {
            const string& name = force.getGlobalParameterName(i);
            string value = argName+"["+cc.intToString(i)+"]";
            variables[name] = value;
        }
    }
    // One extra expression per requested energy parameter derivative.
    for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) {
        string paramName = force.getEnergyParameterDerivativeName(i);
        string derivVariable = cc.getBondedUtilities().addEnergyParameterDerivative(paramName);
        Lepton::ParsedExpression derivExpression = energyExpression.differentiate(paramName).optimize();
        expressions[derivVariable+" += "] = derivExpression;
    }
    stringstream compute;
    // The body of this loop continues on the next source line.
    for (int i = 0; i < (int) params->getParameterInfos().size(); i++) {
        ComputeParameterInfo& parameter = params->getParameterInfos()[i];
        string argName = cc.getBondedUtilities().addArgument(parameter.getArray(), parameter.getType());
// Continuation of the parameter loop in CommonCalcCustomTorsionForceKernel::initialize().
        // NOTE(review): text between "compute<" and "functions;" appears to be missing in this
        // view (presumably the rest of the stream statement, the loop's closing brace and the
        // start of a declaration) -- confirm against the real file.
        compute< functions;
    vector > functionNames;
    compute << cc.getExpressionUtilities().createExpressions(expressions, variables, functions, functionNames, "temp");
    // Substitute the generated code into the torsion force template and register the interaction.
    map replacements;
    replacements["APPLY_PERIODIC"] = (force.usesPeriodicBoundaryConditions() ? "1" : "0");
    replacements["COMPUTE_FORCE"] = compute.str();
    cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::torsionForce, replacements), force.getForceGroup());
}

// Refreshes the device copy of the global parameters when any value differs from the cached one.
// Always returns 0.0 (presumably the energy is accumulated by the interaction registered in
// initialize() -- confirm).
double CommonCalcCustomTorsionForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    ContextSelector selector(cc);
    // globals is only initialized when the force defines global parameters.
    if (globals.isInitialized()) {
        bool changed = false;
        for (int i = 0; i < (int) globalParamNames.size(); i++) {
            // Compared as floats, matching the precision of the cached values.
            float value = (float) context.getParameter(globalParamNames[i]);
            if (value != globalParamValues[i])
                changed = true;
            globalParamValues[i] = value;
        }
        if (changed)
            globals.upload(globalParamValues);
    }
    return 0.0;
}

// Re-reads the per-torsion parameters of this context's slice of torsions from `force`.
// Throws OpenMMException if the slice size differs from the one seen in initialize().
void CommonCalcCustomTorsionForceKernel::copyParametersToContext(ContextImpl& context, const CustomTorsionForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts;
    if (numTorsions != endIndex-startIndex)
        throw OpenMMException("updateParametersInContext: The number of torsions has changed");
    if (numTorsions == 0)
        return;

    // Record the per-torsion parameters.

    vector > paramVector(numTorsions);
    // The particle indices are fetched but discarded; only the parameter values are updated.
    int atom1, atom2, atom3, atom4;
    for (int i = 0; i < numTorsions; i++)
        force.getTorsionParameters(startIndex+i, atom1, atom2, atom3, atom4, paramVector[i]);
    params->setParameterValues(paramVector, true);

    // Mark that the current reordering may be invalid.
// Final statement of CommonCalcCustomTorsionForceKernel::copyParametersToContext().
    cc.invalidateMolecules(info);
}

// Describes the torsion pairs of a CMAPTorsionForce as particle groups of eight particles
// (a1..a4 followed by b1..b4). Two groups compare as identical when they use the same map index.
class CommonCalcCMAPTorsionForceKernel::ForceInfo : public ComputeForceInfo {
public:
    ForceInfo(const CMAPTorsionForce& force) : force(force) {
    }
    // Number of groups equals the number of CMAP torsions in the force.
    int getNumParticleGroups() {
        return force.getNumTorsions();
    }
    // Writes the eight particle indices of torsion `index` into `particles` (resized to 8).
    void getParticlesInGroup(int index, vector& particles) {
        int map, a1, a2, a3, a4, b1, b2, b3, b4;
        force.getTorsionParameters(index, map, a1, a2, a3, a4, b1, b2, b3, b4);
        particles.resize(8);
        particles[0] = a1;
        particles[1] = a2;
        particles[2] = a3;
        particles[3] = a4;
        particles[4] = b1;
        particles[5] = b2;
        particles[6] = b3;
        particles[7] = b4;
    }
    // Compares only the map indices; the particle indices are fetched but ignored.
    bool areGroupsIdentical(int group1, int group2) {
        int map1, map2, a1, a2, a3, a4, b1, b2, b3, b4;
        force.getTorsionParameters(group1, map1, a1, a2, a3, a4, b1, b2, b3, b4);
        force.getTorsionParameters(group2, map2, a1, a2, a3, a4, b1, b2, b3, b4);
        return (map1 == map2);
    }
private:
    const CMAPTorsionForce& force;
};

// Sets up the kernel for the slice [startIndex, endIndex) of CMAP torsions assigned to this
// context. All maps of the force are converted to coefficients, regardless of the slice.
void CommonCalcCMAPTorsionForceKernel::initialize(const System& system, const CMAPTorsionForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts;
    numTorsions = endIndex-startIndex;
    // Nothing is created (arrays, info) when this context has no torsions.
    if (numTorsions == 0)
        return;
    int numMaps = force.getNumMaps();
    vector coeffVec;
    mapPositionsVec.resize(numMaps);
    vector energy;
    vector > c;
    // Running offset of the current map's first entry within coeffVec.
    int currentPosition = 0;
    for (int i = 0; i < numMaps; i++) {
        int size;
        force.getMapParameters(i, size, energy);
        CMAPTorsionForceImpl::calcMapDerivatives(size, energy, c);
        // Remember where this map starts and its size; each grid cell takes four float4 entries.
        mapPositionsVec[i] = mm_int2(currentPosition, size);
        currentPosition += 4*size*size;
        for (int j = 0; j < size*size; j++) {
            // The 16 values of cell j are packed into four consecutive float4 entries
            // (the fourth is pushed on the next source line).
            coeffVec.push_back(mm_float4((float) c[j][0], (float) c[j][1], (float) c[j][2], (float) c[j][3]));
            coeffVec.push_back(mm_float4((float) c[j][4], (float) c[j][5], (float) c[j][6], (float) c[j][7]));
            coeffVec.push_back(mm_float4((float) c[j][8], (float) c[j][9], (float) c[j][10], (float) c[j][11]));
coeffVec.push_back(mm_float4((float) c[j][12], (float) c[j][13], (float) c[j][14], (float) c[j][15])); } } vector > atoms(numTorsions, vector(8)); vector torsionMapsVec(numTorsions); for (int i = 0; i < numTorsions; i++) force.getTorsionParameters(startIndex+i, torsionMapsVec[i], atoms[i][0], atoms[i][1], atoms[i][2], atoms[i][3], atoms[i][4], atoms[i][5], atoms[i][6], atoms[i][7]); coefficients.initialize(cc, coeffVec.size(), "cmapTorsionCoefficients"); mapPositions.initialize(cc, numMaps, "cmapTorsionMapPositions"); torsionMaps.initialize(cc, numTorsions, "cmapTorsionMaps"); coefficients.upload(coeffVec); mapPositions.upload(mapPositionsVec); torsionMaps.upload(torsionMapsVec); map replacements; replacements["APPLY_PERIODIC"] = (force.usesPeriodicBoundaryConditions() ? "1" : "0"); replacements["COEFF"] = cc.getBondedUtilities().addArgument(coefficients, "float4"); replacements["MAP_POS"] = cc.getBondedUtilities().addArgument(mapPositions, "int2"); replacements["MAPS"] = cc.getBondedUtilities().addArgument(torsionMaps, "int"); cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::cmapTorsionForce, replacements), force.getForceGroup()); info = new ForceInfo(force); cc.addForce(info); } double CommonCalcCMAPTorsionForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { return 0.0; } void CommonCalcCMAPTorsionForceKernel::copyParametersToContext(ContextImpl& context, const CMAPTorsionForce& force) { int numMaps = force.getNumMaps(); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumTorsions()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumTorsions()/numContexts; numTorsions = endIndex-startIndex; if (mapPositions.getSize() != numMaps) throw OpenMMException("updateParametersInContext: The number of maps has changed"); if (torsionMaps.getSize() != numTorsions) throw OpenMMException("updateParametersInContext: The number of CMAP torsions has changed"); // 
Update the maps. ContextSelector selector(cc); vector coeffVec; vector energy; vector > c; int currentPosition = 0; for (int i = 0; i < numMaps; i++) { int size; force.getMapParameters(i, size, energy); if (size != mapPositionsVec[i].y) throw OpenMMException("updateParametersInContext: The size of a map has changed"); CMAPTorsionForceImpl::calcMapDerivatives(size, energy, c); currentPosition += 4*size*size; for (int j = 0; j < size*size; j++) { coeffVec.push_back(mm_float4((float) c[j][0], (float) c[j][1], (float) c[j][2], (float) c[j][3])); coeffVec.push_back(mm_float4((float) c[j][4], (float) c[j][5], (float) c[j][6], (float) c[j][7])); coeffVec.push_back(mm_float4((float) c[j][8], (float) c[j][9], (float) c[j][10], (float) c[j][11])); coeffVec.push_back(mm_float4((float) c[j][12], (float) c[j][13], (float) c[j][14], (float) c[j][15])); } } coefficients.upload(coeffVec); // Update the indices. vector torsionMapsVec(numTorsions); for (int i = 0; i < numTorsions; i++) { int index[8]; force.getTorsionParameters(i, torsionMapsVec[i], index[0], index[1], index[2], index[3], index[4], index[5], index[6], index[7]); } torsionMaps.upload(torsionMapsVec); } class CommonCalcCustomExternalForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const CustomExternalForce& force, int numParticles) : force(force), indices(numParticles, -1) { vector params; for (int i = 0; i < force.getNumParticles(); i++) { int particle; force.getParticleParameters(i, particle, params); indices[particle] = i; } } bool areParticlesIdentical(int particle1, int particle2) { particle1 = indices[particle1]; particle2 = indices[particle2]; if (particle1 == -1 && particle2 == -1) return true; if (particle1 == -1 || particle2 == -1) return false; int temp; thread_local static vector params1, params2; force.getParticleParameters(particle1, temp, params1); force.getParticleParameters(particle2, temp, params2); for (int i = 0; i < (int) params1.size(); i++) if (params1[i] != params2[i]) 
// Tail of CommonCalcCustomExternalForceKernel::ForceInfo::areParticlesIdentical().
                return false;
        return true;
    }
private:
    const CustomExternalForce& force;
    // Indexed by system particle; holds that particle's index within the force, or -1.
    vector indices;
};

// Deletes the per-particle parameter set (if any) while this kernel's context is selected.
CommonCalcCustomExternalForceKernel::~CommonCalcCustomExternalForceKernel() {
    ContextSelector selector(cc);
    if (params != NULL)
        delete params;
}

// Sets up the kernel for the slice [startIndex, endIndex) of the force's particles assigned
// to this context.
void CommonCalcCustomExternalForceKernel::initialize(const System& system, const CustomExternalForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumParticles()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumParticles()/numContexts;
    numParticles = endIndex-startIndex;
    // Nothing is created (params, info, globals) when this context has no particles.
    if (numParticles == 0)
        return;
    // Each "interaction" involves a single particle.
    vector > atoms(numParticles, vector(1));
    params = new ComputeParameterSet(cc, force.getNumPerParticleParameters(), numParticles, "customExternalParams");
    vector > paramVector(numParticles);
    for (int i = 0; i < numParticles; i++)
        force.getParticleParameters(startIndex+i, atoms[i][0], paramVector[i]);
    params->setParameterValues(paramVector, true);
    // ForceInfo is sized by the number of particles in the whole system, not in the force.
    info = new ForceInfo(force, system.getNumParticles());
    cc.addForce(info);

    // Record information for the expressions.
// Continuation of CommonCalcCustomExternalForceKernel::initialize().
    // Cache the global parameter names and their default values (stored as floats).
    globalParamNames.resize(force.getNumGlobalParameters());
    globalParamValues.resize(force.getNumGlobalParameters());
    for (int i = 0; i < force.getNumGlobalParameters(); i++) {
        globalParamNames[i] = force.getGlobalParameterName(i);
        globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i);
    }
    // Make the "periodicdistance" function known to the parser via a placeholder.
    map customFunctions;
    customFunctions["periodicdistance"] = cc.getExpressionUtilities().getPeriodicDistancePlaceholder();
    // Parse the energy expression and differentiate it with respect to each coordinate.
    Lepton::ParsedExpression energyExpression = Lepton::Parser::parse(force.getEnergyFunction(), customFunctions).optimize();
    Lepton::ParsedExpression forceExpressionX = energyExpression.differentiate("x").optimize();
    Lepton::ParsedExpression forceExpressionY = energyExpression.differentiate("y").optimize();
    Lepton::ParsedExpression forceExpressionZ = energyExpression.differentiate("z").optimize();
    // Keys are the code prefixes that receive each expression's value in the generated source.
    map expressions;
    expressions["energy += "] = energyExpression;
    expressions["real dEdX = "] = forceExpressionX;
    expressions["real dEdY = "] = forceExpressionY;
    expressions["real dEdZ = "] = forceExpressionZ;

    // Create the kernels.
// Continuation of CommonCalcCustomExternalForceKernel::initialize().
    // Map each expression variable name to the kernel-side identifier that holds its value.
    map variables;
    variables["x"] = "pos1.x";
    variables["y"] = "pos1.y";
    variables["z"] = "pos1.z";
    for (int i = 0; i < force.getNumPerParticleParameters(); i++) {
        const string& name = force.getPerParticleParameterName(i);
        variables[name] = "particleParams"+params->getParameterSuffix(i);
    }
    if (force.getNumGlobalParameters() > 0) {
        // Global parameters live in one float array, indexed by parameter position.
        globals.initialize(cc, force.getNumGlobalParameters(), "customExternalGlobals");
        globals.upload(globalParamValues);
        string argName = cc.getBondedUtilities().addArgument(globals, "float");
        for (int i = 0; i < force.getNumGlobalParameters(); i++) {
            const string& name = force.getGlobalParameterName(i);
            string value = argName+"["+cc.intToString(i)+"]";
            variables[name] = value;
        }
    }
    stringstream compute;
    for (int i = 0; i < (int) params->getParameterInfos().size(); i++) {
        ComputeParameterInfo& parameter = params->getParameterInfos()[i];
        string argName = cc.getBondedUtilities().addArgument(parameter.getArray(), parameter.getType());
        // NOTE(review): text between "compute<" and "functions;" appears to be missing in this
        // view (presumably the rest of the stream statement, the loop's closing brace and the
        // start of a declaration) -- confirm against the real file.
        compute< functions;
    vector > functionNames;
    compute << cc.getExpressionUtilities().createExpressions(expressions, variables, functions, functionNames, "temp");
    // Substitute the generated code into the external force template and register the interaction.
    map replacements;
    replacements["COMPUTE_FORCE"] = compute.str();
    cc.getBondedUtilities().addInteraction(atoms, cc.replaceStrings(CommonKernelSources::customExternalForce, replacements), force.getForceGroup());
}

// Refreshes the device copy of the global parameters when any value differs from the cached one.
// Always returns 0.0 (presumably the energy is accumulated by the interaction registered in
// initialize() -- confirm).
double CommonCalcCustomExternalForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    ContextSelector selector(cc);
    // globals is only initialized when the force defines global parameters.
    if (globals.isInitialized()) {
        bool changed = false;
        for (int i = 0; i < (int) globalParamNames.size(); i++) {
            // Compared as floats, matching the precision of the cached values.
            float value = (float) context.getParameter(globalParamNames[i]);
            if (value != globalParamValues[i])
                changed = true;
            globalParamValues[i] = value;
        }
        if (changed)
            globals.upload(globalParamValues);
    }
    return 0.0;
}

// Re-reads the per-particle parameters of this context's slice from `force`.
// The function body continues on the next source line.
void CommonCalcCustomExternalForceKernel::copyParametersToContext(ContextImpl& context, const CustomExternalForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
// Continuation of CommonCalcCustomExternalForceKernel::copyParametersToContext().
    int startIndex = cc.getContextIndex()*force.getNumParticles()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumParticles()/numContexts;
    // The slice size must match the one seen in initialize().
    if (numParticles != endIndex-startIndex)
        throw OpenMMException("updateParametersInContext: The number of particles has changed");
    if (numParticles == 0)
        return;

    // Record the per-particle parameters.

    vector > paramVector(numParticles);
    // The particle index is fetched but discarded; only the parameter values are updated.
    int particle;
    for (int i = 0; i < numParticles; i++)
        force.getParticleParameters(startIndex+i, particle, paramVector[i]);
    params->setParameterValues(paramVector, true);

    // Mark that the current reordering may be invalid.

    cc.invalidateMolecules(info);
}

// Describes the bonds of a CustomCompoundBondForce as particle groups. Two groups compare as
// identical when all of their per-bond parameter values are equal.
class CommonCalcCustomCompoundBondForceKernel::ForceInfo : public ComputeForceInfo {
public:
    ForceInfo(const CustomCompoundBondForce& force) : force(force) {
    }
    // Number of groups equals the number of bonds in the force.
    int getNumParticleGroups() {
        return force.getNumBonds();
    }
    // Lets the force fill `particles` directly with the particles of bond `index`.
    void getParticlesInGroup(int index, vector& particles) {
        // The parameters are fetched only because the accessor requires an output argument.
        thread_local static vector parameters;
        force.getBondParameters(index, particles, parameters);
    }
    // Compares the per-bond parameter values of the two bonds; particle indices are ignored.
    bool areGroupsIdentical(int group1, int group2) {
        thread_local static vector particles;
        thread_local static vector parameters1, parameters2;
        force.getBondParameters(group1, particles, parameters1);
        force.getBondParameters(group2, particles, parameters2);
        for (int i = 0; i < (int) parameters1.size(); i++)
            if (parameters1[i] != parameters2[i])
                return false;
        return true;
    }
private:
    const CustomCompoundBondForce& force;
};

// Deletes the per-bond parameter set (if any) while this kernel's context is selected.
CommonCalcCustomCompoundBondForceKernel::~CommonCalcCustomCompoundBondForceKernel() {
    ContextSelector selector(cc);
    if (params != NULL)
        delete params;
}

// Sets up the kernel for the slice [startIndex, endIndex) of bonds assigned to this context.
void CommonCalcCustomCompoundBondForceKernel::initialize(const System& system, const CustomCompoundBondForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumBonds()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumBonds()/numContexts;
    numBonds = endIndex-startIndex;
    // Nothing is created (params, info, globals, tables) when this context has no bonds.
    if (numBonds == 0)
        return;
    // The declaration started here continues on the next source line.
    int
// Continuation of CommonCalcCustomCompoundBondForceKernel::initialize(): completes the
// "int particlesPerBond" declaration begun on the previous source line.
        particlesPerBond = force.getNumParticlesPerBond();
    vector > atoms(numBonds, vector(particlesPerBond));
    // The last argument selects the parameter precision from the context's precision setting
    // (NOTE(review): meaning of the preceding `false` argument is not visible here -- confirm).
    params = new ComputeParameterSet(cc, force.getNumPerBondParameters(), numBonds, "customCompoundBondParams", false, cc.getUseDoublePrecision());
    vector > paramVector(numBonds);
    for (int i = 0; i < numBonds; i++)
        force.getBondParameters(startIndex+i, atoms[i], paramVector[i]);
    params->setParameterValues(paramVector, true);
    info = new ForceInfo(force);
    cc.addForce(info);

    // Record the tabulated functions.

    map functions;
    vector > functionDefinitions;
    vector functionList;
    tabulatedFunctionArrays.resize(force.getNumTabulatedFunctions());
    for (int i = 0; i < force.getNumTabulatedFunctions(); i++) {
        functionList.push_back(&force.getTabulatedFunction(i));
        string name = force.getTabulatedFunctionName(i);
        // Remember the update count so copyParametersToContext() can detect later changes.
        tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount();
        functions[name] = cc.getExpressionUtilities().getFunctionPlaceholder(force.getTabulatedFunction(i));
        // `width` is set by computeFunctionCoefficients() and selects the array element type below.
        int width;
        vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width);
        tabulatedFunctionArrays[i].initialize(cc, f.size(), "TabulatedFunction");
        tabulatedFunctionArrays[i].upload(f);
        // Element type is "float" for width 1, otherwise "float<width>" (e.g. "float4").
        string arrayName = cc.getBondedUtilities().addArgument(tabulatedFunctionArrays[i], width == 1 ? "float" : "float"+cc.intToString(width));
        functionDefinitions.push_back(make_pair(name, arrayName));
    }

    // Record information about parameters.
// Continuation of CommonCalcCustomCompoundBondForceKernel::initialize().
    // Cache the global parameter names and their default values (stored as floats).
    globalParamNames.resize(force.getNumGlobalParameters());
    globalParamValues.resize(force.getNumGlobalParameters());
    for (int i = 0; i < force.getNumGlobalParameters(); i++) {
        globalParamNames[i] = force.getGlobalParameterName(i);
        globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i);
    }
    // Map each expression variable name to the kernel-side identifier that holds its value.
    map variables;
    for (int i = 0; i < particlesPerBond; i++) {
        // Particle variables are 1-based: x1/y1/z1 map to pos1.x/pos1.y/pos1.z, and so on.
        string index = cc.intToString(i+1);
        variables["x"+index] = "pos"+index+".x";
        variables["y"+index] = "pos"+index+".y";
        variables["z"+index] = "pos"+index+".z";
    }
    for (int i = 0; i < force.getNumPerBondParameters(); i++) {
        const string& name = force.getPerBondParameterName(i);
        variables[name] = "bondParams"+params->getParameterSuffix(i);
    }
    if (force.getNumGlobalParameters() > 0) {
        // Global parameters live in one float array, indexed by parameter position.
        globals.initialize(cc, force.getNumGlobalParameters(), "customCompoundBondGlobals");
        globals.upload(globalParamValues);
        string argName = cc.getBondedUtilities().addArgument(globals, "float");
        for (int i = 0; i < force.getNumGlobalParameters(); i++) {
            const string& name = force.getGlobalParameterName(i);
            string value = argName+"["+cc.intToString(i)+"]";
            variables[name] = value;
        }
    }

    // Generate the kernel.
// Continuation of CommonCalcCustomCompoundBondForceKernel::initialize().
    Lepton::ParsedExpression energyExpression = CustomCompoundBondForceImpl::prepareExpression(force, functions);
    map forceExpressions;
    stringstream compute;
    for (int i = 0; i < (int) params->getParameterInfos().size(); i++) {
        ComputeParameterInfo& parameter = params->getParameterInfos()[i];
        string argName = cc.getBondedUtilities().addArgument(parameter.getArray(), parameter.getType());
        // NOTE(review): text between "compute<" and "replacements;" appears to be missing in this
        // view. The lost span presumably includes the rest of this loop and the code that builds
        // and registers the interaction -- confirm against the real file.
        compute< replacements;
    replacements["M_PI"] = cc.doubleToString(M_PI);
    cc.getBondedUtilities().addPrefixCode(cc.replaceStrings(CommonKernelSources::pointFunctions, replacements));
}

// Refreshes the device copy of the global parameters when any value differs from the cached one.
// Always returns 0.0 (presumably the energy is accumulated by the interaction registered in
// initialize() -- confirm).
double CommonCalcCustomCompoundBondForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    ContextSelector selector(cc);
    // globals is only initialized when the force defines global parameters.
    if (globals.isInitialized()) {
        bool changed = false;
        for (int i = 0; i < (int) globalParamNames.size(); i++) {
            // Compared as floats, matching the precision of the cached values.
            float value = (float) context.getParameter(globalParamNames[i]);
            if (value != globalParamValues[i])
                changed = true;
            globalParamValues[i] = value;
        }
        if (changed)
            globals.upload(globalParamValues);
    }
    return 0.0;
}

// Re-reads the per-bond parameters of this context's slice of bonds and re-uploads any
// tabulated function whose update count has changed.
// Throws OpenMMException if the slice size differs from the one seen in initialize().
void CommonCalcCustomCompoundBondForceKernel::copyParametersToContext(ContextImpl& context, const CustomCompoundBondForce& force) {
    ContextSelector selector(cc);
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*force.getNumBonds()/numContexts;
    int endIndex = (cc.getContextIndex()+1)*force.getNumBonds()/numContexts;
    if (numBonds != endIndex-startIndex)
        throw OpenMMException("updateParametersInContext: The number of bonds has changed");
    if (numBonds == 0)
        return;

    // Record the per-bond parameters.

    vector > paramVector(numBonds);
    // The particle indices are fetched but discarded; only the parameter values are updated.
    vector particles;
    for (int i = 0; i < numBonds; i++)
        force.getBondParameters(startIndex+i, particles, paramVector[i]);
    params->setParameterValues(paramVector, true);

    // See if any tabulated functions have changed.
for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { string name = force.getTabulatedFunctionName(i); if (force.getTabulatedFunction(i).getUpdateCount() != tabulatedFunctionUpdateCount[name]) { tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].upload(f); } } // Mark that the current reordering may be invalid. cc.invalidateMolecules(info); } class CommonCalcCustomCentroidBondForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const CustomCentroidBondForce& force) : force(force) { } int getNumParticleGroups() { return force.getNumBonds(); } void getParticlesInGroup(int index, vector& particles) { thread_local static vector parameters; thread_local static vector groups; force.getBondParameters(index, groups, parameters); for (int group : groups) { vector groupParticles; vector weights; force.getGroupParameters(group, groupParticles, weights); particles.insert(particles.end(), groupParticles.begin(), groupParticles.end()); } } bool areGroupsIdentical(int group1, int group2) { thread_local static vector groups1, groups2; thread_local static vector parameters1, parameters2; force.getBondParameters(group1, groups1, parameters1); force.getBondParameters(group2, groups2, parameters2); for (int i = 0; i < (int) parameters1.size(); i++) if (parameters1[i] != parameters2[i]) return false; for (int i = 0; i < groups1.size(); i++) { vector groupParticles; vector weights1, weights2; force.getGroupParameters(groups1[i], groupParticles, weights1); force.getGroupParameters(groups2[i], groupParticles, weights2); if (weights1.size() != weights2.size()) return false; for (int j = 0; j < weights1.size(); j++) if (weights1[j] != weights2[j]) return false; } return true; } private: const CustomCentroidBondForce& force; }; 
/**
 * Free the per-bond parameter set created by initialize().
 *
 * initialize() only assigns `params` when the force has at least one bond, so
 * the NULL test relies on the member being null-initialised elsewhere (not
 * visible in this part of the file).
 */
CommonCalcCustomCentroidBondForceKernel::~CommonCalcCustomCentroidBondForceKernel() {
    ContextSelector selector(cc);
    if (params != NULL)
        delete params;
}

/**
 * Build the device arrays and the three kernels ("computeGroupCenters",
 * "computeGroupForces", "applyForcesToAtoms") for a CustomCentroidBondForce.
 *
 * Returns immediately, without creating anything, when the force has no bonds.
 *
 * NOTE(review): this copy of the function has lost text. Template arguments are
 * missing throughout and two stream-insertion statements in the "Generate the
 * kernel" section are cut off mid-expression. The affected lines are marked
 * below; restore them from the upstream source.
 *
 * @param system  passed on to CustomCentroidBondForceImpl::computeNormalizedWeights()
 * @param force   the force whose groups, bonds, functions and parameters are recorded
 */
void CommonCalcCustomCentroidBondForceKernel::initialize(const System& system, const CustomCentroidBondForce& force) {
    ContextSelector selector(cc);
    numBonds = force.getNumBonds();
    if (numBonds == 0)
        return;
    info = new ForceInfo(force);
    cc.addForce(info);

    // Record the groups.

    numGroups = force.getNumGroups();
    vector groupParticleVec;
    vector groupWeightVec;
    vector groupOffsetVec;
    // groupOffsetVec[i] .. groupOffsetVec[i+1] delimits group i inside groupParticleVec.
    groupOffsetVec.push_back(0);
    for (int i = 0; i < numGroups; i++) {
        vector particles;
        vector weights;
        force.getGroupParameters(i, particles, weights);
        groupParticleVec.insert(groupParticleVec.end(), particles.begin(), particles.end());
        groupOffsetVec.push_back(groupParticleVec.size());
    }
    // The uploaded weights are the normalized ones, not the raw weights read above.
    vector > normalizedWeights;
    CustomCentroidBondForceImpl::computeNormalizedWeights(force, system, normalizedWeights);
    for (int i = 0; i < numGroups; i++)
        groupWeightVec.insert(groupWeightVec.end(), normalizedWeights[i].begin(), normalizedWeights[i].end());
    groupParticles.initialize(cc, groupParticleVec.size(), "groupParticles");
    groupParticles.upload(groupParticleVec);
    // NOTE(review): both branches read identically in this copy; presumably explicit
    // template arguments selecting the element type were dropped -- confirm upstream.
    if (cc.getUseDoublePrecision()) {
        groupWeights.initialize(cc, groupParticleVec.size(), "groupWeights");
        centerPositions.initialize(cc, numGroups, "centerPositions");
    }
    else {
        groupWeights.initialize(cc, groupParticleVec.size(), "groupWeights");
        centerPositions.initialize(cc, numGroups, "centerPositions");
    }
    groupWeights.upload(groupWeightVec, true);
    groupOffsets.initialize(cc, groupOffsetVec.size(), "groupOffsets");
    groupOffsets.upload(groupOffsetVec);
    groupForces.initialize(cc, numGroups*3, "groupForces");
    cc.addAutoclearBuffer(groupForces);

    // Record the bonds.

    int groupsPerBond = force.getNumGroupsPerBond();
    vector bondGroupVec(numBonds*groupsPerBond);
    params = new ComputeParameterSet(cc, force.getNumPerBondParameters(), numBonds, "customCentroidBondParams", false, cc.getUseDoublePrecision());
    vector > paramVector(numBonds);
    for (int i = 0; i < numBonds; i++) {
        vector groups;
        force.getBondParameters(i, groups, paramVector[i]);
        // Group slot j of bond i is stored at i + j*numBonds, matching the
        // "bondGroups[index+<j*numBonds>]" lookups generated further down.
        for (int j = 0; j < groups.size(); j++)
            bondGroupVec[i+j*numBonds] = groups[j];
    }
    params->setParameterValues(paramVector, true);
    bondGroups.initialize(cc, bondGroupVec.size(), "bondGroups");
    bondGroups.upload(bondGroupVec);

    // Record the tabulated functions.

    map functions;
    vector > functionDefinitions;
    vector functionList;
    stringstream extraArgs;
    tabulatedFunctionArrays.resize(force.getNumTabulatedFunctions());
    for (int i = 0; i < force.getNumTabulatedFunctions(); i++) {
        functionList.push_back(&force.getTabulatedFunction(i));
        string name = force.getTabulatedFunctionName(i);
        // Remember the update count so copyParametersToContext() can detect later changes.
        tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount();
        string arrayName = "table"+cc.intToString(i);
        functionDefinitions.push_back(make_pair(name, arrayName));
        functions[name] = cc.getExpressionUtilities().getFunctionPlaceholder(force.getTabulatedFunction(i));
        int width;
        vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width);
        tabulatedFunctionArrays[i].initialize(cc, f.size(), "TabulatedFunction");
        tabulatedFunctionArrays[i].upload(f);
        // Kernel argument type is "float" for width 1, otherwise "float<width>".
        extraArgs << ", GLOBAL const float";
        if (width > 1)
            extraArgs << width;
        extraArgs << "* RESTRICT " << arrayName;
    }

    // Record information about parameters.

    globalParamNames.resize(force.getNumGlobalParameters());
    globalParamValues.resize(force.getNumGlobalParameters());
    for (int i = 0; i < force.getNumGlobalParameters(); i++) {
        globalParamNames[i] = force.getGlobalParameterName(i);
        globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i);
    }
    // Map expression variable names to the text used for them in the generated kernel.
    map variables;
    for (int i = 0; i < groupsPerBond; i++) {
        string index = cc.intToString(i+1);
        variables["x"+index] = "pos"+index+".x";
        variables["y"+index] = "pos"+index+".y";
        variables["z"+index] = "pos"+index+".z";
    }
    for (int i = 0; i < force.getNumPerBondParameters(); i++) {
        const string& name = force.getPerBondParameterName(i);
        variables[name] = "bondParams"+params->getParameterSuffix(i);
    }
    needEnergyParamDerivs = (force.getNumEnergyParameterDerivatives() > 0);
    if (needEnergyParamDerivs)
        extraArgs << ", GLOBAL mixed* RESTRICT energyParamDerivs";
    if (force.getNumGlobalParameters() > 0) {
        globals.initialize(cc, force.getNumGlobalParameters(), "customCentroidBondGlobals");
        globals.upload(globalParamValues);
        extraArgs << ", GLOBAL const float* RESTRICT globals";
        for (int i = 0; i < force.getNumGlobalParameters(); i++) {
            const string& name = force.getGlobalParameterName(i);
            string value = "globals["+cc.intToString(i)+"]";
            variables[name] = value;
        }
    }

    // Generate the kernel.

    Lepton::ParsedExpression energyExpression = CustomCentroidBondForceImpl::prepareExpression(force, functions);
    map forceExpressions;
    stringstream compute, initParamDerivs, saveParamDerivs;
    // Emit one group index and one center position per group slot of the bond.
    for (int i = 0; i < groupsPerBond; i++) {
        compute<<"int group"<<(i+1)<<" = bondGroups[index+"<<(i*numBonds)<<"];\n";
        compute<<"real4 pos"<<(i+1)<<" = centerPositions[group"<<(i+1)<<"];\n";
    }
    for (int i = 0; i < (int) params->getParameterInfos().size(); i++) {
        ComputeParameterInfo& parameter = params->getParameterInfos()[i];
        // NOTE(review): the next statement is cut off after the string literal in this
        // copy; the text between it and "& allParamDerivNames" is missing. Restore upstream.
        extraArgs<<", GLOBAL const "<& allParamDerivNames = cc.getEnergyParamDerivNames();
        int numDerivs = allParamDerivNames.size();
        // For each derivative this force requests, find its slot in the context-wide
        // name list and emit an accumulation into energyParamDerivs at that slot.
        for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++)
            for (int index = 0; index < numDerivs; index++)
                if (allParamDerivNames[index] == force.getEnergyParameterDerivativeName(i))
                    saveParamDerivs << "energyParamDerivs[GLOBAL_ID*" << numDerivs << "+" << index << "] += energyParamDeriv" << i << ";\n";
    }
    vector forceNames;
    for (int i = 0; i < groupsPerBond; i++) {
        string istr = cc.intToString(i+1);
        string forceName = "force"+istr;
        forceNames.push_back(forceName);
        // NOTE(review): the next statement is cut off after "real3 " in this copy; the rest
        // of this loop and the declaration of `replacements` are missing. Restore upstream.
        compute<<"real3 "< replacements;
    replacements["M_PI"] = cc.doubleToString(M_PI);
    replacements["NUM_BONDS"] = cc.intToString(numBonds);
    replacements["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms());
    replacements["EXTRA_ARGS"] = extraArgs.str();
    replacements["COMPUTE_FORCE"] = compute.str();
    replacements["INIT_PARAM_DERIVS"] = initParamDerivs.str();
    replacements["SAVE_PARAM_DERIVS"] = saveParamDerivs.str();
    ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::pointFunctions+CommonKernelSources::customCentroidBond, replacements));
    computeCentersKernel = program->createKernel("computeGroupCenters");
    computeCentersKernel->addArg(numGroups);
    computeCentersKernel->addArg(cc.getPosq());
    computeCentersKernel->addArg(groupParticles);
    computeCentersKernel->addArg(groupWeights);
    computeCentersKernel->addArg(groupOffsets);
    computeCentersKernel->addArg(centerPositions);
    // Argument positions matter: execute() later fills slot 2, slots 5-9 and
    // (when derivatives are needed) slot 10 by index.
    groupForcesKernel = program->createKernel("computeGroupForces");
    groupForcesKernel->addArg(numGroups);
    groupForcesKernel->addArg(groupForces);
    groupForcesKernel->addArg(); // Energy buffer hasn't been created yet
    groupForcesKernel->addArg(centerPositions);
    groupForcesKernel->addArg(bondGroups);
    for (int i = 0; i < 5; i++)
        groupForcesKernel->addArg(); // Periodic box information will be set just before it is executed.
    if (needEnergyParamDerivs)
        groupForcesKernel->addArg(); // Deriv buffer hasn't been created yet.
    for (auto& function : tabulatedFunctionArrays)
        groupForcesKernel->addArg(function);
    if (globals.isInitialized())
        groupForcesKernel->addArg(globals);
    for (auto& parameter : params->getParameterInfos())
        groupForcesKernel->addArg(parameter.getArray());
    applyForcesKernel = program->createKernel("applyForcesToAtoms");
    applyForcesKernel->addArg(numGroups);
    applyForcesKernel->addArg(groupParticles);
    applyForcesKernel->addArg(groupWeights);
    applyForcesKernel->addArg(groupOffsets);
    applyForcesKernel->addArg(groupForces);
    // Slot 5 is reserved here; execute() sets it to the long force buffer.
    applyForcesKernel->addArg();
}

/**
 * Launch the "computeGroupCenters", "computeGroupForces" and "applyForcesToAtoms"
 * kernels created by initialize(), in that order.
 *
 * Global parameter values are re-read from `context` first and re-uploaded only
 * if at least one differs from the cached value. `includeForces` and
 * `includeEnergy` are not read by this function.
 *
 * @return always 0.0; the energy buffer is handed to the kernel as argument 2
 *         (presumably the energy is accumulated there -- confirm in the kernel source)
 */
double CommonCalcCustomCentroidBondForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    if (numBonds == 0)
        return 0.0;
    ContextSelector selector(cc);
    if (globals.isInitialized()) {
        bool changed = false;
        for (int i = 0; i < (int) globalParamNames.size(); i++) {
            float value = (float) context.getParameter(globalParamNames[i]);
            if (value != globalParamValues[i])
                changed = true;
            globalParamValues[i] = value;
        }
        if (changed)
            globals.upload(globalParamValues);
    }
    computeCentersKernel->execute(32*numGroups);
    // Fill the slots that initialize() reserved with empty addArg() calls.
    groupForcesKernel->setArg(2, cc.getEnergyBuffer());
    setPeriodicBoxArgs(cc, groupForcesKernel, 5);
    if (needEnergyParamDerivs)
        groupForcesKernel->setArg(10, cc.getEnergyParamDerivBuffer());
    groupForcesKernel->execute(numBonds);
    applyForcesKernel->setArg(5, cc.getLongForceBuffer());
    applyForcesKernel->execute(32*numGroups);
    return 0.0;
}

void
// copyParametersToContext: re-upload the per-bond parameters of `force` and any
// tabulated function whose update count changed, then invalidate the molecule
// information for this force. Throws OpenMMException if the number of bonds
// differs from the one recorded earlier. (The return type sits on the line above.)
CommonCalcCustomCentroidBondForceKernel::copyParametersToContext(ContextImpl& context, const CustomCentroidBondForce& force) {
    ContextSelector selector(cc);
    if (numBonds != force.getNumBonds())
        throw OpenMMException("updateParametersInContext: The number of bonds has changed");
    if (numBonds == 0)
        return;

    // Record the per-bond parameters.

    vector > paramVector(numBonds);
    // `particles` only receives the group list of each bond; it is not used afterwards.
    vector particles;
    for (int i = 0; i < numBonds; i++)
        force.getBondParameters(i, particles, paramVector[i]);
    params->setParameterValues(paramVector, true);

    // See if any tabulated functions have changed.

    for (int i = 0; i < force.getNumTabulatedFunctions(); i++) {
        string name = force.getTabulatedFunctionName(i);
        if (force.getTabulatedFunction(i).getUpdateCount() != tabulatedFunctionUpdateCount[name]) {
            tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount();
            int width;
            vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width);
            tabulatedFunctionArrays[i].upload(f);
        }
    }

    // Mark that the current reordering may be invalid.

    cc.invalidateMolecules(info);
}

/**
 * ComputeForceInfo implementation backed by a CustomNonbondedForce.
 *
 * Particles are identical when their per-particle parameters match and, if the
 * force defines interaction groups, they belong to the same group sets. Each
 * exclusion is reported as a two-particle group, and all such groups are
 * considered identical.
 *
 * NOTE(review): template arguments are missing from the container declarations
 * in this copy (e.g. `set set1, set2;`) -- restore from upstream.
 */
class CommonCalcCustomNonbondedForceKernel::ForceInfo : public ComputeForceInfo {
public:
    ForceInfo(const CustomNonbondedForce& force) : force(force) {
        if (force.getNumInteractionGroups() > 0) {
            groupsForParticle.resize(force.getNumParticles());
            for (int i = 0; i < force.getNumInteractionGroups(); i++) {
                set set1, set2;
                force.getInteractionGroupParameters(i, set1, set2);
                // Encode membership as 2*i for the first set of group i and 2*i+1 for the second.
                for (int p : set1)
                    groupsForParticle[p].insert(2*i);
                for (int p : set2)
                    groupsForParticle[p].insert(2*i+1);
            }
        }
    }
    bool areParticlesIdentical(int particle1, int particle2) {
        thread_local static vector params1, params2;
        force.getParticleParameters(particle1, params1);
        force.getParticleParameters(particle2, params2);
        for (int i = 0; i < (int) params1.size(); i++)
            if (params1[i] != params2[i])
                return false;
        // groupsForParticle is empty when the force has no interaction groups.
        if (groupsForParticle.size() > 0 && groupsForParticle[particle1] != groupsForParticle[particle2])
            return false;
        return true;
    }
    int getNumParticleGroups() {
        return force.getNumExclusions();
    }
    void getParticlesInGroup(int index, vector& particles) {
        int particle1, particle2;
        force.getExclusionParticles(index, particle1, particle2);
        particles.resize(2);
        particles[0] = particle1;
        particles[1] = particle2;
    }
    bool areGroupsIdentical(int group1, int group2) {
        return true;
    }
private:
    const CustomNonbondedForce& force;
    vector > groupsForParticle;
};

/**
 * Post-computation that adds the long range correction of a CustomNonbondedForce.
 *
 * The coefficient and its derivatives are held by reference, so values written
 * elsewhere (see LongRangeTask) are picked up when computeForceAndEnergy() runs.
 */
class CommonCalcCustomNonbondedForceKernel::LongRangePostComputation : public ComputeContext::ForcePostComputation {
public:
    LongRangePostComputation(ComputeContext& cc, double& longRangeCoefficient, vector& longRangeCoefficientDerivs, CustomNonbondedForce* force) :
            cc(cc), longRangeCoefficient(longRangeCoefficient), longRangeCoefficientDerivs(longRangeCoefficientDerivs), force(force) {
    }
    /**
     * Returns longRangeCoefficient/volume and adds each coefficient derivative
     * divided by the volume to the context's energy-derivative workspace.
     * Returns 0 when the force-group test below fails. `includeForces` and
     * `includeEnergy` are not read.
     */
    double computeForceAndEnergy(bool includeForces, bool includeEnergy, int groups) {
        // NOTE(review): the shift expression in this test is cut off in this copy
        // (presumably it tested the bit for force->getForceGroup()) -- restore upstream.
        if ((groups&(1<getForceGroup())) == 0)
            return 0;
        // When called from another thread, flush the work thread before reading the values.
        if (!cc.getWorkThread().isCurrentThread())
            cc.getWorkThread().flush();
        Vec3 a, b, c;
        cc.getPeriodicBoxVectors(a, b, c);
        double volume = a[0]*b[1]*c[2];
        map& derivs = cc.getEnergyParamDerivWorkspace();
        for (int i = 0; i < longRangeCoefficientDerivs.size(); i++)
            derivs[force->getEnergyParameterDerivativeName(i)] += longRangeCoefficientDerivs[i]/volume;
        return longRangeCoefficient/volume;
    }
private:
    ComputeContext& cc;
    double& longRangeCoefficient;
    vector& longRangeCoefficientDerivs;
    CustomNonbondedForce* force;
};

/**
 * Work task that evaluates the long range correction coefficient (and its
 * derivatives) by calling CustomNonbondedForceImpl::calcLongRangeCorrection().
 * Results are written through the references supplied at construction.
 */
class CommonCalcCustomNonbondedForceKernel::LongRangeTask : public ComputeContext::WorkTask {
public:
    LongRangeTask(ComputeContext& cc, Context& context, CustomNonbondedForceImpl::LongRangeCorrectionData& data,
                  double& longRangeCoefficient, vector& longRangeCoefficientDerivs, CustomNonbondedForce* force) :
                        cc(cc), context(context), data(data), longRangeCoefficient(longRangeCoefficient),
                        longRangeCoefficientDerivs(longRangeCoefficientDerivs), force(force) {
    }
    void execute() {
        CustomNonbondedForceImpl::calcLongRangeCorrection(*force, data, context, longRangeCoefficient, longRangeCoefficientDerivs, cc.getThreadPool());
    }
private:
    ComputeContext& cc;
    Context& context;
    CustomNonbondedForceImpl::LongRangeCorrectionData& data;
    double& longRangeCoefficient;
    vector& longRangeCoefficientDerivs;
    CustomNonbondedForce* force;
};

/**
 * Free the objects this kernel allocates with `new` in initialize(): the
 * parameter set, the computed-value set and the private copy of the force.
 */
CommonCalcCustomNonbondedForceKernel::~CommonCalcCustomNonbondedForceKernel() {
    ContextSelector selector(cc);
    if (params != NULL)
        delete params;
    if (computedValues != NULL)
        delete computedValues;
    if (forceCopy != NULL)
        delete forceCopy;
}

/**
 * Record the parameters, exclusions, tabulated functions and expressions of a
 * CustomNonbondedForce and create the kernels needed to evaluate it.
 * The body continues on the following lines of the file.
 */
void CommonCalcCustomNonbondedForceKernel::initialize(const System& system, const CustomNonbondedForce& force) {
    ContextSelector selector(cc);
    // Locate this force in the system by address; forceIndex ends up equal to
    // system.getNumForces() if it is not found.
    int forceIndex;
    for (forceIndex = 0; forceIndex < system.getNumForces() && &system.getForce(forceIndex) != &force; ++forceIndex)
        ;
    // Names get a "custom<index>_" prefix only when no interaction groups are used.
    string prefix = (force.getNumInteractionGroups() == 0 ? "custom"+cc.intToString(forceIndex)+"_" : "");

    // Record parameters and exclusions.
// (CommonCalcCustomNonbondedForceKernel::initialize, continued: parameters and exclusions.)
// NOTE(review): template arguments are missing from container declarations throughout
// this copy (e.g. `vector > paramVector`, `map functions`) -- restore from upstream.
    int numParticles = force.getNumParticles();
    int paddedNumParticles = cc.getPaddedNumAtoms();
    int numParams = force.getNumPerParticleParameters();
    params = new ComputeParameterSet(cc, numParams, paddedNumParticles, "customNonbondedParameters", true);
    if (force.getNumGlobalParameters() > 0)
        globals.initialize(cc, force.getNumGlobalParameters(), "customNonbondedGlobals");
    // Rows beyond numParticles (padding) keep their initial zero values.
    vector > paramVector(paddedNumParticles, vector(numParams, 0));
    vector > exclusionList(numParticles);
    for (int i = 0; i < numParticles; i++) {
        vector parameters;
        force.getParticleParameters(i, parameters);
        paramVector[i].resize(parameters.size());
        for (int j = 0; j < (int) parameters.size(); j++)
            paramVector[i][j] = (float) parameters[j];
        // Every particle is listed in its own exclusion list.
        exclusionList[i].push_back(i);
    }
    for (int i = 0; i < force.getNumExclusions(); i++) {
        int particle1, particle2;
        force.getExclusionParticles(i, particle1, particle2);
        exclusionList[particle1].push_back(particle2);
        exclusionList[particle2].push_back(particle1);
    }
    params->setParameterValues(paramVector);

    // Record the tabulated functions.

    map functions;
    vector > functionDefinitions;
    vector functionList;
    vector tableTypes;
    stringstream tableArgs;
    tabulatedFunctionArrays.resize(force.getNumTabulatedFunctions());
    for (int i = 0; i < force.getNumTabulatedFunctions(); i++) {
        functionList.push_back(&force.getTabulatedFunction(i));
        string name = force.getTabulatedFunctionName(i);
        // Remember the update count so copyParametersToContext() can detect later changes.
        tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount();
        string arrayName = prefix+"table"+cc.intToString(i);
        functionDefinitions.push_back(make_pair(name, arrayName));
        functions[name] = cc.getExpressionUtilities().getFunctionPlaceholder(force.getTabulatedFunction(i));
        int width;
        vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width);
        tabulatedFunctionArrays[i].initialize(cc, f.size(), "TabulatedFunction");
        tabulatedFunctionArrays[i].upload(f);
        // Without interaction groups the table is registered with the shared nonbonded
        // utilities; with groups it is passed to the group kernel through tableTypes.
        if (force.getNumInteractionGroups() == 0)
            cc.getNonbondedUtilities().addArgument(ComputeParameterInfo(tabulatedFunctionArrays[i], arrayName, "float", width));
        if (width == 1)
            tableTypes.push_back("float");
        else
            tableTypes.push_back("float"+cc.intToString(width));
        tableArgs << ", GLOBAL const float";
        if (width > 1)
            tableArgs << width;
        tableArgs << "* RESTRICT " << arrayName;
    }

    // Record information for the expressions.

    globalParamNames.resize(force.getNumGlobalParameters());
    globalParamValues.resize(force.getNumGlobalParameters());
    for (int i = 0; i < force.getNumGlobalParameters(); i++) {
        globalParamNames[i] = force.getGlobalParameterName(i);
        globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i);
    }
    if (globals.isInitialized())
        globals.upload(globalParamValues);
    bool useCutoff = (force.getNonbondedMethod() != CustomNonbondedForce::NoCutoff);
    bool usePeriodic = (force.getNonbondedMethod() != CustomNonbondedForce::NoCutoff && force.getNonbondedMethod() != CustomNonbondedForce::CutoffNonPeriodic);
    Lepton::ParsedExpression energyExpression = Lepton::Parser::parse(force.getEnergyFunction(), functions).optimize();
    // The force term is the derivative of the energy with respect to r.
    Lepton::ParsedExpression forceExpression = energyExpression.differentiate("r").optimize();
    // Keys are the statement prefixes emitted in front of each generated expression.
    map forceExpressions;
    forceExpressions["real customEnergy = "] = energyExpression;
    forceExpressions["tempForce -= "] = forceExpression;

    // Record which per-particle parameters and computed values appear in the energy expression.

    if (force.getNumComputedValues() > 0)
        computedValues = new ComputeParameterSet(cc, force.getNumComputedValues(), paddedNumParticles, "customNonbondedComputedValues", true);
    for (int i = 0; i < force.getNumPerParticleParameters(); i++) {
        string name = force.getPerParticleParameterName(i);
        // A parameter is referenced in the expression as <name>1 or <name>2.
        if (usesVariable(energyExpression, name+"1") || usesVariable(energyExpression, name+"2")) {
            paramNames.push_back(name);
            paramBuffers.push_back(params->getParameterInfos()[i]);
        }
    }
    for (int i = 0; i < force.getNumComputedValues(); i++) {
        string name, expression;
        force.getComputedValueParameters(i, name, expression);
        if (usesVariable(energyExpression, name+"1") || usesVariable(energyExpression, name+"2")) {
            computedValueNames.push_back(name);
            computedValueBuffers.push_back(computedValues->getParameterInfos()[i]);
        }
    }

    // Create the kernels.

    vector > variables;
    ExpressionTreeNode rnode(new Operation::Variable("r"));
    variables.push_back(make_pair(rnode, "r"));
    variables.push_back(make_pair(ExpressionTreeNode(new Operation::Square(), rnode), "r2"));
    variables.push_back(make_pair(ExpressionTreeNode(new Operation::Reciprocal(), rnode), "invR"));
    // Buffers are numbered from 1 in the order they were recorded above.
    for (int i = 0; i < paramNames.size(); i++) {
        variables.push_back(makeVariable(paramNames[i]+"1", "((real) "+prefix+"params"+cc.intToString(i+1)+"1)"));
        variables.push_back(makeVariable(paramNames[i]+"2", "((real) "+prefix+"params"+cc.intToString(i+1)+"2)"));
    }
    for (int i = 0; i < computedValueNames.size(); i++) {
        variables.push_back(makeVariable(computedValueNames[i]+"1", prefix+"values"+cc.intToString(i+1)+"1"));
        variables.push_back(makeVariable(computedValueNames[i]+"2", prefix+"values"+cc.intToString(i+1)+"2"));
    }
    for (int i = 0; i < force.getNumGlobalParameters(); i++) {
        const string& name = force.getGlobalParameterName(i);
        string value = "globals["+cc.intToString(i)+"]";
        variables.push_back(makeVariable(name, prefix+value));
    }
    for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) {
        string paramName = force.getEnergyParameterDerivativeName(i);
        string derivVariable = cc.getNonbondedUtilities().addEnergyParameterDerivative(paramName);
        Lepton::ParsedExpression derivExpression = energyExpression.differentiate(paramName).optimize();
        forceExpressions[derivVariable+" += interactionScale*switchValue*"] = derivExpression;
    }
    stringstream compute;
    compute << cc.getExpressionUtilities().createExpressions(forceExpressions, variables, functionList, functionDefinitions, prefix+"temp");
    map replacements;
    replacements["COMPUTE_FORCE"] = compute.str();
    replacements["USE_SWITCH"] = (useCutoff && force.getUseSwitchingFunction() ? "1" : "0");
    if (force.getUseSwitchingFunction()) {
        // Compute the switching coefficients.

        replacements["SWITCH_CUTOFF"] = cc.doubleToString(force.getSwitchingDistance());
        replacements["SWITCH_C3"] = cc.doubleToString(10/pow(force.getSwitchingDistance()-force.getCutoffDistance(), 3.0));
        replacements["SWITCH_C4"] = cc.doubleToString(15/pow(force.getSwitchingDistance()-force.getCutoffDistance(), 4.0));
        replacements["SWITCH_C5"] = cc.doubleToString(6/pow(force.getSwitchingDistance()-force.getCutoffDistance(), 5.0));
    }
    string source = cc.replaceStrings(CommonKernelSources::customNonbonded, replacements);
    // With interaction groups a dedicated kernel is built; otherwise the interaction
    // is registered with the shared nonbonded utilities.
    if (force.getNumInteractionGroups() > 0)
        initInteractionGroups(force, source, tableTypes);
    else {
        cc.getNonbondedUtilities().addInteraction(useCutoff, usePeriodic, true, force.getCutoffDistance(), exclusionList, source, force.getForceGroup(), numParticles > 2000);
        for (int i = 0; i < paramBuffers.size(); i++)
            cc.getNonbondedUtilities().addParameter(ComputeParameterInfo(paramBuffers[i].getArray(), prefix+"params"+cc.intToString(i+1),
                    paramBuffers[i].getComponentType(), paramBuffers[i].getNumComponents()));
        for (int i = 0; i < computedValueBuffers.size(); i++)
            cc.getNonbondedUtilities().addParameter(ComputeParameterInfo(computedValueBuffers[i].getArray(), prefix+"values"+cc.intToString(i+1),
                    computedValueBuffers[i].getComponentType(), computedValueBuffers[i].getNumComponents()));
        if (globals.isInitialized()) {
            globals.upload(globalParamValues);
            cc.getNonbondedUtilities().addArgument(ComputeParameterInfo(globals, prefix+"globals", "float", 1));
        }
    }
    if (force.getNumComputedValues() > 0) {
        // Create the kernel to calculate computed values.

        // Each computed value gets a "global_values<k>" kernel argument and a
        // "local_values<k>" local variable, numbered from 1.
        stringstream valuesSource, args;
        for (int i = 0; i < computedValues->getParameterInfos().size(); i++) {
            ComputeParameterInfo& buffer = computedValues->getParameterInfos()[i];
            string valueName = "values"+cc.intToString(i+1);
            if (i > 0)
                args << ", ";
            args << "GLOBAL " << buffer.getType() << "* RESTRICT global_" << valueName;
            valuesSource << buffer.getType() << " local_" << valueName << ";\n";
        }
        if (force.getNumGlobalParameters() > 0)
            args << ", GLOBAL const float* globals";
        for (int i = 0; i < params->getParameterInfos().size(); i++) {
            ComputeParameterInfo& buffer = params->getParameterInfos()[i];
            string paramName = "params"+cc.intToString(i+1);
            args << ", GLOBAL const " << buffer.getType() << "* RESTRICT " << paramName;
        }
        // These `variables` and `replacements` shadow the outer ones within this block.
        map variables;
        for (int i = 0; i < force.getNumPerParticleParameters(); i++)
            variables[force.getPerParticleParameterName(i)] = "params"+params->getParameterSuffix(i, "[index]");
        for (int i = 0; i < force.getNumGlobalParameters(); i++)
            variables[force.getGlobalParameterName(i)] = "globals["+cc.intToString(i)+"]";
        for (int i = 0; i < force.getNumComputedValues(); i++) {
            string name, expression;
            force.getComputedValueParameters(i, name, expression);
            // The value's name is added to `variables` before its own expression is
            // generated, and stays available to the values processed after it.
            variables[name] = "local_values"+computedValues->getParameterSuffix(i);
            map valueExpressions;
            valueExpressions["local_values"+computedValues->getParameterSuffix(i)+" = "] = Lepton::Parser::parse(expression, functions).optimize();
            valuesSource << cc.getExpressionUtilities().createExpressions(valueExpressions, variables, functionList, functionDefinitions, "value"+cc.intToString(i)+"_temp");
        }
        for (int i = 0; i < (int) computedValues->getParameterInfos().size(); i++) {
            string valueName = "values"+cc.intToString(i+1);
            valuesSource << "global_" << valueName << "[index] = local_" << valueName << ";\n";
        }
        map replacements;
        replacements["PARAMETER_ARGUMENTS"] = args.str()+tableArgs.str();
        replacements["COMPUTE_VALUES"] = valuesSource.str();
        map defines;
        defines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms());
        ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::customNonbondedComputedValues, replacements), defines);
        computedValuesKernel = program->createKernel("computePerParticleValues");
        // Argument order mirrors the order in which `args` and `tableArgs` were assembled.
        for (auto& value : computedValues->getParameterInfos())
            computedValuesKernel->addArg(value.getArray());
        if (globals.isInitialized())
            computedValuesKernel->addArg(globals);
        for (auto& parameter : params->getParameterInfos())
            computedValuesKernel->addArg(parameter.getArray());
        for (auto& function : tabulatedFunctionArrays)
            computedValuesKernel->addArg(function);
    }
    info = new ForceInfo(force);
    cc.addForce(info);

    // Record information for the long range correction.

    // Only the context with index 0 sets up the correction; it keeps its own copy of the force.
    if (force.getNonbondedMethod() == CustomNonbondedForce::CutoffPeriodic && force.getUseLongRangeCorrection() && cc.getContextIndex() == 0) {
        forceCopy = new CustomNonbondedForce(force);
        longRangeCorrectionData = CustomNonbondedForceImpl::prepareLongRangeCorrection(force, cc.getThreadPool().getNumThreads());
        cc.addPostComputation(new LongRangePostComputation(cc, longRangeCoefficient, longRangeCoefficientDerivs, forceCopy));
        // The coefficient itself is computed later, from execute().
        hasInitializedLongRangeCorrection = false;
    }
    else {
        longRangeCoefficient = 0.0;
        hasInitializedLongRangeCorrection = true;
    }
}

/**
 * Build the tile data and kernels used when the force defines interaction groups.
 * The body continues on the following lines of the file.
 *
 * @param force              the force whose interaction groups and exclusions are read
 * @param interactionSource  source text substituted for COMPUTE_INTERACTION in the group kernel
 * @param tableTypes         one element type string per tabulated function
 */
void CommonCalcCustomNonbondedForceKernel::initInteractionGroups(const CustomNonbondedForce& force, const string& interactionSource, const vector& tableTypes) {
    // Process groups to form tiles.

    vector > atomLists;
    vector > tiles;
    vector tileGroup;
    vector > duplicateAtomsForGroup;
    for (int group = 0; group < force.getNumInteractionGroups(); group++) {
        // Get the list of atoms in this group and sort them.
// (CommonCalcCustomNonbondedForceKernel::initInteractionGroups, continued: per-group loop body.)
// NOTE(review): template arguments are missing throughout this copy, and several statements
// further down are cut off mid-expression; they are marked where they occur.
        set set1, set2;
        force.getInteractionGroupParameters(group, set1, set2);
        vector atoms1, atoms2;
        atoms1.insert(atoms1.begin(), set1.begin(), set1.end());
        atoms2.insert(atoms2.begin(), set2.begin(), set2.end());
        sort(atoms1.begin(), atoms1.end());
        sort(atoms2.begin(), atoms2.end());
        // Atoms present in both sets of this group, kept sorted for binary_search below.
        duplicateAtomsForGroup.push_back(vector());
        set_intersection(set1.begin(), set1.end(), set2.begin(), set2.end(),
                inserter(duplicateAtomsForGroup[group], duplicateAtomsForGroup[group].begin()));
        sort(duplicateAtomsForGroup[group].begin(), duplicateAtomsForGroup[group].end());

        // Find how many tiles we will create for this group.

        // Tile width is capped at 32 and at the size of the smaller set; an empty set skips the group.
        int tileWidth = min(min(32, (int) atoms1.size()), (int) atoms2.size());
        if (tileWidth == 0)
            continue;
        int numBlocks1 = (atoms1.size()+tileWidth-1)/tileWidth;
        int numBlocks2 = (atoms2.size()+tileWidth-1)/tileWidth;

        // Add the tiles.

        // Tile entries are indices into atomLists: blocks of set 1 are appended first,
        // followed by blocks of set 2 (see "Add the atom lists" below).
        int firstTile = tiles.size();
        for (int i = 0; i < numBlocks1; i++)
            for (int j = 0; j < numBlocks2; j++) {
                tiles.push_back(make_pair(atomLists.size()+i, atomLists.size()+numBlocks1+j));
                tileGroup.push_back(group);
            }

        // Add the atom lists.

        for (int i = 0; i < numBlocks1; i++) {
            vector atoms;
            int first = i*tileWidth;
            int last = min((i+1)*tileWidth, (int) atoms1.size());
            for (int j = first; j < last; j++)
                atoms.push_back(atoms1[j]);
            atomLists.push_back(atoms);
        }
        for (int i = 0; i < numBlocks2; i++) {
            vector atoms;
            int first = i*tileWidth;
            int last = min((i+1)*tileWidth, (int) atoms2.size());
            for (int j = first; j < last; j++)
                atoms.push_back(atoms2[j]);
            atomLists.push_back(atoms);
        }
    }

    // Build a lookup table for quickly identifying excluded interactions.

    vector > exclusions(force.getNumParticles());
    for (int i = 0; i < force.getNumExclusions(); i++) {
        int p1, p2;
        force.getExclusionParticles(i, p1, p2);
        exclusions[p1].insert(p2);
        exclusions[p2].insert(p1);
    }

    // Build the exclusion flags for each tile.  While we're at it, filter out tiles
    // where all interactions are excluded, and sort the tiles by size.

    vector > exclusionFlags(tiles.size());
    vector > tileOrder;
    for (int tile = 0; tile < tiles.size(); tile++) {
        bool swapped = false;
        if (atomLists[tiles[tile].first].size() < atomLists[tiles[tile].second].size()) {
            // For efficiency, we want the first axis to be the larger one.

            int swap = tiles[tile].first;
            tiles[tile].first = tiles[tile].second;
            tiles[tile].second = swap;
            swapped = true;
        }
        vector& atoms1 = atomLists[tiles[tile].first];
        vector& atoms2 = atomLists[tiles[tile].second];
        vector& duplicateAtoms = duplicateAtomsForGroup[tileGroup[tile]];
        vector& flags = exclusionFlags[tile];
        // NOTE(review): the next statement is cut off after "(1LL<" in this copy. The rest of the
        // resize() call, the loops over the tile's atoms and the start of the duplicate test are
        // missing -- restore from upstream.
        flags.resize(atoms1.size(), (int) (1LL< a2) == swapped && a1IsDuplicate && binary_search(duplicateAtoms.begin(), duplicateAtoms.end(), a2))
                    isExcluded = true; // Both atoms are in both sets, so skip duplicate interactions.
                if (isExcluded) {
                    // NOTE(review): the next statement is cut off after "(1<" in this copy. The rest of
                    // the flag update, the tile filtering/sorting and the declaration of tileSetStart
                    // are missing -- restore from upstream.
                    flags[i] &= -1-(1< tileSetStart;
    tileSetStart.push_back(0);
    // Walk the ordered tiles, starting a new tile set whenever adding the next tile's
    // first-axis atom count would push the running total above 32.
    int tileSetSize = 0;
    for (int i = 0; i < tileOrder.size(); i++) {
        int tile = tileOrder[i].second;
        int size = atomLists[tiles[tile].first].size();
        if (tileSetSize+size > 32) {
            tileSetStart.push_back(i);
            tileSetSize = 0;
        }
        tileSetSize += size;
    }
    tileSetStart.push_back(tileOrder.size());

    // Build the data structures.

    int numTileSets = tileSetStart.size()-1;
    vector groupData;
    for (int tileSet = 0; tileSet < numTileSets; tileSet++) {
        int indexInTileSet = 0;
        int minSize = 0;
        if (cc.getSIMDWidth() < 32) {
            // We need to include a barrier inside the inner loop, so ensure that all
            // threads will loop the same number of times.

            for (int i = tileSetStart[tileSet]; i < tileSetStart[tileSet+1]; i++)
                minSize = max(minSize, (int) atomLists[tiles[tileOrder[i].second].first].size());
        }
        for (int i = tileSetStart[tileSet]; i < tileSetStart[tileSet+1]; i++) {
            int tile = tileOrder[i].second;
            vector& atoms1 = atomLists[tiles[tile].first];
            vector& atoms2 = atomLists[tiles[tile].second];
            // Low 16 bits: start index within the tile set; high bits: end index.
            int range = indexInTileSet + ((indexInTileSet+max(minSize, (int) atoms1.size()))<<16);
            // NOTE(review): the next two statements are cut off in this copy (after "(1<" and after
            // "flags<"). The per-atom loop that fills groupData, the padding of each tile set and the
            // initialize() call for interactionGroupData are missing -- restore from upstream.
            int allFlags = (1< 0 ? exclusionFlags[tile][j] : allFlags);
                groupData.push_back(mm_int4(a1, a2, range, flags<(cc, groupData.size(), "interactionGroupData");
    interactionGroupData.upload(groupData);
    numGroupTiles.initialize(cc, 1, "numGroupTiles");

    // Allocate space for a neighbor list, if necessary.

    // filteredGroupData doubles as the marker for "a neighbor list exists"; execute() tests
    // filteredGroupData.isInitialized().
    if (force.getNonbondedMethod() != CustomNonbondedForce::NoCutoff && groupData.size() > cc.getNumThreadBlocks()) {
        filteredGroupData.initialize(cc, groupData.size(), "filteredGroupData");
        interactionGroupData.copyTo(filteredGroupData);
        int numTiles = groupData.size()/32;
        numGroupTiles.upload(&numTiles);
    }

    // Create the kernel.

    hasParamDerivs = (force.getNumEnergyParameterDerivatives() > 0);
    map replacements;
    replacements["COMPUTE_INTERACTION"] = interactionSource;
    const string suffixes[] = {"x", "y", "z", "w"};
    stringstream localData;
    int localDataSize = 0;
    for (int i = 0; i < paramBuffers.size(); i++) {
        // NOTE(review): the next statement is cut off after "localData<" in this copy. The code that
        // builds the local-data declarations, kernel arguments and parameter load/store text is
        // missing up to "& allParamDerivNames" -- restore from upstream.
        localData<& allParamDerivNames = cc.getEnergyParamDerivNames();
    int numDerivs = allParamDerivNames.size();
    for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) {
        string paramName = force.getEnergyParameterDerivativeName(i);
        string derivVariable = cc.getNonbondedUtilities().addEnergyParameterDerivative(paramName);
        // NOTE(review): the next statement is cut off after "mixed " in this copy. The rest of this
        // loop, the remaining replacements and the declaration of `defines` are missing -- restore
        // from upstream.
        initDerivs<<"mixed "< defines;
    if (force.getNonbondedMethod() != CustomNonbondedForce::NoCutoff)
        defines["USE_CUTOFF"] = "1";
    if (force.getNonbondedMethod() == CustomNonbondedForce::CutoffPeriodic)
        defines["USE_PERIODIC"] = "1";
    // The same max(32, thread block size) value is recomputed in execute() as the launch block size.
    int localMemorySize = max(32, cc.getNonbondedUtilities().getForceThreadBlockSize());
    defines["LOCAL_MEMORY_SIZE"] = cc.intToString(localMemorySize);
    defines["WARPS_IN_BLOCK"] = cc.intToString(localMemorySize/32);
    double cutoff = force.getCutoffDistance();
    defines["CUTOFF_SQUARED"] = cc.doubleToString(cutoff*cutoff);
    double paddedCutoff = cc.getNonbondedUtilities().padCutoff(cutoff);
    defines["PADDED_CUTOFF_SQUARED"] = cc.doubleToString(paddedCutoff*paddedCutoff);
    defines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms());
    defines["TILE_SIZE"] = "32";
    defines["NUM_TILES"] = cc.intToString(numTileSets);
    // Give each context a contiguous share of the tile sets, split by context index.
    int numContexts = cc.getNumContexts();
    int startIndex = cc.getContextIndex()*numTileSets/numContexts;
    int endIndex = (cc.getContextIndex()+1)*numTileSets/numContexts;
    defines["FIRST_TILE"] = cc.intToString(startIndex);
    defines["LAST_TILE"] = cc.intToString(endIndex);
    if ((localDataSize/4)%2 == 0 && !cc.getUseDoublePrecision())
        defines["PARAMETER_SIZE_IS_EVEN"] = "1";
    ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::customNonbondedGroups, replacements), defines);
    // Kernel arguments are not added here; execute() adds them on its first call.
    interactionGroupKernel = program->createKernel("computeInteractionGroups");
    prepareNeighborListKernel = program->createKernel("prepareToBuildNeighborList");
    buildNeighborListKernel = program->createKernel("buildNeighborList");
    numGroupThreadBlocks = cc.getNonbondedUtilities().getNumForceThreadBlocks();
}

/**
 * Per-step work for a CustomNonbondedForce: refresh global parameters, schedule the
 * long range correction when needed, evaluate computed values and, when interaction
 * groups are in use, launch the group kernels.
 * The body continues on the following lines of the file.
 */
double CommonCalcCustomNonbondedForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) {
    useNeighborList = (filteredGroupData.isInitialized() && cc.getNonbondedUtilities().getUseCutoff());
    if (useNeighborList && cc.getContextIndex() > 0) {
        // When using a neighbor list, run the whole calculation on a single device.
// (CommonCalcCustomNonbondedForceKernel::execute, continued: contexts other than index 0 stop here.)
        return 0.0;
    }
    ContextSelector selector(cc);
    bool recomputeLongRangeCorrection = !hasInitializedLongRangeCorrection;
    if (globals.isInitialized()) {
        // Re-read every global parameter; upload only if at least one value changed.
        bool changed = false;
        for (int i = 0; i < (int) globalParamNames.size(); i++) {
            float value = (float) context.getParameter(globalParamNames[i]);
            if (value != globalParamValues[i])
                changed = true;
            globalParamValues[i] = value;
        }
        if (changed) {
            globals.upload(globalParamValues);
            // forceCopy is only non-null when a long range correction was set up in initialize().
            if (forceCopy != NULL)
                recomputeLongRangeCorrection = true;
        }
    }
    if (recomputeLongRangeCorrection) {
        // Schedule the recomputation only when its result is needed now; otherwise leave the
        // flag cleared so a later call retries.
        if (includeEnergy || forceCopy->getNumEnergyParameterDerivatives() > 0) {
            cc.getWorkThread().addTask(new LongRangeTask(cc, context.getOwner(), longRangeCorrectionData, longRangeCoefficient, longRangeCoefficientDerivs, forceCopy));
            hasInitializedLongRangeCorrection = true;
        }
        else
            hasInitializedLongRangeCorrection = false;
    }
    if (computedValues != NULL)
        computedValuesKernel->execute(cc.getNumAtoms());
    if (interactionGroupData.isInitialized()) {
        if (!hasInitializedKernel) {
            // First call only: add the kernel arguments. Positions matter, because
            // setPeriodicBoxArgs() below fills slots 6-10 (and 5-9 of the build kernel) by index.
            hasInitializedKernel = true;
            interactionGroupKernel->addArg(cc.getLongForceBuffer());
            interactionGroupKernel->addArg(cc.getEnergyBuffer());
            interactionGroupKernel->addArg(cc.getPosq());
            interactionGroupKernel->addArg((useNeighborList ? filteredGroupData : interactionGroupData));
            interactionGroupKernel->addArg(numGroupTiles);
            interactionGroupKernel->addArg((int) useNeighborList);
            for (int i = 0; i < 5; i++)
                interactionGroupKernel->addArg(); // Periodic box information will be set just before it is executed.
            interactionGroupKernel->addArg((int) cc.getEnergyParamDerivNames().size());
            for (auto& buffer : paramBuffers)
                interactionGroupKernel->addArg(buffer.getArray());
            for (auto& buffer : computedValueBuffers)
                interactionGroupKernel->addArg(buffer.getArray());
            for (auto& function : tabulatedFunctionArrays)
                interactionGroupKernel->addArg(function);
            if (globals.isInitialized())
                interactionGroupKernel->addArg(globals);
            if (hasParamDerivs)
                interactionGroupKernel->addArg(cc.getEnergyParamDerivBuffer());
            if (useNeighborList) {
                // Initialize kernels for building the interaction group neighbor list.

                prepareNeighborListKernel->addArg(cc.getNonbondedUtilities().getRebuildNeighborList());
                prepareNeighborListKernel->addArg(numGroupTiles);
                buildNeighborListKernel->addArg(cc.getNonbondedUtilities().getRebuildNeighborList());
                buildNeighborListKernel->addArg(numGroupTiles);
                buildNeighborListKernel->addArg(cc.getPosq());
                buildNeighborListKernel->addArg(interactionGroupData);
                buildNeighborListKernel->addArg(filteredGroupData);
                for (int i = 0; i < 5; i++)
                    buildNeighborListKernel->addArg(); // Periodic box information will be set just before it is executed.
            }
        }
        int forceThreadBlockSize = max(32, cc.getNonbondedUtilities().getForceThreadBlockSize());
        if (useNeighborList) {
            // Rebuild the neighbor list, if necessary.

            setPeriodicBoxArgs(cc, buildNeighborListKernel, 5);
            prepareNeighborListKernel->execute(1, 1);
            buildNeighborListKernel->execute(numGroupThreadBlocks*forceThreadBlockSize, forceThreadBlockSize);
        }
        setPeriodicBoxArgs(cc, interactionGroupKernel, 6);
        interactionGroupKernel->execute(numGroupThreadBlocks*forceThreadBlockSize, forceThreadBlockSize);
    }
    // No energy is returned directly; the energy buffer was handed to the kernel above.
    return 0;
}

/**
 * Copy changed per-particle parameters and tabulated functions of `force` into the
 * existing device arrays, refreshing the long range correction data if one is in use.
 * The body continues on the following lines of the file.
 *
 * Throws OpenMMException if the number of particles differs from cc.getNumAtoms().
 *
 * NOTE(review): template arguments are missing from the container declarations in
 * this copy (e.g. `vector > paramVector`) -- restore from upstream.
 */
void CommonCalcCustomNonbondedForceKernel::copyParametersToContext(ContextImpl& context, const CustomNonbondedForce& force) {
    ContextSelector selector(cc);
    int numParticles = force.getNumParticles();
    if (numParticles != cc.getNumAtoms())
        throw OpenMMException("updateParametersInContext: The number of particles has changed");

    // Record the per-particle parameters.

    int paddedNumParticles = cc.getPaddedNumAtoms();
    int numParams = force.getNumPerParticleParameters();
    // Rows beyond numParticles (padding) keep their initial zero values.
    vector > paramVector(paddedNumParticles, vector(numParams, 0));
    vector parameters;
    for (int i = 0; i < numParticles; i++) {
        force.getParticleParameters(i, parameters);
        paramVector[i].resize(parameters.size());
        for (int j = 0; j < (int) parameters.size(); j++)
            paramVector[i][j] = (float) parameters[j];
    }
    params->setParameterValues(paramVector);

    // If necessary, recompute the long range correction.

    if (forceCopy != NULL) {
        longRangeCorrectionData = CustomNonbondedForceImpl::prepareLongRangeCorrection(force, cc.getThreadPool().getNumThreads());
        CustomNonbondedForceImpl::calcLongRangeCorrection(force, longRangeCorrectionData, context.getOwner(), longRangeCoefficient, longRangeCoefficientDerivs, cc.getThreadPool());
        // Clearing the flag makes the next execute() consider the correction again.
        hasInitializedLongRangeCorrection = false;
        *forceCopy = force;
    }

    // See if any tabulated functions have changed.
for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { string name = force.getTabulatedFunctionName(i); if (force.getTabulatedFunction(i).getUpdateCount() != tabulatedFunctionUpdateCount[name]) { tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].upload(f); } } // Mark that the current reordering may be invalid. cc.invalidateMolecules(info); } class CommonCalcGBSAOBCForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const GBSAOBCForce& force) : force(force) { } bool areParticlesIdentical(int particle1, int particle2) { double charge1, charge2, radius1, radius2, scale1, scale2; force.getParticleParameters(particle1, charge1, radius1, scale1); force.getParticleParameters(particle2, charge2, radius2, scale2); return (charge1 == charge2 && radius1 == radius2 && scale1 == scale2); } private: const GBSAOBCForce& force; }; void CommonCalcGBSAOBCForceKernel::initialize(const System& system, const GBSAOBCForce& force) { ContextSelector selector(cc); if (cc.getNumContexts() > 1) throw OpenMMException("GBSAOBCForce does not support using multiple devices"); int forceIndex; for (forceIndex = 0; forceIndex < system.getNumForces() && &system.getForce(forceIndex) != &force; ++forceIndex) ; string prefix = "obc"+cc.intToString(forceIndex)+"_"; NonbondedUtilities& nb = cc.getNonbondedUtilities(); params.initialize(cc, cc.getPaddedNumAtoms(), "gbsaObcParams"); int elementSize = (cc.getUseDoublePrecision() ? 
sizeof(double) : sizeof(float)); charges.initialize(cc, cc.getPaddedNumAtoms(), elementSize, "gbsaObcCharges"); bornRadii.initialize(cc, cc.getPaddedNumAtoms(), elementSize, "bornRadii"); obcChain.initialize(cc, cc.getPaddedNumAtoms(), elementSize, "obcChain"); bornSum.initialize(cc, cc.getPaddedNumAtoms(), "bornSum"); bornForce.initialize(cc, cc.getPaddedNumAtoms(), "bornForce"); cc.addAutoclearBuffer(bornSum); cc.addAutoclearBuffer(bornForce); vector chargeVec(cc.getPaddedNumAtoms()); vector paramsVector(cc.getPaddedNumAtoms(), mm_float2(1,1)); const double dielectricOffset = 0.009; for (int i = 0; i < force.getNumParticles(); i++) { double charge, radius, scalingFactor; force.getParticleParameters(i, charge, radius, scalingFactor); radius -= dielectricOffset; chargeVec[i] = charge; paramsVector[i] = mm_float2((float) radius, (float) (scalingFactor*radius)); } charges.upload(chargeVec, true); params.upload(paramsVector); prefactor = -ONE_4PI_EPS0*((1.0/force.getSoluteDielectric())-(1.0/force.getSolventDielectric())); surfaceAreaFactor = -6.0*4*M_PI*force.getSurfaceAreaEnergy(); bool useCutoff = (force.getNonbondedMethod() != GBSAOBCForce::NoCutoff); bool usePeriodic = (force.getNonbondedMethod() != GBSAOBCForce::NoCutoff && force.getNonbondedMethod() != GBSAOBCForce::CutoffNonPeriodic); cutoff = force.getCutoffDistance(); string source = CommonKernelSources::gbsaObc2; map replacements; replacements["CHARGE1"] = prefix+"charge1"; replacements["CHARGE2"] = prefix+"charge2"; replacements["OBC_PARAMS1"] = prefix+"obcParams1"; replacements["OBC_PARAMS2"] = prefix+"obcParams2"; replacements["BORN_FORCE1"] = prefix+"bornForce1"; replacements["BORN_FORCE2"] = prefix+"bornForce2"; source = cc.replaceStrings(source, replacements); nb.addInteraction(useCutoff, usePeriodic, false, cutoff, vector >(), source, force.getForceGroup()); nb.addParameter(ComputeParameterInfo(charges, prefix+"charge", "float", 1)); nb.addParameter(ComputeParameterInfo(params, prefix+"obcParams", 
"float", 2)); nb.addParameter(ComputeParameterInfo(bornForce, prefix+"bornForce", "mm_long", 1)); info = new ForceInfo(force); cc.addForce(info); } double CommonCalcGBSAOBCForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { ContextSelector selector(cc); NonbondedUtilities& nb = cc.getNonbondedUtilities(); bool deviceIsCpu = cc.getIsCPU(); if (!hasCreatedKernels) { // These Kernels cannot be created in initialize(), because the NonbondedUtilities has not been initialized yet then. hasCreatedKernels = true; maxTiles = (nb.getUseCutoff() ? nb.getInteractingTiles().getSize() : 0); int numAtomBlocks = cc.getPaddedNumAtoms()/32; map defines; if (nb.getUseCutoff()) defines["USE_CUTOFF"] = "1"; if (nb.getUsePeriodic()) defines["USE_PERIODIC"] = "1"; defines["CUTOFF_SQUARED"] = cc.doubleToString(cutoff*cutoff); defines["CUTOFF"] = cc.doubleToString(cutoff); defines["PREFACTOR"] = cc.doubleToString(prefactor); defines["SURFACE_AREA_FACTOR"] = cc.doubleToString(surfaceAreaFactor); defines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms()); defines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms()); defines["NUM_BLOCKS"] = cc.intToString(numAtomBlocks); defines["FORCE_WORK_GROUP_SIZE"] = cc.intToString(nb.getForceThreadBlockSize()); defines["TILE_SIZE"] = "32"; int numExclusionTiles = nb.getExclusionTiles().getSize(); defines["NUM_TILES_WITH_EXCLUSIONS"] = cc.intToString(numExclusionTiles); defines["FIRST_EXCLUSION_TILE"] = "0"; defines["LAST_EXCLUSION_TILE"] = cc.intToString(numExclusionTiles); string file; if (deviceIsCpu) file = CommonKernelSources::gbsaObc_cpu; else file = CommonKernelSources::gbsaObc; ComputeProgram program = cc.compileProgram(file, defines); computeBornSumKernel = program->createKernel("computeBornSum"); computeBornSumKernel->addArg(bornSum); computeBornSumKernel->addArg(cc.getPosq()); computeBornSumKernel->addArg(charges); computeBornSumKernel->addArg(params); if (nb.getUseCutoff()) { 
computeBornSumKernel->addArg(nb.getInteractingTiles()); computeBornSumKernel->addArg(nb.getInteractionCount()); for (int i = 0; i < 5; i++) computeBornSumKernel->addArg(); // The periodic box size arguments are set when the kernel is executed. computeBornSumKernel->addArg(maxTiles); computeBornSumKernel->addArg(nb.getBlockCenters()); computeBornSumKernel->addArg(nb.getBlockBoundingBoxes()); computeBornSumKernel->addArg(nb.getInteractingAtoms()); } else computeBornSumKernel->addArg(numAtomBlocks*(numAtomBlocks+1)/2); computeBornSumKernel->addArg(nb.getExclusionTiles()); force1Kernel = program->createKernel("computeGBSAForce1"); force1Kernel->addArg(cc.getLongForceBuffer()); force1Kernel->addArg(bornForce); force1Kernel->addArg(cc.getEnergyBuffer()); force1Kernel->addArg(cc.getPosq()); force1Kernel->addArg(charges); force1Kernel->addArg(bornRadii); force1Kernel->addArg(); // Whether to include energy. if (nb.getUseCutoff()) { force1Kernel->addArg(nb.getInteractingTiles()); force1Kernel->addArg(nb.getInteractionCount()); for (int i = 0; i < 5; i++) force1Kernel->addArg(); // The periodic box size arguments are set when the kernel is executed. 
force1Kernel->addArg(maxTiles); force1Kernel->addArg(nb.getBlockCenters()); force1Kernel->addArg(nb.getBlockBoundingBoxes()); force1Kernel->addArg(nb.getInteractingAtoms()); } else force1Kernel->addArg(numAtomBlocks*(numAtomBlocks+1)/2); force1Kernel->addArg(nb.getExclusionTiles()); program = cc.compileProgram(CommonKernelSources::gbsaObcReductions, defines); reduceBornSumKernel = program->createKernel("reduceBornSum"); reduceBornSumKernel->addArg(1.0f); reduceBornSumKernel->addArg(0.8f); reduceBornSumKernel->addArg(4.85f); reduceBornSumKernel->addArg(bornSum); reduceBornSumKernel->addArg(params); reduceBornSumKernel->addArg(bornRadii); reduceBornSumKernel->addArg(obcChain); reduceBornForceKernel = program->createKernel("reduceBornForce"); reduceBornForceKernel->addArg(bornForce); reduceBornForceKernel->addArg(cc.getEnergyBuffer()); reduceBornForceKernel->addArg(params); reduceBornForceKernel->addArg(bornRadii); reduceBornForceKernel->addArg(obcChain); } force1Kernel->setArg(6, (int) includeEnergy); if (nb.getUseCutoff()) { setPeriodicBoxArgs(cc, computeBornSumKernel, 6); setPeriodicBoxArgs(cc, force1Kernel, 9); if (maxTiles < nb.getInteractingTiles().getSize()) { maxTiles = nb.getInteractingTiles().getSize(); computeBornSumKernel->setArg(11, maxTiles); force1Kernel->setArg(14, maxTiles); } } computeBornSumKernel->execute(nb.getNumForceThreadBlocks()*nb.getForceThreadBlockSize(), nb.getForceThreadBlockSize()); reduceBornSumKernel->execute(cc.getPaddedNumAtoms()); force1Kernel->execute(nb.getNumForceThreadBlocks()*nb.getForceThreadBlockSize(), nb.getForceThreadBlockSize()); reduceBornForceKernel->execute(cc.getPaddedNumAtoms()); return 0.0; } void CommonCalcGBSAOBCForceKernel::copyParametersToContext(ContextImpl& context, const GBSAOBCForce& force) { // Make sure the new parameters are acceptable. 
ContextSelector selector(cc); int numParticles = force.getNumParticles(); if (numParticles != cc.getNumAtoms()) throw OpenMMException("updateParametersInContext: The number of particles has changed"); // Record the per-particle parameters. vector chargeVector(cc.getPaddedNumAtoms(), 0.0); vector paramsVector(cc.getPaddedNumAtoms()); const double dielectricOffset = 0.009; for (int i = 0; i < numParticles; i++) { double charge, radius, scalingFactor; force.getParticleParameters(i, charge, radius, scalingFactor); chargeVector[i] = charge; radius -= dielectricOffset; paramsVector[i] = mm_float2((float) radius, (float) (scalingFactor*radius)); } for (int i = numParticles; i < cc.getPaddedNumAtoms(); i++) paramsVector[i] = mm_float2(1,1); charges.upload(chargeVector, true); params.upload(paramsVector); // Mark that the current reordering may be invalid. cc.invalidateMolecules(info); } class CommonCalcCustomGBForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const CustomGBForce& force) : force(force) { } bool areParticlesIdentical(int particle1, int particle2) { thread_local static vector params1, params2; force.getParticleParameters(particle1, params1); force.getParticleParameters(particle2, params2); for (int i = 0; i < (int) params1.size(); i++) if (params1[i] != params2[i]) return false; return true; } int getNumParticleGroups() { return force.getNumExclusions(); } void getParticlesInGroup(int index, vector& particles) { int particle1, particle2; force.getExclusionParticles(index, particle1, particle2); particles.resize(2); particles[0] = particle1; particles[1] = particle2; } bool areGroupsIdentical(int group1, int group2) { return true; } private: const CustomGBForce& force; }; CommonCalcCustomGBForceKernel::~CommonCalcCustomGBForceKernel() { ContextSelector selector(cc); if (params != NULL) delete params; if (computedValues != NULL) delete computedValues; if (energyDerivs != NULL) delete energyDerivs; if (energyDerivChain != NULL) delete 
energyDerivChain; for (auto d : dValuedParam) delete d; } void CommonCalcCustomGBForceKernel::initialize(const System& system, const CustomGBForce& force) { ContextSelector selector(cc); if (cc.getNumContexts() > 1) throw OpenMMException("CustomGBForce does not support using multiple devices"); NonbondedUtilities& nb = cc.getNonbondedUtilities(); cutoff = force.getCutoffDistance(); bool useExclusionsForValue = false; numComputedValues = force.getNumComputedValues(); vector computedValueNames(numComputedValues); vector computedValueExpressions(numComputedValues); if (numComputedValues > 0) { CustomGBForce::ComputationType type; force.getComputedValueParameters(0, computedValueNames[0], computedValueExpressions[0], type); if (type == CustomGBForce::SingleParticle) throw OpenMMException("The first computed value for a CustomGBForce must be of type ParticlePair or ParticlePairNoExclusions."); useExclusionsForValue = (type == CustomGBForce::ParticlePair); for (int i = 1; i < numComputedValues; i++) { force.getComputedValueParameters(i, computedValueNames[i], computedValueExpressions[i], type); if (type != CustomGBForce::SingleParticle) throw OpenMMException("A CustomGBForce may only have one computed value of type ParticlePair or ParticlePairNoExclusions."); } } int forceIndex; for (forceIndex = 0; forceIndex < system.getNumForces() && &system.getForce(forceIndex) != &force; ++forceIndex) ; string prefix = "custom"+cc.intToString(forceIndex)+"_"; // Record parameters and exclusions. 
int numParticles = force.getNumParticles(); int paddedNumParticles = cc.getPaddedNumAtoms(); int numParams = force.getNumPerParticleParameters(); params = new ComputeParameterSet(cc, force.getNumPerParticleParameters(), paddedNumParticles, "customGBParameters", true); computedValues = new ComputeParameterSet(cc, numComputedValues, paddedNumParticles, "customGBComputedValues", true, cc.getUseDoublePrecision()); if (force.getNumGlobalParameters() > 0) globals.initialize(cc, force.getNumGlobalParameters(), "customGBGlobals"); vector > paramVector(paddedNumParticles, vector(numParams, 0)); vector > exclusionList(numParticles); for (int i = 0; i < numParticles; i++) { vector parameters; force.getParticleParameters(i, parameters); for (int j = 0; j < (int) parameters.size(); j++) paramVector[i][j] = (float) parameters[j]; exclusionList[i].push_back(i); } for (int i = 0; i < force.getNumExclusions(); i++) { int particle1, particle2; force.getExclusionParticles(i, particle1, particle2); exclusionList[particle1].push_back(particle2); exclusionList[particle2].push_back(particle1); } params->setParameterValues(paramVector); // Record the tabulated functions. 
map functions; vector > functionDefinitions; vector functionList; stringstream tableArgs; tabulatedFunctionArrays.resize(force.getNumTabulatedFunctions()); for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { functionList.push_back(&force.getTabulatedFunction(i)); string name = force.getTabulatedFunctionName(i); tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); string arrayName = prefix+"table"+cc.intToString(i); functionDefinitions.push_back(make_pair(name, arrayName)); functions[name] = cc.getExpressionUtilities().getFunctionPlaceholder(force.getTabulatedFunction(i)); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].initialize(cc, f.size(), "TabulatedFunction"); tabulatedFunctionArrays[i].upload(f); nb.addArgument(ComputeParameterInfo(tabulatedFunctionArrays[i], arrayName, "float", width)); tableArgs << ", GLOBAL const float"; if (width > 1) tableArgs << width; tableArgs << "* RESTRICT " << arrayName; } // Record the global parameters. globalParamNames.resize(force.getNumGlobalParameters()); globalParamValues.resize(force.getNumGlobalParameters()); for (int i = 0; i < force.getNumGlobalParameters(); i++) { globalParamNames[i] = force.getGlobalParameterName(i); globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i); } if (globals.isInitialized()) globals.upload(globalParamValues); // Record derivatives of expressions needed for the chain rule terms. 
vector > valueGradientExpressions(numComputedValues); vector > valueDerivExpressions(numComputedValues); vector > valueParamDerivExpressions(numComputedValues); needParameterGradient = false; for (int i = 0; i < numComputedValues; i++) { Lepton::ParsedExpression ex = Lepton::Parser::parse(computedValueExpressions[i], functions).optimize(); if (i > 0) { valueGradientExpressions[i].push_back(ex.differentiate("x").optimize()); valueGradientExpressions[i].push_back(ex.differentiate("y").optimize()); valueGradientExpressions[i].push_back(ex.differentiate("z").optimize()); if (!isZeroExpression(valueGradientExpressions[i][0]) || !isZeroExpression(valueGradientExpressions[i][1]) || !isZeroExpression(valueGradientExpressions[i][2])) needParameterGradient = true; for (int j = 0; j < i; j++) valueDerivExpressions[i].push_back(ex.differentiate(computedValueNames[j]).optimize()); } for (int j = 0; j < force.getNumEnergyParameterDerivatives(); j++) valueParamDerivExpressions[i].push_back(ex.differentiate(force.getEnergyParameterDerivativeName(j)).optimize()); } vector > energyDerivExpressions(force.getNumEnergyTerms()); vector > energyParamDerivExpressions(force.getNumEnergyTerms()); vector needChainForValue(numComputedValues, false); for (int i = 0; i < force.getNumEnergyTerms(); i++) { string expression; CustomGBForce::ComputationType type; force.getEnergyTermParameters(i, expression, type); Lepton::ParsedExpression ex = Lepton::Parser::parse(expression, functions).optimize(); for (int j = 0; j < numComputedValues; j++) { if (type == CustomGBForce::SingleParticle) { energyDerivExpressions[i].push_back(ex.differentiate(computedValueNames[j]).optimize()); if (!isZeroExpression(energyDerivExpressions[i].back())) needChainForValue[j] = true; } else { energyDerivExpressions[i].push_back(ex.differentiate(computedValueNames[j]+"1").optimize()); if (!isZeroExpression(energyDerivExpressions[i].back())) needChainForValue[j] = true; 
energyDerivExpressions[i].push_back(ex.differentiate(computedValueNames[j]+"2").optimize()); if (!isZeroExpression(energyDerivExpressions[i].back())) needChainForValue[j] = true; } } for (int j = 0; j < force.getNumEnergyParameterDerivatives(); j++) energyParamDerivExpressions[i].push_back(ex.differentiate(force.getEnergyParameterDerivativeName(j)).optimize()); } bool deviceIsCpu = cc.getIsCPU(); int elementSize = (cc.getUseDoublePrecision() ? sizeof(double) : sizeof(float)); valueBuffers.initialize(cc, cc.getPaddedNumAtoms(), "customGBValueBuffers"); longEnergyDerivs.initialize(cc, numComputedValues*cc.getPaddedNumAtoms(), "customGBLongEnergyDerivatives"); energyDerivs = new ComputeParameterSet(cc, numComputedValues, cc.getPaddedNumAtoms(), "customGBEnergyDerivatives", true); cc.addAutoclearBuffer(valueBuffers); energyDerivChain = new ComputeParameterSet(cc, numComputedValues, cc.getPaddedNumAtoms(), "customGBEnergyDerivativeChain", true); needEnergyParamDerivs = (force.getNumEnergyParameterDerivatives() > 0); dValue0dParam.resize(force.getNumEnergyParameterDerivatives()); for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { dValuedParam.push_back(new ComputeParameterSet(cc, numComputedValues, cc.getPaddedNumAtoms(), "dValuedParam", true, cc.getUseDoublePrecision())); dValue0dParam[i].initialize(cc, cc.getPaddedNumAtoms(), "dValue0dParam"); cc.addAutoclearBuffer(dValue0dParam[i]); string name = force.getEnergyParameterDerivativeName(i); cc.addEnergyParameterDerivative(name); } // Create the kernels. bool useCutoff = (force.getNonbondedMethod() != CustomGBForce::NoCutoff); bool usePeriodic = (force.getNonbondedMethod() != CustomGBForce::NoCutoff && force.getNonbondedMethod() != CustomGBForce::CutoffNonPeriodic); int numAtomBlocks = cc.getPaddedNumAtoms()/32; { // Create the N2 value kernel. 
vector > variables; map rename; ExpressionTreeNode rnode(new Operation::Variable("r")); variables.push_back(make_pair(rnode, "r")); variables.push_back(make_pair(ExpressionTreeNode(new Operation::Square(), rnode), "r2")); variables.push_back(make_pair(ExpressionTreeNode(new Operation::Reciprocal(), rnode), "invR")); for (int i = 0; i < force.getNumPerParticleParameters(); i++) { const string& name = force.getPerParticleParameterName(i); variables.push_back(makeVariable(name+"1", "((real) params"+params->getParameterSuffix(i, "1)"))); variables.push_back(makeVariable(name+"2", "((real) params"+params->getParameterSuffix(i, "2)"))); rename[name+"1"] = name+"2"; rename[name+"2"] = name+"1"; } for (int i = 0; i < force.getNumGlobalParameters(); i++) { const string& name = force.getGlobalParameterName(i); string value = "globals["+cc.intToString(i)+"]"; variables.push_back(makeVariable(name, value)); } map n2ValueExpressions; stringstream n2ValueSource; Lepton::ParsedExpression ex = Lepton::Parser::parse(computedValueExpressions[0], functions).optimize(); n2ValueExpressions["tempValue1 = "] = ex; n2ValueExpressions["tempValue2 = "] = ex.renameVariables(rename); for (int i = 0; i < valueParamDerivExpressions[0].size(); i++) { string variableBase = "temp_dValue0dParam"+cc.intToString(i+1); if (!isZeroExpression(valueParamDerivExpressions[0][i])) { n2ValueExpressions[variableBase+"_1 = "] = valueParamDerivExpressions[0][i]; n2ValueExpressions[variableBase+"_2 = "] = valueParamDerivExpressions[0][i].renameVariables(rename); } } n2ValueSource << cc.getExpressionUtilities().createExpressions(n2ValueExpressions, variables, functionList, functionDefinitions, "temp"); map replacements; string n2ValueStr = n2ValueSource.str(); replacements["COMPUTE_VALUE"] = n2ValueStr; stringstream extraArgs, atomParams, loadLocal1, loadLocal2, load1, load2, tempDerivs1, tempDerivs2, storeDeriv1, storeDeriv2; if (force.getNumGlobalParameters() > 0) extraArgs << ", GLOBAL const float* globals"; 
pairValueUsesParam.resize(params->getParameterInfos().size(), false); for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; string paramName = "params"+cc.intToString(i+1); if (n2ValueStr.find(paramName+"1") != n2ValueStr.npos || n2ValueStr.find(paramName+"2") != n2ValueStr.npos) { extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT global_" << paramName; atomParams << "LOCAL " << buffer.getType() << " local_" << paramName << "[LOCAL_BUFFER_SIZE];\n"; loadLocal1 << "local_" << paramName << "[localAtomIndex] = " << paramName << "1;\n"; loadLocal2 << "local_" << paramName << "[localAtomIndex] = global_" << paramName << "[j];\n"; load1 << buffer.getType() << " " << paramName << "1 = global_" << paramName << "[atom1];\n"; load2 << buffer.getType() << " " << paramName << "2 = local_" << paramName << "[atom2];\n"; pairValueUsesParam[i] = true; } } for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { string derivName = "dValue0dParam"+cc.intToString(i+1); extraArgs << ", GLOBAL mm_ulong* RESTRICT global_" << derivName; atomParams << "LOCAL real local_" << derivName << "[LOCAL_BUFFER_SIZE];\n"; loadLocal2 << "local_" << derivName << "[localAtomIndex] = 0;\n"; load1 << "real " << derivName << " = 0;\n"; if (!isZeroExpression(valueParamDerivExpressions[0][i])) { load2 << "real temp_" << derivName << "_1 = 0;\n"; load2 << "real temp_" << derivName << "_2 = 0;\n"; tempDerivs1 << derivName << " += temp_" << derivName << "_1;\n"; if (deviceIsCpu) tempDerivs2 << "local_" << derivName << "[j] += temp_" << derivName << "_2;\n"; else tempDerivs2 << "local_" << derivName << "[tbx+tj] += temp_" << derivName << "_2;\n"; storeDeriv1 << "ATOMIC_ADD(&global_" << derivName << "[offset1], (mm_ulong) realToFixedPoint(" << derivName << "));\n"; if (deviceIsCpu) storeDeriv2 << "ATOMIC_ADD(&global_" << derivName << "[offset2], (mm_ulong) realToFixedPoint(local_" << derivName << 
"[tgx]));\n"; else storeDeriv2 << "ATOMIC_ADD(&global_" << derivName << "[offset2], (mm_ulong) realToFixedPoint(local_" << derivName << "[LOCAL_ID]));\n"; } } replacements["PARAMETER_ARGUMENTS"] = extraArgs.str()+tableArgs.str(); replacements["ATOM_PARAMETER_DATA"] = atomParams.str(); replacements["LOAD_LOCAL_PARAMETERS_FROM_1"] = loadLocal1.str(); replacements["LOAD_LOCAL_PARAMETERS_FROM_GLOBAL"] = loadLocal2.str(); replacements["LOAD_ATOM1_PARAMETERS"] = load1.str(); replacements["LOAD_ATOM2_PARAMETERS"] = load2.str(); replacements["ADD_TEMP_DERIVS1"] = tempDerivs1.str(); replacements["ADD_TEMP_DERIVS2"] = tempDerivs2.str(); replacements["STORE_PARAM_DERIVS1"] = storeDeriv1.str(); replacements["STORE_PARAM_DERIVS2"] = storeDeriv2.str(); if (useCutoff) pairValueDefines["USE_CUTOFF"] = "1"; if (usePeriodic) pairValueDefines["USE_PERIODIC"] = "1"; if (useExclusionsForValue) pairValueDefines["USE_EXCLUSIONS"] = "1"; pairValueDefines["LOCAL_BUFFER_SIZE"] = cc.intToString(deviceIsCpu ? 32 : nb.getForceThreadBlockSize()); pairValueDefines["CUTOFF_SQUARED"] = cc.doubleToString(cutoff*cutoff); pairValueDefines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms()); pairValueDefines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms()); pairValueDefines["NUM_BLOCKS"] = cc.intToString(numAtomBlocks); pairValueDefines["TILE_SIZE"] = "32"; string file; if (deviceIsCpu) file = CommonKernelSources::customGBValueN2_cpu; else file = CommonKernelSources::customGBValueN2; pairValueSrc = cc.replaceStrings(file, replacements); } { // Create the kernel to reduce the N2 value and calculate other values. 
stringstream reductionSource, extraArgs, deriv0; if (force.getNumGlobalParameters() > 0) extraArgs << ", GLOBAL const float* globals"; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; string paramName = "params"+cc.intToString(i+1); extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT " << paramName; } for (int i = 0; i < (int) computedValues->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = computedValues->getParameterInfos()[i]; string valueName = "values"+cc.intToString(i+1); extraArgs << ", GLOBAL " << buffer.getType() << "* RESTRICT global_" << valueName; reductionSource << buffer.getType() << " local_" << valueName << ";\n"; } for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { string variableName = "dValuedParam_0_"+cc.intToString(i); extraArgs << ", GLOBAL const mm_long* RESTRICT dValue0dParam" << i; deriv0 << "real " << variableName << " = RECIP((real) 0x100000000)*dValue0dParam" << i << "[index];\n"; for (int j = 0; j < dValuedParam[i]->getParameterInfos().size(); j++) extraArgs << ", GLOBAL real* RESTRICT global_dValuedParam_" << j << "_" << i; deriv0 << "global_dValuedParam_0_" << i << "[index] = dValuedParam_0_" << i << ";\n"; } reductionSource << "local_values" << computedValues->getParameterSuffix(0) << " = sum;\n"; map variables; variables["x"] = "pos.x"; variables["y"] = "pos.y"; variables["z"] = "pos.z"; for (int i = 0; i < force.getNumPerParticleParameters(); i++) variables[force.getPerParticleParameterName(i)] = "params"+params->getParameterSuffix(i, "[index]"); for (int i = 0; i < force.getNumGlobalParameters(); i++) variables[force.getGlobalParameterName(i)] = "globals["+cc.intToString(i)+"]"; for (int i = 1; i < numComputedValues; i++) { variables[computedValueNames[i-1]] = "local_values"+computedValues->getParameterSuffix(i-1); map valueExpressions; 
valueExpressions["local_values"+computedValues->getParameterSuffix(i)+" = "] = Lepton::Parser::parse(computedValueExpressions[i], functions).optimize(); reductionSource << cc.getExpressionUtilities().createExpressions(valueExpressions, variables, functionList, functionDefinitions, "value"+cc.intToString(i)+"_temp"); } for (int i = 0; i < (int) computedValues->getParameterInfos().size(); i++) { string valueName = "values"+cc.intToString(i+1); reductionSource << "global_" << valueName << "[index] = local_" << valueName << ";\n"; } if (needEnergyParamDerivs) { map derivExpressions; for (int i = 1; i < numComputedValues; i++) { for (int j = 0; j < valueParamDerivExpressions[i].size(); j++) derivExpressions["real dValuedParam_"+cc.intToString(i)+"_"+cc.intToString(j)+" = "] = valueParamDerivExpressions[i][j]; for (int j = 0; j < i; j++) derivExpressions["real dVdV_"+cc.intToString(i)+"_"+cc.intToString(j)+" = "] = valueDerivExpressions[i][j]; } reductionSource << cc.getExpressionUtilities().createExpressions(derivExpressions, variables, functionList, functionDefinitions, "derivChain_temp"); for (int i = 1; i < numComputedValues; i++) { for (int j = 0; j < i; j++) for (int k = 0; k < valueParamDerivExpressions[i].size(); k++) reductionSource << "dValuedParam_" << i << "_" << k << " += dVdV_" << i << "_" << j << "*dValuedParam_" << j <<"_" << k << ";\n"; for (int j = 0; j < valueParamDerivExpressions[i].size(); j++) reductionSource << "global_dValuedParam_" << i << "_" << j << "[index] = dValuedParam_" << i << "_" << j << ";\n"; } } map replacements; replacements["PARAMETER_ARGUMENTS"] = extraArgs.str()+tableArgs.str(); replacements["REDUCE_PARAM0_DERIV"] = deriv0.str(); replacements["COMPUTE_VALUES"] = reductionSource.str(); map defines; defines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms()); ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::customGBValuePerParticle, replacements), defines); perParticleValueKernel = 
program->createKernel("computePerParticleValues"); } { // Create the N2 energy kernel. vector > variables; ExpressionTreeNode rnode(new Operation::Variable("r")); variables.push_back(make_pair(rnode, "r")); variables.push_back(make_pair(ExpressionTreeNode(new Operation::Square(), rnode), "r2")); variables.push_back(make_pair(ExpressionTreeNode(new Operation::Reciprocal(), rnode), "invR")); for (int i = 0; i < force.getNumPerParticleParameters(); i++) { const string& name = force.getPerParticleParameterName(i); variables.push_back(makeVariable(name+"1", "((real) params"+params->getParameterSuffix(i, "1)"))); variables.push_back(makeVariable(name+"2", "((real) params"+params->getParameterSuffix(i, "2)"))); } for (int i = 0; i < numComputedValues; i++) { variables.push_back(makeVariable(computedValueNames[i]+"1", "values"+computedValues->getParameterSuffix(i, "1"))); variables.push_back(makeVariable(computedValueNames[i]+"2", "values"+computedValues->getParameterSuffix(i, "2"))); } for (int i = 0; i < force.getNumGlobalParameters(); i++) variables.push_back(makeVariable(force.getGlobalParameterName(i), "globals["+cc.intToString(i)+"]")); stringstream n2EnergySource; bool anyExclusions = (force.getNumExclusions() > 0); for (int i = 0; i < force.getNumEnergyTerms(); i++) { string expression; CustomGBForce::ComputationType type; force.getEnergyTermParameters(i, expression, type); if (type == CustomGBForce::SingleParticle) continue; bool exclude = (anyExclusions && type == CustomGBForce::ParticlePair); map n2EnergyExpressions; n2EnergyExpressions["tempEnergy += "] = Lepton::Parser::parse(expression, functions).optimize(); n2EnergyExpressions["dEdR += "] = Lepton::Parser::parse(expression, functions).differentiate("r").optimize(); for (int j = 0; j < numComputedValues; j++) { if (needChainForValue[j]) { string index = cc.intToString(j+1); n2EnergyExpressions["/*"+cc.intToString(i+1)+"*/ deriv"+index+"_1 += "] = energyDerivExpressions[i][2*j]; 
n2EnergyExpressions["/*"+cc.intToString(i+1)+"*/ deriv"+index+"_2 += "] = energyDerivExpressions[i][2*j+1]; } } for (int j = 0; j < force.getNumEnergyParameterDerivatives(); j++) n2EnergyExpressions["energyParamDeriv"+cc.intToString(j)+" += interactionScale*"] = energyParamDerivExpressions[i][j]; if (exclude) n2EnergySource << "if (!isExcluded) {\n"; n2EnergySource << cc.getExpressionUtilities().createExpressions(n2EnergyExpressions, variables, functionList, functionDefinitions, "temp"); if (exclude) n2EnergySource << "}\n"; } map replacements; string n2EnergyStr = n2EnergySource.str(); replacements["COMPUTE_INTERACTION"] = n2EnergyStr; stringstream extraArgs, atomParams, loadLocal1, loadLocal2, clearLocal, load1, load2, declare1, recordDeriv, storeDerivs1, storeDerivs2, initParamDerivs, saveParamDerivs; if (force.getNumGlobalParameters() > 0) extraArgs << ", GLOBAL const float* globals"; pairEnergyUsesParam.resize(params->getParameterInfos().size(), false); for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; string paramName = "params"+cc.intToString(i+1); if (n2EnergyStr.find(paramName+"1") != n2EnergyStr.npos || n2EnergyStr.find(paramName+"2") != n2EnergyStr.npos) { extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT global_" << paramName; atomParams << "LOCAL " << buffer.getType() << " local_" << paramName << "[LOCAL_BUFFER_SIZE];\n"; loadLocal1 << "local_" << paramName << "[localAtomIndex] = " << paramName << "1;\n"; loadLocal2 << "local_" << paramName << "[localAtomIndex] = global_" << paramName << "[j];\n"; load1 << buffer.getType() << " " << paramName << "1 = global_" << paramName << "[atom1];\n"; load2 << buffer.getType() << " " << paramName << "2 = local_" << paramName << "[atom2];\n"; pairEnergyUsesParam[i] = true; } } pairEnergyUsesValue.resize(computedValues->getParameterInfos().size(), false); for (int i = 0; i < (int) 
computedValues->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = computedValues->getParameterInfos()[i]; string valueName = "values"+cc.intToString(i+1); if (n2EnergyStr.find(valueName+"1") != n2EnergyStr.npos || n2EnergyStr.find(valueName+"2") != n2EnergyStr.npos) { extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT global_" << valueName; atomParams << "LOCAL " << buffer.getType() << " local_" << valueName << "[LOCAL_BUFFER_SIZE];\n"; loadLocal1 << "local_" << valueName << "[localAtomIndex] = " << valueName << "1;\n"; loadLocal2 << "local_" << valueName << "[localAtomIndex] = global_" << valueName << "[j];\n"; load1 << buffer.getType() << " " << valueName << "1 = global_" << valueName << "[atom1];\n"; load2 << buffer.getType() << " " << valueName << "2 = local_" << valueName << "[atom2];\n"; pairEnergyUsesValue[i] = true; } } extraArgs << ", GLOBAL mm_ulong* RESTRICT derivBuffers"; for (int i = 0; i < numComputedValues; i++) { string index = cc.intToString(i+1); atomParams << "LOCAL real local_deriv" << index << "[LOCAL_BUFFER_SIZE];\n"; clearLocal << "local_deriv" << index << "[localAtomIndex] = 0.0f;\n"; declare1 << "real deriv" << index << "_1 = 0;\n"; load2 << "real deriv" << index << "_2 = 0;\n"; recordDeriv << "local_deriv" << index << "[atom2] += deriv" << index << "_2;\n"; storeDerivs1 << "STORE_DERIVATIVE_1(" << index << ")\n"; storeDerivs2 << "STORE_DERIVATIVE_2(" << index << ")\n"; } if (needEnergyParamDerivs) { extraArgs << ", GLOBAL mixed* RESTRICT energyParamDerivs"; const vector& allParamDerivNames = cc.getEnergyParamDerivNames(); int numDerivs = allParamDerivNames.size(); for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { initParamDerivs << "mixed energyParamDeriv" << i << " = 0;\n"; for (int index = 0; index < numDerivs; index++) if (allParamDerivNames[index] == force.getEnergyParameterDerivativeName(i)) saveParamDerivs << "energyParamDerivs[GLOBAL_ID*" << numDerivs << "+" << index << "] += 
energyParamDeriv" << i << ";\n"; } } replacements["PARAMETER_ARGUMENTS"] = extraArgs.str()+tableArgs.str(); replacements["ATOM_PARAMETER_DATA"] = atomParams.str(); replacements["LOAD_LOCAL_PARAMETERS_FROM_1"] = loadLocal1.str(); replacements["LOAD_LOCAL_PARAMETERS_FROM_GLOBAL"] = loadLocal2.str(); replacements["CLEAR_LOCAL_DERIVATIVES"] = clearLocal.str(); replacements["LOAD_ATOM1_PARAMETERS"] = load1.str(); replacements["LOAD_ATOM2_PARAMETERS"] = load2.str(); replacements["DECLARE_ATOM1_DERIVATIVES"] = declare1.str(); replacements["RECORD_DERIVATIVE_2"] = recordDeriv.str(); replacements["STORE_DERIVATIVES_1"] = storeDerivs1.str(); replacements["STORE_DERIVATIVES_2"] = storeDerivs2.str(); replacements["INIT_PARAM_DERIVS"] = initParamDerivs.str(); replacements["SAVE_PARAM_DERIVS"] = saveParamDerivs.str(); if (useCutoff) pairEnergyDefines["USE_CUTOFF"] = "1"; if (usePeriodic) pairEnergyDefines["USE_PERIODIC"] = "1"; if (anyExclusions) pairEnergyDefines["USE_EXCLUSIONS"] = "1"; pairEnergyDefines["LOCAL_BUFFER_SIZE"] = cc.intToString(deviceIsCpu ? 32 : nb.getForceThreadBlockSize()); pairEnergyDefines["CUTOFF_SQUARED"] = cc.doubleToString(cutoff*cutoff); pairEnergyDefines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms()); pairEnergyDefines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms()); pairEnergyDefines["NUM_BLOCKS"] = cc.intToString(numAtomBlocks); pairEnergyDefines["TILE_SIZE"] = "32"; string file; if (deviceIsCpu) file = CommonKernelSources::customGBEnergyN2_cpu; else file = CommonKernelSources::customGBEnergyN2; pairEnergySrc = cc.replaceStrings(file, replacements); } { // Create the kernel to reduce the derivatives and calculate per-particle energy terms. 
stringstream compute, extraArgs, reduce, initParamDerivs, saveParamDerivs; if (force.getNumGlobalParameters() > 0) extraArgs << ", GLOBAL const float* globals"; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; string paramName = "params"+cc.intToString(i+1); extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT " << paramName; } for (int i = 0; i < (int) computedValues->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = computedValues->getParameterInfos()[i]; string valueName = "values"+cc.intToString(i+1); extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT " << valueName; } for (int i = 0; i < (int) energyDerivs->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = energyDerivs->getParameterInfos()[i]; string index = cc.intToString(i+1); extraArgs << ", GLOBAL " << buffer.getType() << "* RESTRICT derivBuffers" << index; compute << buffer.getType() << " deriv" << index << " = derivBuffers" << index << "[index];\n"; } for (int i = 0; i < (int) energyDerivChain->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = energyDerivChain->getParameterInfos()[i]; string index = cc.intToString(i+1); extraArgs << ", GLOBAL " << buffer.getType() << "* RESTRICT derivChain" << index; } extraArgs << ", GLOBAL const mm_long* RESTRICT derivBuffersIn"; for (int i = 0; i < energyDerivs->getNumParameters(); ++i) reduce << "derivBuffers" << energyDerivs->getParameterSuffix(i, "[index]") << " = RECIP((real) 0x100000000)*derivBuffersIn[index+PADDED_NUM_ATOMS*" << cc.intToString(i) << "];\n"; if (needEnergyParamDerivs) { extraArgs << ", GLOBAL mixed* RESTRICT energyParamDerivs"; const vector& allParamDerivNames = cc.getEnergyParamDerivNames(); int numDerivs = allParamDerivNames.size(); for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { initParamDerivs << "mixed energyParamDeriv" << i << " = 0;\n"; for (int index = 0; index 
< numDerivs; index++) if (allParamDerivNames[index] == force.getEnergyParameterDerivativeName(i)) saveParamDerivs << "energyParamDerivs[GLOBAL_ID*" << numDerivs << "+" << index << "] += energyParamDeriv" << i << ";\n"; } } // Compute the various expressions. map variables; variables["x"] = "pos.x"; variables["y"] = "pos.y"; variables["z"] = "pos.z"; for (int i = 0; i < force.getNumPerParticleParameters(); i++) variables[force.getPerParticleParameterName(i)] = "params"+params->getParameterSuffix(i, "[index]"); for (int i = 0; i < force.getNumGlobalParameters(); i++) variables[force.getGlobalParameterName(i)] = "globals["+cc.intToString(i)+"]"; for (int i = 0; i < numComputedValues; i++) variables[computedValueNames[i]] = "values"+computedValues->getParameterSuffix(i, "[index]"); map expressions; for (int i = 0; i < force.getNumEnergyTerms(); i++) { string expression; CustomGBForce::ComputationType type; force.getEnergyTermParameters(i, expression, type); if (type != CustomGBForce::SingleParticle) continue; Lepton::ParsedExpression parsed = Lepton::Parser::parse(expression, functions).optimize(); expressions["/*"+cc.intToString(i+1)+"*/ energy += "] = parsed; for (int j = 0; j < numComputedValues; j++) expressions["/*"+cc.intToString(i+1)+"*/ deriv"+energyDerivs->getParameterSuffix(j)+" += "] = energyDerivExpressions[i][j]; Lepton::ParsedExpression gradx = parsed.differentiate("x").optimize(); Lepton::ParsedExpression grady = parsed.differentiate("y").optimize(); Lepton::ParsedExpression gradz = parsed.differentiate("z").optimize(); if (!isZeroExpression(gradx)) expressions["/*"+cc.intToString(i+1)+"*/ force.x -= "] = gradx; if (!isZeroExpression(grady)) expressions["/*"+cc.intToString(i+1)+"*/ force.y -= "] = grady; if (!isZeroExpression(gradz)) expressions["/*"+cc.intToString(i+1)+"*/ force.z -= "] = gradz; for (int j = 0; j < force.getNumEnergyParameterDerivatives(); j++) expressions["/*"+cc.intToString(i+1)+"*/ energyParamDeriv"+cc.intToString(j)+" += "] = 
energyParamDerivExpressions[i][j]; } for (int i = 1; i < numComputedValues; i++) for (int j = 0; j < i; j++) expressions["real dV"+cc.intToString(i)+"dV"+cc.intToString(j)+" = "] = valueDerivExpressions[i][j]; compute << cc.getExpressionUtilities().createExpressions(expressions, variables, functionList, functionDefinitions, "temp"); // Record values. for (int i = 0; i < (int) energyDerivs->getParameterInfos().size(); i++) { string index = cc.intToString(i+1); compute << "derivBuffers" << index << "[index] = deriv" << index << ";\n"; } compute << "forceBuffers[index] += realToFixedPoint(force.x);\n"; compute << "forceBuffers[index+PADDED_NUM_ATOMS] += realToFixedPoint(force.y);\n"; compute << "forceBuffers[index+PADDED_NUM_ATOMS*2] += realToFixedPoint(force.z);\n"; for (int i = 1; i < numComputedValues; i++) { compute << "real totalDeriv"<getParameterInfos().size(); i++) { string index = cc.intToString(i+1); compute << "derivChain" << index << "[index] = deriv" << index << ";\n"; } map replacements; replacements["PARAMETER_ARGUMENTS"] = extraArgs.str()+tableArgs.str(); replacements["REDUCE_DERIVATIVES"] = reduce.str(); replacements["COMPUTE_ENERGY"] = compute.str(); replacements["INIT_PARAM_DERIVS"] = initParamDerivs.str(); replacements["SAVE_PARAM_DERIVS"] = saveParamDerivs.str(); map defines; defines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms()); defines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms()); ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::customGBEnergyPerParticle, replacements), defines); perParticleEnergyKernel = program->createKernel("computePerParticleEnergy"); } if (needParameterGradient || needEnergyParamDerivs) { // Create the kernel to compute chain rule terms for computed values that depend explicitly on particle coordinates, and for // derivatives with respect to global parameters. 
stringstream compute, extraArgs, initParamDerivs, saveParamDerivs; if (force.getNumGlobalParameters() > 0) extraArgs << ", GLOBAL const float* globals"; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; string paramName = "params"+cc.intToString(i+1); extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT " << paramName; } for (int i = 0; i < (int) computedValues->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = computedValues->getParameterInfos()[i]; string valueName = "values"+cc.intToString(i+1); extraArgs << ", GLOBAL const " << buffer.getType() << "* RESTRICT " << valueName; } for (int i = 0; i < (int) energyDerivs->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = energyDerivs->getParameterInfos()[i]; string index = cc.intToString(i+1); extraArgs << ", GLOBAL " << buffer.getType() << "* RESTRICT derivBuffers" << index; compute << buffer.getType() << " deriv" << index << " = derivBuffers" << index << "[index];\n"; } if (needEnergyParamDerivs) { extraArgs << ", GLOBAL mixed* RESTRICT energyParamDerivs"; const vector& allParamDerivNames = cc.getEnergyParamDerivNames(); int numDerivs = allParamDerivNames.size(); for (int i = 0; i < force.getNumEnergyParameterDerivatives(); i++) { for (int j = 0; j < dValuedParam[i]->getParameterInfos().size(); j++) extraArgs << ", GLOBAL real* RESTRICT dValuedParam_" << j << "_" << i; initParamDerivs << "mixed energyParamDeriv" << i << " = 0;\n"; for (int index = 0; index < numDerivs; index++) if (allParamDerivNames[index] == force.getEnergyParameterDerivativeName(i)) saveParamDerivs << "energyParamDerivs[GLOBAL_ID*" << numDerivs << "+" << index << "] += energyParamDeriv" << i << ";\n"; } } map variables; variables["x"] = "pos.x"; variables["y"] = "pos.y"; variables["z"] = "pos.z"; for (int i = 0; i < force.getNumPerParticleParameters(); i++) variables[force.getPerParticleParameterName(i)] = 
"params"+params->getParameterSuffix(i, "[index]"); for (int i = 0; i < force.getNumGlobalParameters(); i++) variables[force.getGlobalParameterName(i)] = "globals["+cc.intToString(i)+"]"; for (int i = 0; i < numComputedValues; i++) variables[computedValueNames[i]] = "values"+computedValues->getParameterSuffix(i, "[index]"); if (needParameterGradient) { for (int i = 1; i < numComputedValues; i++) { string is = cc.intToString(i); compute << "real3 dV"< derivExpressions; string js = cc.intToString(j); derivExpressions["real dV"+is+"dV"+js+" = "] = valueDerivExpressions[i][j]; compute << cc.getExpressionUtilities().createExpressions(derivExpressions, variables, functionList, functionDefinitions, "temp_"+is+"_"+js); compute << "dV"< gradientExpressions; if (!isZeroExpression(valueGradientExpressions[i][0])) gradientExpressions["dV"+is+"dR.x += "] = valueGradientExpressions[i][0]; if (!isZeroExpression(valueGradientExpressions[i][1])) gradientExpressions["dV"+is+"dR.y += "] = valueGradientExpressions[i][1]; if (!isZeroExpression(valueGradientExpressions[i][2])) gradientExpressions["dV"+is+"dR.z += "] = valueGradientExpressions[i][2]; compute << cc.getExpressionUtilities().createExpressions(gradientExpressions, variables, functionList, functionDefinitions, "gradtemp_"+is); } for (int i = 1; i < numComputedValues; i++) compute << "force -= deriv"<getParameterSuffix(i)<<"*dV"<getParameterSuffix(i)<<"*dValuedParam_"< replacements; replacements["PARAMETER_ARGUMENTS"] = extraArgs.str()+tableArgs.str(); replacements["COMPUTE_FORCES"] = compute.str(); replacements["INIT_PARAM_DERIVS"] = initParamDerivs.str(); replacements["SAVE_PARAM_DERIVS"] = saveParamDerivs.str(); map defines; defines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms()); defines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms()); ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::customGBGradientChainRule, replacements), defines); gradientChainRuleKernel = 
program->createKernel("computeGradientChainRuleTerms"); } { // Create the code to calculate chain rule terms as part of the default nonbonded kernel. vector > globalVariables; for (int i = 0; i < force.getNumGlobalParameters(); i++) { const string& name = force.getGlobalParameterName(i); string value = "globals["+cc.intToString(i)+"]"; globalVariables.push_back(makeVariable(name, prefix+value)); } vector > variables = globalVariables; map rename; ExpressionTreeNode rnode(new Operation::Variable("r")); variables.push_back(make_pair(rnode, "r")); variables.push_back(make_pair(ExpressionTreeNode(new Operation::Square(), rnode), "r2")); variables.push_back(make_pair(ExpressionTreeNode(new Operation::Reciprocal(), rnode), "invR")); for (int i = 0; i < force.getNumPerParticleParameters(); i++) { const string& name = force.getPerParticleParameterName(i); variables.push_back(makeVariable(name+"1", "((real) "+prefix+"params"+params->getParameterSuffix(i, "1)"))); variables.push_back(makeVariable(name+"2", "((real) "+prefix+"params"+params->getParameterSuffix(i, "2)"))); rename[name+"1"] = name+"2"; rename[name+"2"] = name+"1"; } map derivExpressions; stringstream chainSource; Lepton::ParsedExpression dVdR = Lepton::Parser::parse(computedValueExpressions[0], functions).differentiate("r").optimize(); derivExpressions["real dV0dR1 = "] = dVdR; derivExpressions["real dV0dR2 = "] = dVdR.renameVariables(rename); chainSource << cc.getExpressionUtilities().createExpressions(derivExpressions, variables, functionList, functionDefinitions, prefix+"temp0_"); if (needChainForValue[0]) { if (useExclusionsForValue) chainSource << "if (!isExcluded) {\n"; chainSource << "tempForce -= dV0dR1*" << prefix << "dEdV" << energyDerivs->getParameterSuffix(0, "1") << ";\n"; chainSource << "tempForce -= dV0dR2*" << prefix << "dEdV" << energyDerivs->getParameterSuffix(0, "2") << ";\n"; if (useExclusionsForValue) chainSource << "}\n"; } for (int i = 1; i < numComputedValues; i++) { if 
(needChainForValue[i]) { chainSource << "tempForce -= dV0dR1*" << prefix << "dEdV" << energyDerivs->getParameterSuffix(i, "1") << ";\n"; chainSource << "tempForce -= dV0dR2*" << prefix << "dEdV" << energyDerivs->getParameterSuffix(i, "2") << ";\n"; } } map replacements; string chainStr = chainSource.str(); replacements["COMPUTE_FORCE"] = chainStr; string source = cc.replaceStrings(CommonKernelSources::customGBChainRule, replacements); vector parameters; vector arguments; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; string paramName = prefix+"params"+cc.intToString(i+1); if (chainStr.find(paramName+"1") != chainStr.npos || chainStr.find(paramName+"2") != chainStr.npos) parameters.push_back(ComputeParameterInfo(buffer.getArray(), paramName, buffer.getComponentType(), buffer.getNumComponents())); } for (int i = 0; i < (int) computedValues->getParameterInfos().size(); i++) { ComputeParameterInfo& buffer = computedValues->getParameterInfos()[i]; string paramName = prefix+"values"+cc.intToString(i+1); if (chainStr.find(paramName+"1") != chainStr.npos || chainStr.find(paramName+"2") != chainStr.npos) parameters.push_back(ComputeParameterInfo(buffer.getArray(), paramName, buffer.getComponentType(), buffer.getNumComponents())); } for (int i = 0; i < (int) energyDerivChain->getParameterInfos().size(); i++) { if (needChainForValue[i]) { ComputeParameterInfo& buffer = energyDerivChain->getParameterInfos()[i]; string paramName = prefix+"dEdV"+cc.intToString(i+1); parameters.push_back(ComputeParameterInfo(buffer.getArray(), paramName, buffer.getComponentType(), buffer.getNumComponents())); } } if (globals.isInitialized()) { globals.upload(globalParamValues); arguments.push_back(ComputeParameterInfo(globals, prefix+"globals", "float", 1)); } nb.addInteraction(useCutoff, usePeriodic, force.getNumExclusions() > 0, cutoff, exclusionList, source, force.getForceGroup()); for (auto param : 
parameters) nb.addParameter(param); for (auto arg : arguments) nb.addArgument(arg); } info = new ForceInfo(force); cc.addForce(info); cc.addAutoclearBuffer(longEnergyDerivs); } double CommonCalcCustomGBForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { ContextSelector selector(cc); bool deviceIsCpu = cc.getIsCPU(); NonbondedUtilities& nb = cc.getNonbondedUtilities(); int elementSize = (cc.getUseDoublePrecision() ? sizeof(double) : sizeof(float)); if (!hasInitializedKernels) { hasInitializedKernels = true; // These two kernels can't be compiled in initialize(), because the nonbonded utilities object // has not yet been initialized then. { int numExclusionTiles = nb.getExclusionTiles().getSize(); pairValueDefines["NUM_TILES_WITH_EXCLUSIONS"] = cc.intToString(numExclusionTiles); int numContexts = cc.getNumContexts(); int startExclusionIndex = cc.getContextIndex()*numExclusionTiles/numContexts; int endExclusionIndex = (cc.getContextIndex()+1)*numExclusionTiles/numContexts; pairValueDefines["FIRST_EXCLUSION_TILE"] = cc.intToString(startExclusionIndex); pairValueDefines["LAST_EXCLUSION_TILE"] = cc.intToString(endExclusionIndex); pairValueDefines["CUTOFF"] = cc.doubleToString(cutoff); ComputeProgram program = cc.compileProgram(pairValueSrc, pairValueDefines); pairValueKernel = program->createKernel("computeN2Value"); pairValueSrc = ""; pairValueDefines.clear(); } { int numExclusionTiles = nb.getExclusionTiles().getSize(); pairEnergyDefines["NUM_TILES_WITH_EXCLUSIONS"] = cc.intToString(numExclusionTiles); int numContexts = cc.getNumContexts(); int startExclusionIndex = cc.getContextIndex()*numExclusionTiles/numContexts; int endExclusionIndex = (cc.getContextIndex()+1)*numExclusionTiles/numContexts; pairEnergyDefines["FIRST_EXCLUSION_TILE"] = cc.intToString(startExclusionIndex); pairEnergyDefines["LAST_EXCLUSION_TILE"] = cc.intToString(endExclusionIndex); pairEnergyDefines["CUTOFF"] = cc.doubleToString(cutoff); ComputeProgram program = 
cc.compileProgram(pairEnergySrc, pairEnergyDefines); pairEnergyKernel = program->createKernel("computeN2Energy"); pairEnergySrc = ""; pairEnergyDefines.clear(); } // Set arguments for kernels. maxTiles = (nb.getUseCutoff() ? nb.getInteractingTiles().getSize() : 0); int numAtomBlocks = cc.getPaddedNumAtoms()/32; pairValueKernel->addArg(cc.getPosq()); pairValueKernel->addArg(cc.getNonbondedUtilities().getExclusions()); pairValueKernel->addArg(cc.getNonbondedUtilities().getExclusionTiles()); pairValueKernel->addArg(valueBuffers); if (nb.getUseCutoff()) { pairValueKernel->addArg(nb.getInteractingTiles()); pairValueKernel->addArg(nb.getInteractionCount()); for (int i = 0; i < 5; i++) pairValueKernel->addArg(); // Periodic box size arguments are set when the kernel is executed. pairValueKernel->addArg(maxTiles); pairValueKernel->addArg(nb.getBlockCenters()); pairValueKernel->addArg(nb.getBlockBoundingBoxes()); pairValueKernel->addArg(nb.getInteractingAtoms()); } else pairValueKernel->addArg(numAtomBlocks*(numAtomBlocks+1)/2); if (globals.isInitialized()) pairValueKernel->addArg(globals); for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { if (pairValueUsesParam[i]) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; pairValueKernel->addArg(buffer.getArray()); } } for (auto& d : dValue0dParam) pairValueKernel->addArg(d); for (auto& function : tabulatedFunctionArrays) pairValueKernel->addArg(function); perParticleValueKernel->addArg(cc.getPosq()); perParticleValueKernel->addArg(valueBuffers); if (globals.isInitialized()) perParticleValueKernel->addArg(globals); for (auto& buffer : params->getParameterInfos()) perParticleValueKernel->addArg(buffer.getArray()); for (auto& buffer : computedValues->getParameterInfos()) perParticleValueKernel->addArg(buffer.getArray()); for (int i = 0; i < dValuedParam.size(); i++) { perParticleValueKernel->addArg(dValue0dParam[i]); for (int j = 0; j < dValuedParam[i]->getParameterInfos().size(); j++) 
perParticleValueKernel->addArg(dValuedParam[i]->getParameterInfos()[j].getArray()); } for (auto& function : tabulatedFunctionArrays) perParticleValueKernel->addArg(function); pairEnergyKernel->addArg(cc.getLongForceBuffer()); pairEnergyKernel->addArg(cc.getEnergyBuffer()); pairEnergyKernel->addArg(cc.getPosq()); pairEnergyKernel->addArg(cc.getNonbondedUtilities().getExclusions()); pairEnergyKernel->addArg(cc.getNonbondedUtilities().getExclusionTiles()); pairEnergyKernel->addArg(); // Whether to include energy. if (nb.getUseCutoff()) { pairEnergyKernel->addArg(nb.getInteractingTiles()); pairEnergyKernel->addArg(nb.getInteractionCount()); for (int i = 0; i < 5; i++) pairEnergyKernel->addArg(); // Periodic box size arguments are set when the kernel is executed. pairEnergyKernel->addArg(maxTiles); pairEnergyKernel->addArg(nb.getBlockCenters()); pairEnergyKernel->addArg(nb.getBlockBoundingBoxes()); pairEnergyKernel->addArg(nb.getInteractingAtoms()); } else pairEnergyKernel->addArg(numAtomBlocks*(numAtomBlocks+1)/2); if (globals.isInitialized()) pairEnergyKernel->addArg(globals); for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { if (pairEnergyUsesParam[i]) { ComputeParameterInfo& buffer = params->getParameterInfos()[i]; pairEnergyKernel->addArg(buffer.getArray()); } } for (int i = 0; i < (int) computedValues->getParameterInfos().size(); i++) { if (pairEnergyUsesValue[i]) { ComputeParameterInfo& buffer = computedValues->getParameterInfos()[i]; pairEnergyKernel->addArg(buffer.getArray()); } } pairEnergyKernel->addArg(longEnergyDerivs); if (needEnergyParamDerivs) pairEnergyKernel->addArg(cc.getEnergyParamDerivBuffer()); for (auto& function : tabulatedFunctionArrays) pairEnergyKernel->addArg(function); perParticleEnergyKernel->addArg(cc.getEnergyBuffer()); perParticleEnergyKernel->addArg(cc.getPosq()); perParticleEnergyKernel->addArg(cc.getLongForceBuffer()); if (globals.isInitialized()) perParticleEnergyKernel->addArg(globals); for (auto& buffer : 
params->getParameterInfos()) perParticleEnergyKernel->addArg(buffer.getArray()); for (auto& buffer : computedValues->getParameterInfos()) perParticleEnergyKernel->addArg(buffer.getArray()); for (auto& buffer : energyDerivs->getParameterInfos()) perParticleEnergyKernel->addArg(buffer.getArray()); for (auto& buffer : energyDerivChain->getParameterInfos()) perParticleEnergyKernel->addArg(buffer.getArray()); perParticleEnergyKernel->addArg(longEnergyDerivs); if (needEnergyParamDerivs) perParticleEnergyKernel->addArg(cc.getEnergyParamDerivBuffer()); for (auto& function : tabulatedFunctionArrays) perParticleEnergyKernel->addArg(function); if (needParameterGradient || needEnergyParamDerivs) { gradientChainRuleKernel->addArg(cc.getPosq()); gradientChainRuleKernel->addArg(cc.getLongForceBuffer()); if (globals.isInitialized()) gradientChainRuleKernel->addArg(globals); for (auto& buffer : params->getParameterInfos()) gradientChainRuleKernel->addArg(buffer.getArray()); for (auto& buffer : computedValues->getParameterInfos()) gradientChainRuleKernel->addArg(buffer.getArray()); for (auto& buffer : energyDerivs->getParameterInfos()) gradientChainRuleKernel->addArg(buffer.getArray()); if (needEnergyParamDerivs) { gradientChainRuleKernel->addArg(cc.getEnergyParamDerivBuffer()); for (auto d : dValuedParam) for (auto& buffer : d->getParameterInfos()) gradientChainRuleKernel->addArg(buffer.getArray()); } for (auto& function : tabulatedFunctionArrays) gradientChainRuleKernel->addArg(function); } } if (globals.isInitialized()) { bool changed = false; for (int i = 0; i < (int) globalParamNames.size(); i++) { float value = (float) context.getParameter(globalParamNames[i]); if (value != globalParamValues[i]) changed = true; globalParamValues[i] = value; } if (changed) globals.upload(globalParamValues); } pairEnergyKernel->setArg(5, (int) includeEnergy); if (nb.getUseCutoff()) { setPeriodicBoxArgs(cc, pairValueKernel, 6); setPeriodicBoxArgs(cc, pairEnergyKernel, 8); if (maxTiles < 
nb.getInteractingTiles().getSize()) { maxTiles = nb.getInteractingTiles().getSize(); pairValueKernel->setArg(11, maxTiles); pairEnergyKernel->setArg(13, maxTiles); } } pairValueKernel->execute(nb.getNumForceThreadBlocks()*nb.getForceThreadBlockSize(), nb.getForceThreadBlockSize()); perParticleValueKernel->execute(cc.getPaddedNumAtoms()); pairEnergyKernel->execute(nb.getNumForceThreadBlocks()*nb.getForceThreadBlockSize(), nb.getForceThreadBlockSize()); perParticleEnergyKernel->execute(cc.getPaddedNumAtoms()); if (needParameterGradient || needEnergyParamDerivs) gradientChainRuleKernel->execute(cc.getPaddedNumAtoms()); return 0.0; } void CommonCalcCustomGBForceKernel::copyParametersToContext(ContextImpl& context, const CustomGBForce& force) { ContextSelector selector(cc); int numParticles = force.getNumParticles(); if (numParticles != cc.getNumAtoms()) throw OpenMMException("updateParametersInContext: The number of particles has changed"); // Record the per-particle parameters. vector > paramVector(cc.getPaddedNumAtoms(), vector(force.getNumPerParticleParameters(), 0)); vector parameters; for (int i = 0; i < numParticles; i++) { force.getParticleParameters(i, parameters); for (int j = 0; j < (int) parameters.size(); j++) paramVector[i][j] = (float) parameters[j]; } params->setParameterValues(paramVector); // See if any tabulated functions have changed. for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { string name = force.getTabulatedFunctionName(i); if (force.getTabulatedFunction(i).getUpdateCount() != tabulatedFunctionUpdateCount[name]) { tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].upload(f); } } // Mark that the current reordering may be invalid. 
cc.invalidateMolecules(info);
}

/**
 * Describes the particle groups of a CustomHbondForce.
 *
 * Groups are numbered with all donors first, then all acceptors, then all exclusions,
 * as established by getNumParticleGroups() and the index arithmetic in the methods below.
 */
class CommonCalcCustomHbondForceKernel::ForceInfo : public ComputeForceInfo {
public:
    ForceInfo(const CustomHbondForce& force) : force(force) {
    }
    /**
     * Every pair of particles is reported as identical.
     */
    bool areParticlesIdentical(int particle1, int particle2) {
        return true;
    }
    /**
     * One group per donor, per acceptor and per exclusion.
     */
    int getNumParticleGroups() {
        return force.getNumDonors()+force.getNumAcceptors()+force.getNumExclusions();
    }
    /**
     * Fill `particles` with the particle indices that make up group `index`.
     *
     * A donor or acceptor group holds its first particle plus the second and third ones
     * when their index is greater than -1 (presumably -1 marks an unused slot; confirm
     * against the CustomHbondForce API).  An exclusion group holds the particles of its
     * donor followed by the particles of its acceptor.
     */
    void getParticlesInGroup(int index, vector& particles) {
        int p1, p2, p3;
        // Scratch storage for the parameter values, which are fetched but not used here.
        thread_local static vector parameters;
        if (index < force.getNumDonors()) {
            // Donor group.
            force.getDonorParameters(index, p1, p2, p3, parameters);
            particles.clear();
            particles.push_back(p1);
            if (p2 > -1)
                particles.push_back(p2);
            if (p3 > -1)
                particles.push_back(p3);
            return;
        }
        index -= force.getNumDonors();
        if (index < force.getNumAcceptors()) {
            // Acceptor group.
            force.getAcceptorParameters(index, p1, p2, p3, parameters);
            particles.clear();
            particles.push_back(p1);
            if (p2 > -1)
                particles.push_back(p2);
            if (p3 > -1)
                particles.push_back(p3);
            return;
        }
        // Exclusion group: the donor's particles followed by the acceptor's particles.
        index -= force.getNumAcceptors();
        int donor, acceptor;
        force.getExclusionParticles(index, donor, acceptor);
        particles.clear();
        force.getDonorParameters(donor, p1, p2, p3, parameters);
        particles.push_back(p1);
        if (p2 > -1)
            particles.push_back(p2);
        if (p3 > -1)
            particles.push_back(p3);
        force.getAcceptorParameters(acceptor, p1, p2, p3, parameters);
        particles.push_back(p1);
        if (p2 > -1)
            particles.push_back(p2);
        if (p3 > -1)
            particles.push_back(p3);
    }
    /**
     * Two donor groups, or two acceptor groups, are identical when their parameter
     * vectors compare equal.  Groups of different kinds are never identical, and two
     * exclusion groups are always reported as identical.
     */
    bool areGroupsIdentical(int group1, int group2) {
        int p1, p2, p3;
        thread_local static vector params1, params2;
        if (group1 < force.getNumDonors() && group2 < force.getNumDonors()) {
            force.getDonorParameters(group1, p1, p2, p3, params1);
            force.getDonorParameters(group2, p1, p2, p3, params2);
            return (params1 == params2);
        }
        // Exactly one of the two groups is a donor.
        if (group1 < force.getNumDonors() || group2 < force.getNumDonors())
            return false;
        group1 -= force.getNumDonors();
        group2 -= force.getNumDonors();
        if (group1 < force.getNumAcceptors() && group2 < force.getNumAcceptors()) {
            force.getAcceptorParameters(group1, p1, p2, p3, params1);
            force.getAcceptorParameters(group2, p1, p2, p3, params2);
            return (params1 == params2);
        }
        // Exactly one of the two groups is an acceptor.
        if (group1 < force.getNumAcceptors() || group2 < force.getNumAcceptors())
            return false;
        // Both groups are exclusions.
        return true;
    }
private:
    const CustomHbondForce& force;
};

/**
 * Select this kernel's context, then release the donor and acceptor parameter sets.
 */
CommonCalcCustomHbondForceKernel::~CommonCalcCustomHbondForceKernel() {
    ContextSelector selector(cc);
    if (donorParams != NULL)
        delete donorParams;
    if (acceptorParams != NULL)
        delete acceptorParams;
}

/**
 * Append to `apply` the statement that adds `value` to the force on one atom of a donor or
 * acceptor.  When `trim` is true the value is wrapped in trimTo3().
 */
static void applyDonorAndAcceptorForces(stringstream& apply, int atom, const string& value, bool trim=true) {
    string forceNames[] = {"f1", "f2", "f3"};
    string toAdd = (trim ? "trimTo3("+value+")" : value);
    if (atom < 3)
        // NOTE(review): the text appears to be damaged from the next statement onward. The rest of
        // this function and the signature and opening statements of the function that the following
        // code belongs to are missing, and template argument lists look stripped. Restore this
        // region from the upstream file before editing it.
        apply << "localData[tbx+index]." << forceNames[atom]<<" += "<(cc, numDonors, "customHbondDonors");
    acceptors.initialize(cc, numAcceptors, "customHbondAcceptors");
    donorParams = new ComputeParameterSet(cc, force.getNumPerDonorParameters(), numDonors, "customHbondDonorParameters");
    acceptorParams = new ComputeParameterSet(cc, force.getNumPerAcceptorParameters(), numAcceptors, "customHbondAcceptorParameters");
    if (force.getNumGlobalParameters() > 0)
        globals.initialize(cc, force.getNumGlobalParameters(), "customHbondGlobals");
    vector > donorParamVector(numDonors);
    vector donorVector(numDonors);
    for (int i = 0; i < numDonors; i++) {
        vector parameters;
        force.getDonorParameters(startIndex+i, donorVector[i].x, donorVector[i].y, donorVector[i].z, parameters);
        donorParamVector[i].resize(parameters.size());
        for (int j = 0; j < (int) parameters.size(); j++)
            donorParamVector[i][j] = (float) parameters[j];
    }
    donors.upload(donorVector);
    donorParams->setParameterValues(donorParamVector);
    vector > acceptorParamVector(numAcceptors);
    vector acceptorVector(numAcceptors);
    for (int i = 0; i < numAcceptors; i++) {
        vector parameters;
        force.getAcceptorParameters(i, acceptorVector[i].x, acceptorVector[i].y, acceptorVector[i].z, parameters);
        acceptorParamVector[i].resize(parameters.size());
        for (int j = 0; j < (int) parameters.size(); j++)
acceptorParamVector[i][j] = (float) parameters[j]; } acceptors.upload(acceptorVector); acceptorParams->setParameterValues(acceptorParamVector); info = new ForceInfo(force); cc.addForce(info); // Decide whether to use bounding boxes to accelerate the calculation. int numDonorBlocks = (numDonors+31)/32; int numAcceptorBlocks = (numAcceptors+31)/32; useBoundingBoxes = (force.getNonbondedMethod() != CustomHbondForce::NoCutoff && numDonorBlocks*numAcceptorBlocks > cc.getNumThreadBlocks()); if (useBoundingBoxes) { int elementSize = (cc.getUseDoublePrecision() ? sizeof(double) : sizeof(float)); donorBlockCenter.initialize(cc, numDonorBlocks, 4*elementSize, "donorBlockCenter"); donorBlockSize.initialize(cc, numDonorBlocks, 4*elementSize, "donorBlockSize"); acceptorBlockCenter.initialize(cc, numAcceptorBlocks, 4*elementSize, "acceptorBlockCenter"); acceptorBlockSize.initialize(cc, numAcceptorBlocks, 4*elementSize, "acceptorBlockSize"); } // Record exclusions. vector donorExclusionVector(numDonors, mm_int4(-1, -1, -1, -1)); vector acceptorExclusionVector(numAcceptors, mm_int4(-1, -1, -1, -1)); for (int i = 0; i < force.getNumExclusions(); i++) { int donor, acceptor; force.getExclusionParticles(i, donor, acceptor); if (donor < startIndex || donor >= endIndex) continue; donor -= startIndex; if (donorExclusionVector[donor].x == -1) donorExclusionVector[donor].x = acceptor; else if (donorExclusionVector[donor].y == -1) donorExclusionVector[donor].y = acceptor; else if (donorExclusionVector[donor].z == -1) donorExclusionVector[donor].z = acceptor; else if (donorExclusionVector[donor].w == -1) donorExclusionVector[donor].w = acceptor; else throw OpenMMException("CustomHbondForce: this platform does not support more than four exclusions per donor"); if (acceptorExclusionVector[acceptor].x == -1) acceptorExclusionVector[acceptor].x = donor; else if (acceptorExclusionVector[acceptor].y == -1) acceptorExclusionVector[acceptor].y = donor; else if (acceptorExclusionVector[acceptor].z == 
-1) acceptorExclusionVector[acceptor].z = donor; else if (acceptorExclusionVector[acceptor].w == -1) acceptorExclusionVector[acceptor].w = donor; else throw OpenMMException("CustomHbondForce: this platform does not support more than four exclusions per acceptor"); } donorExclusions.initialize(cc, numDonors, "customHbondDonorExclusions"); acceptorExclusions.initialize(cc, numAcceptors, "customHbondAcceptorExclusions"); donorExclusions.upload(donorExclusionVector); acceptorExclusions.upload(acceptorExclusionVector); // Record the tabulated functions. map functions; vector > functionDefinitions; vector functionList; stringstream tableArgs; tabulatedFunctionArrays.resize(force.getNumTabulatedFunctions()); for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { functionList.push_back(&force.getTabulatedFunction(i)); string name = force.getTabulatedFunctionName(i); tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); string arrayName = "table"+cc.intToString(i); functionDefinitions.push_back(make_pair(name, arrayName)); functions[name] = cc.getExpressionUtilities().getFunctionPlaceholder(force.getTabulatedFunction(i)); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].initialize(cc, f.size(), "TabulatedFunction"); tabulatedFunctionArrays[i].upload(f); tableArgs << ", GLOBAL const float"; if (width > 1) tableArgs << width; tableArgs << "* RESTRICT " << arrayName; } // Record information about parameters. 
globalParamNames.resize(force.getNumGlobalParameters()); globalParamValues.resize(force.getNumGlobalParameters()); for (int i = 0; i < force.getNumGlobalParameters(); i++) { globalParamNames[i] = force.getGlobalParameterName(i); globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i); } if (globals.isInitialized()) globals.upload(globalParamValues); map variables; for (int i = 0; i < force.getNumPerDonorParameters(); i++) { const string& name = force.getPerDonorParameterName(i); variables[name] = "donorParams"+donorParams->getParameterSuffix(i); } for (int i = 0; i < force.getNumPerAcceptorParameters(); i++) { const string& name = force.getPerAcceptorParameterName(i); variables[name] = "acceptorParams"+acceptorParams->getParameterSuffix(i); } for (int i = 0; i < force.getNumGlobalParameters(); i++) { const string& name = force.getGlobalParameterName(i); variables[name] = "globals["+cc.intToString(i)+"]"; } // Now to generate the kernel. First, it needs to calculate all distances, angles, // and dihedrals the expression depends on. 
map > distances; map > angles; map > dihedrals; Lepton::ParsedExpression energyExpression = CustomHbondForceImpl::prepareExpression(force, functions, distances, angles, dihedrals); map forceExpressions; set computedDeltas; computedDeltas.insert("D1A1"); string atomNames[] = {"A1", "A2", "A3", "D1", "D2", "D3"}; string atomNamesLower[] = {"a1", "a2", "a3", "d1", "d2", "d3"}; stringstream compute, extraArgs; int index = 0; for (auto& distance : distances) { const vector& atoms = distance.second; string deltaName = atomNames[atoms[0]]+atomNames[atoms[1]]; if (computedDeltas.count(deltaName) == 0) { compute << "real4 delta"+deltaName+" = delta("+atomNamesLower[atoms[0]]+", "+atomNamesLower[atoms[1]]+", periodicBoxSize, invPeriodicBoxSize, periodicBoxVecX, periodicBoxVecY, periodicBoxVecZ);\n"; computedDeltas.insert(deltaName); } compute << "real r_"+deltaName+" = SQRT(delta"+deltaName+".w);\n"; variables[distance.first] = "r_"+deltaName; forceExpressions["real dEdDistance"+cc.intToString(index)+" = "] = energyExpression.differentiate(distance.first).optimize(); index++; } index = 0; for (auto& angle : angles) { const vector& atoms = angle.second; string deltaName1 = atomNames[atoms[1]]+atomNames[atoms[0]]; string deltaName2 = atomNames[atoms[1]]+atomNames[atoms[2]]; string angleName = "angle_"+atomNames[atoms[0]]+atomNames[atoms[1]]+atomNames[atoms[2]]; if (computedDeltas.count(deltaName1) == 0) { compute << "real4 delta"+deltaName1+" = delta("+atomNamesLower[atoms[1]]+", "+atomNamesLower[atoms[0]]+", periodicBoxSize, invPeriodicBoxSize, periodicBoxVecX, periodicBoxVecY, periodicBoxVecZ);\n"; computedDeltas.insert(deltaName1); } if (computedDeltas.count(deltaName2) == 0) { compute << "real4 delta"+deltaName2+" = delta("+atomNamesLower[atoms[1]]+", "+atomNamesLower[atoms[2]]+", periodicBoxSize, invPeriodicBoxSize, periodicBoxVecX, periodicBoxVecY, periodicBoxVecZ);\n"; computedDeltas.insert(deltaName2); } compute << "real "+angleName+" = 
computeAngle(delta"+deltaName1+", delta"+deltaName2+");\n"; variables[angle.first] = angleName; forceExpressions["real dEdAngle"+cc.intToString(index)+" = "] = energyExpression.differentiate(angle.first).optimize(); index++; } index = 0; for (auto& dihedral : dihedrals) { const vector& atoms = dihedral.second; string deltaName1 = atomNames[atoms[0]]+atomNames[atoms[1]]; string deltaName2 = atomNames[atoms[2]]+atomNames[atoms[1]]; string deltaName3 = atomNames[atoms[2]]+atomNames[atoms[3]]; string crossName1 = "cross_"+deltaName1+"_"+deltaName2; string crossName2 = "cross_"+deltaName2+"_"+deltaName3; string dihedralName = "dihedral_"+atomNames[atoms[0]]+atomNames[atoms[1]]+atomNames[atoms[2]]+atomNames[atoms[3]]; if (computedDeltas.count(deltaName1) == 0) { compute << "real4 delta"+deltaName1+" = delta("+atomNamesLower[atoms[0]]+", "+atomNamesLower[atoms[1]]+", periodicBoxSize, invPeriodicBoxSize, periodicBoxVecX, periodicBoxVecY, periodicBoxVecZ);\n"; computedDeltas.insert(deltaName1); } if (computedDeltas.count(deltaName2) == 0) { compute << "real4 delta"+deltaName2+" = delta("+atomNamesLower[atoms[2]]+", "+atomNamesLower[atoms[1]]+", periodicBoxSize, invPeriodicBoxSize, periodicBoxVecX, periodicBoxVecY, periodicBoxVecZ);\n"; computedDeltas.insert(deltaName2); } if (computedDeltas.count(deltaName3) == 0) { compute << "real4 delta"+deltaName3+" = delta("+atomNamesLower[atoms[2]]+", "+atomNamesLower[atoms[3]]+", periodicBoxSize, invPeriodicBoxSize, periodicBoxVecX, periodicBoxVecY, periodicBoxVecZ);\n"; computedDeltas.insert(deltaName3); } compute << "real4 "+crossName1+" = computeCross(delta"+deltaName1+", delta"+deltaName2+");\n"; compute << "real4 "+crossName2+" = computeCross(delta"+deltaName2+", delta"+deltaName3+");\n"; compute << "real "+dihedralName+" = computeAngle("+crossName1+", "+crossName2+");\n"; compute << dihedralName+" *= (delta"+deltaName1+".x*"+crossName2+".x + delta"+deltaName1+".y*"+crossName2+".y + delta"+deltaName1+".z*"+crossName2+".z < 0 ? 
-1 : 1);\n"; variables[dihedral.first] = dihedralName; forceExpressions["real dEdDihedral"+cc.intToString(index)+" = "] = energyExpression.differentiate(dihedral.first).optimize(); index++; } // Next it needs to load parameters from global memory. if (force.getNumGlobalParameters() > 0) extraArgs << ", GLOBAL const float* RESTRICT globals"; for (int i = 0; i < (int) donorParams->getParameterInfos().size(); i++) { ComputeParameterInfo& parameter = donorParams->getParameterInfos()[i]; extraArgs << ", GLOBAL const "+parameter.getType()+"* RESTRICT donor"+parameter.getName(); compute << parameter.getType()+" donorParams"+cc.intToString(i+1)+" = donor"+parameter.getName()+"[donorIndex];\n"; } for (int i = 0; i < (int) acceptorParams->getParameterInfos().size(); i++) { ComputeParameterInfo& parameter = acceptorParams->getParameterInfos()[i]; extraArgs << ", GLOBAL const "+parameter.getType()+"* RESTRICT acceptor"+parameter.getName(); compute << parameter.getType()+" acceptorParams"+cc.intToString(i+1)+" = acceptor"+parameter.getName()+"[acceptorIndex];\n"; } // Now evaluate the expressions. forceExpressions["energy += "] = energyExpression; compute << cc.getExpressionUtilities().createExpressions(forceExpressions, variables, functionList, functionDefinitions, "temp"); // Finally, apply forces to atoms. 
index = 0; for (auto& distance : distances) { const vector& atoms = distance.second; string deltaName = atomNames[atoms[0]]+atomNames[atoms[1]]; string value = "(dEdDistance"+cc.intToString(index)+"/r_"+deltaName+")*delta"+deltaName; applyDonorAndAcceptorForces(compute, atoms[0], "-"+value); applyDonorAndAcceptorForces(compute, atoms[1], value); index++; } index = 0; for (auto& angle : angles) { const vector& atoms = angle.second; string deltaName1 = atomNames[atoms[1]]+atomNames[atoms[0]]; string deltaName2 = atomNames[atoms[1]]+atomNames[atoms[2]]; compute << "{\n"; compute << "real3 crossProd = trimTo3(cross(delta"+deltaName2+", delta"+deltaName1+"));\n"; compute << "real lengthCross = max(SQRT(dot(crossProd,crossProd)), (real) 1e-6f);\n"; compute << "real3 deltaCross0 = -cross(trimTo3(delta"+deltaName1+"), crossProd)*dEdAngle"+cc.intToString(index)+"/(delta"+deltaName1+".w*lengthCross);\n"; compute << "real3 deltaCross2 = cross(trimTo3(delta"+deltaName2+"), crossProd)*dEdAngle"+cc.intToString(index)+"/(delta"+deltaName2+".w*lengthCross);\n"; compute << "real3 deltaCross1 = -(deltaCross0+deltaCross2);\n"; applyDonorAndAcceptorForces(compute, atoms[0], "deltaCross0", false); applyDonorAndAcceptorForces(compute, atoms[1], "deltaCross1", false); applyDonorAndAcceptorForces(compute, atoms[2], "deltaCross2", false); compute << "}\n"; index++; } index = 0; for (auto& dihedral : dihedrals) { const vector& atoms = dihedral.second; string deltaName1 = atomNames[atoms[0]]+atomNames[atoms[1]]; string deltaName2 = atomNames[atoms[2]]+atomNames[atoms[1]]; string deltaName3 = atomNames[atoms[2]]+atomNames[atoms[3]]; string crossName1 = "cross_"+deltaName1+"_"+deltaName2; string crossName2 = "cross_"+deltaName2+"_"+deltaName3; compute << "{\n"; compute << "real r = SQRT(delta"+deltaName2+".w);\n"; compute << "real4 ff;\n"; compute << "ff.x = (-dEdDihedral"+cc.intToString(index)+"*r)/"+crossName1+".w;\n"; compute << "ff.y = (delta"+deltaName1+".x*delta"+deltaName2+".x + 
delta"+deltaName1+".y*delta"+deltaName2+".y + delta"+deltaName1+".z*delta"+deltaName2+".z)/delta"+deltaName2+".w;\n"; compute << "ff.z = (delta"+deltaName3+".x*delta"+deltaName2+".x + delta"+deltaName3+".y*delta"+deltaName2+".y + delta"+deltaName3+".z*delta"+deltaName2+".z)/delta"+deltaName2+".w;\n"; compute << "ff.w = (dEdDihedral"+cc.intToString(index)+"*r)/"+crossName2+".w;\n"; compute << "real4 internalF0 = ff.x*"+crossName1+";\n"; compute << "real4 internalF3 = ff.w*"+crossName2+";\n"; compute << "real4 s = ff.y*internalF0 - ff.z*internalF3;\n"; applyDonorAndAcceptorForces(compute, atoms[0], "internalF0"); applyDonorAndAcceptorForces(compute, atoms[1], "s-internalF0"); applyDonorAndAcceptorForces(compute, atoms[2], "-s-internalF3"); applyDonorAndAcceptorForces(compute, atoms[3], "internalF3"); compute << "}\n"; index++; } // Generate the kernels. map replacements; replacements["COMPUTE_FORCE"] = compute.str(); replacements["PARAMETER_ARGUMENTS"] = extraArgs.str()+tableArgs.str(); map defines; defines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms()); defines["NUM_DONORS"] = cc.intToString(numDonors); defines["NUM_ACCEPTORS"] = cc.intToString(numAcceptors); defines["NUM_DONOR_BLOCKS"] = cc.intToString(numDonorBlocks); defines["NUM_ACCEPTOR_BLOCKS"] = cc.intToString(numAcceptorBlocks); defines["M_PI"] = cc.doubleToString(M_PI); defines["THREAD_BLOCK_SIZE"] = "128"; if (force.getNonbondedMethod() != CustomHbondForce::NoCutoff) { defines["USE_CUTOFF"] = "1"; defines["CUTOFF_SQUARED"] = cc.doubleToString(force.getCutoffDistance()*force.getCutoffDistance()); } if (force.getNonbondedMethod() != CustomHbondForce::NoCutoff && force.getNonbondedMethod() != CustomHbondForce::CutoffNonPeriodic) defines["USE_PERIODIC"] = "1"; if (force.getNumExclusions() > 0) defines["USE_EXCLUSIONS"] = "1"; if (useBoundingBoxes) defines["USE_BOUNDING_BOXES"] = "1"; ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::customHbondForce, replacements), 
defines); blockBoundsKernel = program->createKernel("findBlockBounds"); forceKernel = program->createKernel("computeHbondForces"); } double CommonCalcCustomHbondForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { if (numDonors == 0 || numAcceptors == 0) return 0.0; ContextSelector selector(cc); if (globals.isInitialized()) { bool changed = false; for (int i = 0; i < (int) globalParamNames.size(); i++) { float value = (float) context.getParameter(globalParamNames[i]); if (value != globalParamValues[i]) changed = true; globalParamValues[i] = value; } if (changed) globals.upload(globalParamValues); } if (!hasInitializedKernel) { hasInitializedKernel = true; if (useBoundingBoxes) { blockBoundsKernel->addArg(donors); blockBoundsKernel->addArg(acceptors); for (int i = 0; i < 5; i++) blockBoundsKernel->addArg(); // Periodic box size arguments are set when the kernel is executed. blockBoundsKernel->addArg(cc.getPosq()); blockBoundsKernel->addArg(donorBlockCenter); blockBoundsKernel->addArg(donorBlockSize); blockBoundsKernel->addArg(acceptorBlockCenter); blockBoundsKernel->addArg(acceptorBlockSize); } forceKernel->addArg(cc.getLongForceBuffer()); forceKernel->addArg(cc.getEnergyBuffer()); forceKernel->addArg(cc.getPosq()); forceKernel->addArg(donorExclusions); forceKernel->addArg(donors); forceKernel->addArg(acceptors); for (int i = 0; i < 5; i++) forceKernel->addArg(); // Periodic box size arguments are set when the kernel is executed. 
if (useBoundingBoxes) { forceKernel->addArg(donorBlockCenter); forceKernel->addArg(donorBlockSize); forceKernel->addArg(acceptorBlockCenter); forceKernel->addArg(acceptorBlockSize); } if (globals.isInitialized()) forceKernel->addArg(globals); for (auto& parameter : donorParams->getParameterInfos()) forceKernel->addArg(parameter.getArray()); for (auto& parameter : acceptorParams->getParameterInfos()) forceKernel->addArg(parameter.getArray()); for (auto& function : tabulatedFunctionArrays) forceKernel->addArg(function); } if (useBoundingBoxes) { setPeriodicBoxArgs(cc, blockBoundsKernel, 2); blockBoundsKernel->execute(max(numDonors, numAcceptors)); } setPeriodicBoxArgs(cc, forceKernel, 6); int numDonorBlocks = (numDonors+31)/32; int numAcceptorBlocks = (numAcceptors+31)/32; forceKernel->execute(numDonorBlocks*numAcceptorBlocks*32, cc.getIsCPU() ? 32 : 128); return 0.0; } void CommonCalcCustomHbondForceKernel::copyParametersToContext(ContextImpl& context, const CustomHbondForce& force) { ContextSelector selector(cc); int numContexts = cc.getNumContexts(); int startIndex = cc.getContextIndex()*force.getNumDonors()/numContexts; int endIndex = (cc.getContextIndex()+1)*force.getNumDonors()/numContexts; if (numDonors != endIndex-startIndex) throw OpenMMException("updateParametersInContext: The number of donors has changed"); if (numAcceptors != force.getNumAcceptors()) throw OpenMMException("updateParametersInContext: The number of acceptors has changed"); // Record the per-donor parameters. if (numDonors > 0) { vector > donorParamVector(numDonors); vector parameters; for (int i = 0; i < numDonors; i++) { int d1, d2, d3; force.getDonorParameters(startIndex+i, d1, d2, d3, parameters); donorParamVector[i].resize(parameters.size()); for (int j = 0; j < (int) parameters.size(); j++) donorParamVector[i][j] = (float) parameters[j]; } donorParams->setParameterValues(donorParamVector); } // Record the per-acceptor parameters. 
if (numAcceptors > 0) { vector > acceptorParamVector(numAcceptors); vector parameters; for (int i = 0; i < numAcceptors; i++) { int a1, a2, a3; force.getAcceptorParameters(i, a1, a2, a3, parameters); acceptorParamVector[i].resize(parameters.size()); for (int j = 0; j < (int) parameters.size(); j++) acceptorParamVector[i][j] = (float) parameters[j]; } acceptorParams->setParameterValues(acceptorParamVector); } // See if any tabulated functions have changed. for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { string name = force.getTabulatedFunctionName(i); if (force.getTabulatedFunction(i).getUpdateCount() != tabulatedFunctionUpdateCount[name]) { tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].upload(f); } } // Mark that the current reordering may be invalid. cc.invalidateMolecules(info); } class CommonCalcCustomManyParticleForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const CustomManyParticleForce& force) : force(force) { } bool areParticlesIdentical(int particle1, int particle2) { thread_local static vector params1, params2; int type1, type2; force.getParticleParameters(particle1, params1, type1); force.getParticleParameters(particle2, params2, type2); if (type1 != type2) return false; for (int i = 0; i < (int) params1.size(); i++) if (params1[i] != params2[i]) return false; return true; } int getNumParticleGroups() { return force.getNumExclusions(); } void getParticlesInGroup(int index, vector& particles) { int particle1, particle2; force.getExclusionParticles(index, particle1, particle2); particles.resize(2); particles[0] = particle1; particles[1] = particle2; } bool areGroupsIdentical(int group1, int group2) { return true; } private: const CustomManyParticleForce& force; }; 
CommonCalcCustomManyParticleForceKernel::~CommonCalcCustomManyParticleForceKernel() { ContextSelector selector(cc); if (params != NULL) delete params; } void CommonCalcCustomManyParticleForceKernel::initialize(const System& system, const CustomManyParticleForce& force) { ContextSelector selector(cc); int numParticles = force.getNumParticles(); int particlesPerSet = force.getNumParticlesPerSet(); bool centralParticleMode = (force.getPermutationMode() == CustomManyParticleForce::UniqueCentralParticle); nonbondedMethod = CalcCustomManyParticleForceKernel::NonbondedMethod(force.getNonbondedMethod()); forceWorkgroupSize = 128; findNeighborsWorkgroupSize = (cc.getSIMDWidth() >= 32 ? 128 : 32); // Record parameter values. params = new ComputeParameterSet(cc, force.getNumPerParticleParameters(), numParticles, "customManyParticleParameters"); vector > paramVector(numParticles); for (int i = 0; i < numParticles; i++) { vector parameters; int type; force.getParticleParameters(i, parameters, type); paramVector[i].resize(parameters.size()); for (int j = 0; j < (int) parameters.size(); j++) paramVector[i][j] = (float) parameters[j]; } params->setParameterValues(paramVector); info = new ForceInfo(force); cc.addForce(info); // Record the tabulated functions. 
map functions; vector > functionDefinitions; vector functionList; stringstream tableArgs; tabulatedFunctionArrays.resize(force.getNumTabulatedFunctions()); for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { functionList.push_back(&force.getTabulatedFunction(i)); string name = force.getTabulatedFunctionName(i); tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); string arrayName = "table"+cc.intToString(i); functionDefinitions.push_back(make_pair(name, arrayName)); functions[name] = cc.getExpressionUtilities().getFunctionPlaceholder(force.getTabulatedFunction(i)); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].initialize(cc, f.size(), "TabulatedFunction"); tabulatedFunctionArrays[i].upload(f); tableArgs << ", GLOBAL const float"; if (width > 1) tableArgs << width; tableArgs << "* RESTRICT " << arrayName; } // Record information about parameters. globalParamNames.resize(force.getNumGlobalParameters()); globalParamValues.resize(force.getNumGlobalParameters()); for (int i = 0; i < force.getNumGlobalParameters(); i++) { globalParamNames[i] = force.getGlobalParameterName(i); globalParamValues[i] = (float) force.getGlobalParameterDefaultValue(i); } vector > variables; for (int i = 0; i < particlesPerSet; i++) { string index = cc.intToString(i+1); variables.push_back(makeVariable("x"+index, "pos"+index+".x")); variables.push_back(makeVariable("y"+index, "pos"+index+".y")); variables.push_back(makeVariable("z"+index, "pos"+index+".z")); } for (int i = 0; i < force.getNumPerParticleParameters(); i++) { const string& name = force.getPerParticleParameterName(i); for (int j = 0; j < particlesPerSet; j++) { string index = cc.intToString(j+1); variables.push_back(makeVariable(name+index, "((real) params"+params->getParameterSuffix(i, index)+")")); } } if (force.getNumGlobalParameters() > 0) { globals.initialize(cc, 
force.getNumGlobalParameters(), "customManyParticleGlobals"); globals.upload(globalParamValues); for (int i = 0; i < force.getNumGlobalParameters(); i++) { const string& name = force.getGlobalParameterName(i); string value = "globals["+cc.intToString(i)+"]"; variables.push_back(makeVariable(name, value)); } } // Build data structures for type filters. vector particleTypesVec; vector orderIndexVec; vector > particleOrderVec; int numTypes; CustomManyParticleForceImpl::buildFilterArrays(force, numTypes, particleTypesVec, orderIndexVec, particleOrderVec); bool hasTypeFilters = (particleOrderVec.size() > 1); if (hasTypeFilters) { particleTypes.initialize(cc, particleTypesVec.size(), "customManyParticleTypes"); orderIndex.initialize(cc, orderIndexVec.size(), "customManyParticleOrderIndex"); particleOrder.initialize(cc, particleOrderVec.size()*particlesPerSet, "customManyParticleOrder"); particleTypes.upload(particleTypesVec); orderIndex.upload(orderIndexVec); vector flattenedOrder(particleOrder.getSize()); for (int i = 0; i < (int) particleOrderVec.size(); i++) for (int j = 0; j < particlesPerSet; j++) flattenedOrder[i*particlesPerSet+j] = particleOrderVec[i][j]; particleOrder.upload(flattenedOrder); } // Build data structures for exclusions. 
if (force.getNumExclusions() > 0) { vector > particleExclusions(numParticles); for (int i = 0; i < force.getNumExclusions(); i++) { int p1, p2; force.getExclusionParticles(i, p1, p2); particleExclusions[p1].push_back(p2); particleExclusions[p2].push_back(p1); } vector exclusionsVec; vector exclusionStartIndexVec(numParticles+1); exclusionStartIndexVec[0] = 0; for (int i = 0; i < numParticles; i++) { sort(particleExclusions[i].begin(), particleExclusions[i].end()); exclusionsVec.insert(exclusionsVec.end(), particleExclusions[i].begin(), particleExclusions[i].end()); exclusionStartIndexVec[i+1] = exclusionsVec.size(); } exclusions.initialize(cc, exclusionsVec.size(), "customManyParticleExclusions"); exclusionStartIndex.initialize(cc, exclusionStartIndexVec.size(), "customManyParticleExclusionStart"); exclusions.upload(exclusionsVec); exclusionStartIndex.upload(exclusionStartIndexVec); } // Build data structures for the neighbor list. int numAtomBlocks = cc.getPaddedNumAtoms()/32; if (nonbondedMethod != NoCutoff) { int elementSize = (cc.getUseDoublePrecision() ? sizeof(double) : sizeof(float)); blockCenter.initialize(cc, numAtomBlocks, 4*elementSize, "blockCenter"); blockBoundingBox.initialize(cc, numAtomBlocks, 4*elementSize, "blockBoundingBox"); numNeighborPairs.initialize(cc, 1, "customManyParticleNumNeighborPairs"); neighborStartIndex.initialize(cc, numParticles+1, "customManyParticleNeighborStartIndex"); numNeighborsForAtom.initialize(cc, numParticles, "customManyParticleNumNeighborsForAtom"); // Select a size for the array that holds the neighbor list. We have to make a fairly // arbitrary guess, but if this turns out to be too small we'll increase it later. maxNeighborPairs = 150*numParticles; neighborPairs.initialize(cc, maxNeighborPairs, "customManyParticleNeighborPairs"); neighbors.initialize(cc, maxNeighborPairs, "customManyParticleNeighbors"); } // Generate the kernel. 
Lepton::ParsedExpression energyExpression = CustomManyParticleForceImpl::prepareExpression(force, functions); map forceExpressions; stringstream compute; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& parameter = params->getParameterInfos()[i]; compute<getParameterInfos().size(); j++) loadData<getParameterInfos()[j].getType()<<" params"<<(j+1)<<(i+1)<<" = global_params"<<(j+1)<<"[atom"<<(i+1)<<"];\n"; } if (centralParticleMode) { for (int i = 1; i < particlesPerSet; i++) { if (i > 1) isValidCombination<<" && p"<<(i+1)<<">p"< 2) isValidCombination<<" && "; isValidCombination<<"a"<<(i+1)<<">a"< 1) numCombinations<<"*"; numCombinations<<"numNeighbors"; if (centralParticleMode) atomsForCombination<<"int a"<<(i+1)<<" = tempIndex%numNeighbors;\n"; else atomsForCombination<<"int a"<<(i+1)<<" = 1+tempIndex%numNeighbors;\n"; if (i < particlesPerSet-1) atomsForCombination<<"tempIndex /= numNeighbors;\n"; } if (particlesPerSet > 2) { if (centralParticleMode) atomsForCombination<<"a2 = (a3%2 == 0 ? a2 : numNeighbors-a2-1);\n"; else atomsForCombination<<"a2 = (a3%2 == 0 ? 
a2 : numNeighbors-a2+1);\n"; } for (int i = 1; i < particlesPerSet; i++) { if (nonbondedMethod == NoCutoff) { if (centralParticleMode) atomsForCombination<<"int p"<<(i+1)<<" = a"<<(i+1)<<";\n"; else atomsForCombination<<"int p"<<(i+1)<<" = p1+a"<<(i+1)<<";\n"; } else { if (centralParticleMode) atomsForCombination<<"int p"<<(i+1)<<" = neighbors[firstNeighbor+a"<<(i+1)<<"];\n"; else atomsForCombination<<"int p"<<(i+1)<<" = neighbors[firstNeighbor-1+a"<<(i+1)<<"];\n"; } } if (nonbondedMethod != NoCutoff) { for (int i = 1; i < particlesPerSet; i++) verifyCutoff<<"real3 pos"<<(i+1)<<" = trimTo3(posq[p"<<(i+1)<<"]);\n"; if (!centralParticleMode) { for (int i = 1; i < particlesPerSet; i++) { for (int j = i+1; j < particlesPerSet; j++) verifyCutoff<<"includeInteraction &= (delta(pos"<<(i+1)<<", pos"<<(j+1)<<", periodicBoxSize, invPeriodicBoxSize, periodicBoxVecX, periodicBoxVecY, periodicBoxVecZ).w < CUTOFF_SQUARED);\n"; } } } if (force.getNumExclusions() > 0) { int startCheckFrom = (nonbondedMethod == NoCutoff ? 0 : 1); for (int i = startCheckFrom; i < particlesPerSet; i++) for (int j = i+1; j < particlesPerSet; j++) verifyExclusions<<"includeInteraction &= !isInteractionExcluded(p"<<(i+1)<<", p"<<(j+1)<<", exclusions, exclusionStartIndex);\n"; } string computeTypeIndex = "particleTypes[p"+cc.intToString(particlesPerSet)+"]"; for (int i = particlesPerSet-2; i >= 0; i--) computeTypeIndex = "particleTypes[p"+cc.intToString(i+1)+"]+"+cc.intToString(numTypes)+"*("+computeTypeIndex+")"; // Create replacements for extra arguments. 
stringstream extraArgs; if (force.getNumGlobalParameters() > 0) extraArgs << ", GLOBAL const float* globals"; for (int i = 0; i < (int) params->getParameterInfos().size(); i++) { ComputeParameterInfo& parameter = params->getParameterInfos()[i]; extraArgs<<", GLOBAL const "< replacements; replacements["COMPUTE_INTERACTION"] = compute.str(); replacements["NUM_CANDIDATE_COMBINATIONS"] = numCombinations.str(); replacements["FIND_ATOMS_FOR_COMBINATION_INDEX"] = atomsForCombination.str(); replacements["IS_VALID_COMBINATION"] = isValidCombination.str(); replacements["VERIFY_CUTOFF"] = verifyCutoff.str(); replacements["VERIFY_EXCLUSIONS"] = verifyExclusions.str(); replacements["PERMUTE_ATOMS"] = permute.str(); replacements["LOAD_PARTICLE_DATA"] = loadData.str(); replacements["COMPUTE_TYPE_INDEX"] = computeTypeIndex; replacements["PARAMETER_ARGUMENTS"] = extraArgs.str()+tableArgs.str(); map defines; if (nonbondedMethod != NoCutoff) defines["USE_CUTOFF"] = "1"; if (nonbondedMethod == CutoffPeriodic) defines["USE_PERIODIC"] = "1"; if (centralParticleMode) defines["USE_CENTRAL_PARTICLE"] = "1"; if (hasTypeFilters) defines["USE_FILTERS"] = "1"; if (force.getNumExclusions() > 0) defines["USE_EXCLUSIONS"] = "1"; defines["NUM_ATOMS"] = cc.intToString(cc.getNumAtoms()); defines["PADDED_NUM_ATOMS"] = cc.intToString(cc.getPaddedNumAtoms()); defines["M_PI"] = cc.doubleToString(M_PI); defines["CUTOFF_SQUARED"] = cc.doubleToString(force.getCutoffDistance()*force.getCutoffDistance()); defines["TILE_SIZE"] = cc.intToString(32); defines["NUM_BLOCKS"] = cc.intToString(numAtomBlocks); defines["FIND_NEIGHBORS_WORKGROUP_SIZE"] = cc.intToString(findNeighborsWorkgroupSize); ComputeProgram program = cc.compileProgram(cc.replaceStrings(CommonKernelSources::pointFunctions+CommonKernelSources::customManyParticle, replacements), defines); forceKernel = program->createKernel("computeInteraction"); blockBoundsKernel = program->createKernel("findBlockBounds"); neighborsKernel = 
program->createKernel("findNeighbors"); startIndicesKernel = program->createKernel("computeNeighborStartIndices"); copyPairsKernel = program->createKernel("copyPairsToNeighborList"); event = cc.createEvent(); } double CommonCalcCustomManyParticleForceKernel::execute(ContextImpl& context, bool includeForces, bool includeEnergy) { ContextSelector selector(cc); if (!hasInitializedKernel) { hasInitializedKernel = true; // Set arguments for the force kernel. forceKernel->addArg(cc.getLongForceBuffer()); forceKernel->addArg(cc.getEnergyBuffer()); forceKernel->addArg(cc.getPosq()); for (int i = 0; i < 5; i++) forceKernel->addArg(); setPeriodicBoxArgs(cc, forceKernel, 3); if (nonbondedMethod != NoCutoff) { forceKernel->addArg(neighbors); forceKernel->addArg(neighborStartIndex); } if (particleTypes.isInitialized()) { forceKernel->addArg(particleTypes); forceKernel->addArg(orderIndex); forceKernel->addArg(particleOrder); } if (exclusions.isInitialized()) { forceKernel->addArg(exclusions); forceKernel->addArg(exclusionStartIndex); } if (globals.isInitialized()) forceKernel->addArg(globals); for (auto& parameter : params->getParameterInfos()) forceKernel->addArg(parameter.getArray()); for (auto& function : tabulatedFunctionArrays) forceKernel->addArg(function); if (nonbondedMethod != NoCutoff) { // Set arguments for the block bounds kernel. for (int i = 0; i < 5; i++) blockBoundsKernel->addArg(); // Periodic box information will be set just before it is executed. blockBoundsKernel->addArg(cc.getPosq()); blockBoundsKernel->addArg(blockCenter); blockBoundsKernel->addArg(blockBoundingBox); blockBoundsKernel->addArg(numNeighborPairs); // Set arguments for the neighbor list kernel. for (int i = 0; i < 5; i++) neighborsKernel->addArg(); // Periodic box information will be set just before it is executed. 
neighborsKernel->addArg(cc.getPosq()); neighborsKernel->addArg(blockCenter); neighborsKernel->addArg(blockBoundingBox); neighborsKernel->addArg(neighborPairs); neighborsKernel->addArg(numNeighborPairs); neighborsKernel->addArg(numNeighborsForAtom); neighborsKernel->addArg(maxNeighborPairs); if (exclusions.isInitialized()) { neighborsKernel->addArg(exclusions); neighborsKernel->addArg(exclusionStartIndex); } // Set arguments for the kernel to find neighbor list start indices. startIndicesKernel->addArg(numNeighborsForAtom); startIndicesKernel->addArg(neighborStartIndex); startIndicesKernel->addArg(numNeighborPairs); startIndicesKernel->addArg(maxNeighborPairs); // Set arguments for the kernel to assemble the final neighbor list. copyPairsKernel->addArg(neighborPairs); copyPairsKernel->addArg(neighbors); copyPairsKernel->addArg(numNeighborPairs); copyPairsKernel->addArg(maxNeighborPairs); copyPairsKernel->addArg(numNeighborsForAtom); copyPairsKernel->addArg(neighborStartIndex); } } if (globals.isInitialized()) { bool changed = false; for (int i = 0; i < (int) globalParamNames.size(); i++) { float value = (float) context.getParameter(globalParamNames[i]); if (value != globalParamValues[i]) changed = true; globalParamValues[i] = value; } if (changed) globals.upload(globalParamValues); } while (true) { int* numPairs = (int*) cc.getPinnedBuffer(); if (nonbondedMethod != NoCutoff) { setPeriodicBoxArgs(cc, forceKernel, 3); setPeriodicBoxArgs(cc, blockBoundsKernel, 0); setPeriodicBoxArgs(cc, neighborsKernel, 0); blockBoundsKernel->execute(cc.getPaddedNumAtoms()/32); neighborsKernel->execute(cc.getNumAtoms(), findNeighborsWorkgroupSize); // We need to make sure there was enough memory for the neighbor list. Download the // information asynchronously so kernels can be running at the same time. 
numNeighborPairs.download(numPairs, false); event->enqueue(); startIndicesKernel->execute(256, 256); copyPairsKernel->execute(maxNeighborPairs); } int maxThreads = min(cc.getNumAtoms()*forceWorkgroupSize, (int) cc.getEnergyBuffer().getSize()); forceKernel->execute(maxThreads, forceWorkgroupSize); if (nonbondedMethod != NoCutoff) { // Make sure there was enough memory for the neighbor list. event->wait(); if (*numPairs > maxNeighborPairs) { // Resize the arrays and run the calculation again. maxNeighborPairs = (int) (1.1*(*numPairs)); neighborPairs.resize(maxNeighborPairs); neighbors.resize(maxNeighborPairs); neighborsKernel->setArg(11, maxNeighborPairs); startIndicesKernel->setArg(3, maxNeighborPairs); copyPairsKernel->setArg(3, maxNeighborPairs); continue; } } break; } return 0.0; } void CommonCalcCustomManyParticleForceKernel::copyParametersToContext(ContextImpl& context, const CustomManyParticleForce& force) { ContextSelector selector(cc); int numParticles = force.getNumParticles(); if (numParticles != cc.getNumAtoms()) throw OpenMMException("updateParametersInContext: The number of particles has changed"); // Record the per-particle parameters. vector > paramVector(numParticles); vector parameters; int type; for (int i = 0; i < numParticles; i++) { force.getParticleParameters(i, parameters, type); paramVector[i].resize(parameters.size()); for (int j = 0; j < (int) parameters.size(); j++) paramVector[i][j] = (float) parameters[j]; } params->setParameterValues(paramVector); // See if any tabulated functions have changed. 
for (int i = 0; i < force.getNumTabulatedFunctions(); i++) { string name = force.getTabulatedFunctionName(i); if (force.getTabulatedFunction(i).getUpdateCount() != tabulatedFunctionUpdateCount[name]) { tabulatedFunctionUpdateCount[name] = force.getTabulatedFunction(i).getUpdateCount(); int width; vector f = cc.getExpressionUtilities().computeFunctionCoefficients(force.getTabulatedFunction(i), width); tabulatedFunctionArrays[i].upload(f); } } // Mark that the current reordering may be invalid. cc.invalidateMolecules(info); } class CommonCalcGayBerneForceKernel::ForceInfo : public ComputeForceInfo { public: ForceInfo(const GayBerneForce& force) : force(force) { } bool areParticlesIdentical(int particle1, int particle2) { int xparticle1, yparticle1; double sigma1, epsilon1, sx1, sy1, sz1, ex1, ey1, ez1; int xparticle2, yparticle2; double sigma2, epsilon2, sx2, sy2, sz2, ex2, ey2, ez2; force.getParticleParameters(particle1, sigma1, epsilon1, xparticle1, yparticle1, sx1, sy1, sz1, ex1, ey1, ez1); force.getParticleParameters(particle2, sigma2, epsilon2, xparticle2, yparticle2, sx2, sy2, sz2, ex2, ey2, ez2); return (sigma1 == sigma2 && epsilon1 == epsilon2 && sx1 == sx2 && sy1 == sy2 && sz1 == sz2 && ex1 == ex2 && ey1 == ey2 && ez1 == ez2); } int getNumParticleGroups() { return force.getNumExceptions()+force.getNumParticles(); } void getParticlesInGroup(int index, vector& particles) { if (index < force.getNumExceptions()) { int particle1, particle2; double sigma, epsilon; force.getExceptionParameters(index, particle1, particle2, sigma, epsilon); particles.resize(2); particles[0] = particle1; particles[1] = particle2; } else { int particle = index-force.getNumExceptions(); int xparticle, yparticle; double sigma, epsilon, sx, sy, sz, ex, ey, ez; force.getParticleParameters(particle, sigma, epsilon, xparticle, yparticle, sx, sy, sz, ex, ey, ez); particles.clear(); particles.push_back(particle); if (xparticle > -1) particles.push_back(xparticle); if (yparticle > -1) 
particles.push_back(yparticle); } } bool areGroupsIdentical(int group1, int group2) { if (group1 < force.getNumExceptions() && group2 < force.getNumExceptions()) { int particle1, particle2; double sigma1, sigma2, epsilon1, epsilon2; force.getExceptionParameters(group1, particle1, particle2, sigma1, epsilon1); force.getExceptionParameters(group2, particle1, particle2, sigma2, epsilon2); return (sigma1 == sigma2 && epsilon1 == epsilon2); } return true; } private: const GayBerneForce& force; }; class CommonCalcGayBerneForceKernel::ReorderListener : public ComputeContext::ReorderListener { public: ReorderListener(CommonCalcGayBerneForceKernel& owner) : owner(owner) { } void execute() { owner.sortAtoms(); } private: CommonCalcGayBerneForceKernel& owner; }; void CommonCalcGayBerneForceKernel::initialize(const System& system, const GayBerneForce& force) { // Initialize interactions. ContextSelector selector(cc); int numParticles = force.getNumParticles(); sigParams.initialize(cc, cc.getPaddedNumAtoms(), "sigParams"); epsParams.initialize(cc, cc.getPaddedNumAtoms(), "epsParams"); scale.initialize(cc, cc.getPaddedNumAtoms(), "scale"); axisParticleIndices.initialize(cc, cc.getPaddedNumAtoms(), "axisParticleIndices"); sortedParticles.initialize(cc, cc.getPaddedNumAtoms(), "sortedParticles"); aMatrix.initialize