/* -------------------------------------------------------------------------- * * OpenMM * * -------------------------------------------------------------------------- * * This is part of the OpenMM molecular simulation toolkit originating from * * Simbios, the NIH National Center for Physics-Based Simulation of * * Biological Structures at Stanford, funded under the NIH Roadmap for * * Medical Research, grant U54 GM072970. See https://simtk.org. * * * * Portions copyright (c) 2016 Stanford University and the Authors. * * Authors: Peter Eastman * * Contributors: * * * * Permission is hereby granted, free of charge, to any person obtaining a * * copy of this software and associated documentation files (the "Software"), * * to deal in the Software without restriction, including without limitation * * the rights to use, copy, modify, merge, publish, distribute, sublicense, * * and/or sell copies of the Software, and to permit persons to whom the * * Software is furnished to do so, subject to the following conditions: * * * * The above copyright notice and this permission notice shall be included in * * all copies or substantial portions of the Software. * * * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * * THE AUTHORS, CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, * * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR * * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE * * USE OR OTHER DEALINGS IN THE SOFTWARE. * * -------------------------------------------------------------------------- */ #include "CpuGayBerneForce.h" #include "ReferenceForce.h" #include "openmm/OpenMMException.h" #include "openmm/GayBerneForce.h" #include "openmm/internal/gmx_atomic.h" #include using namespace OpenMM; using namespace std; class CpuGayBerneForce::ComputeTask : public ThreadPool::Task { public: ComputeTask(CpuGayBerneForce& owner) : owner(owner) { } void execute(ThreadPool& threads, int threadIndex) { owner.threadComputeForce(threads, threadIndex); } CpuGayBerneForce& owner; }; CpuGayBerneForce::CpuGayBerneForce(const GayBerneForce& force) : neighborList(NULL) { // Record the force parameters. int numParticles = force.getNumParticles(); particles.resize(numParticles); for (int i = 0; i < numParticles; i++) { ParticleInfo& p = particles[i]; double sigma, epsilon, sx, sy, sz, ex, ey, ez; force.getParticleParameters(i, sigma, epsilon, p.xparticle, p.yparticle, sx, sy, sz, ex, ey, ez); p.sigmaOver2 = 0.5*sigma; p.sqrtEpsilon = sqrt(epsilon); p.rx = 0.5*sx; p.ry = 0.5*sy; p.rz = 0.5*sz; p.ex = ex; p.ey = ey; p.ez = ez; p.isPointParticle = (sx == sigma && sy == sigma && sz == sigma && ex == 1.0 && ey == 1.0 && ez == 1.0); } int numExceptions = force.getNumExceptions(); exceptions.resize(numExceptions); particleExclusions.resize(numParticles); for (int i = 0; i < numExceptions; i++) { ExceptionInfo& e = exceptions[i]; double sigma, epsilon; force.getExceptionParameters(i, e.particle1, e.particle2, sigma, epsilon); e.sigma = sigma; e.epsilon = epsilon; exclusions.insert(make_pair(min(e.particle1, e.particle2), max(e.particle1, e.particle2))); particleExclusions[e.particle1].insert(e.particle2); particleExclusions[e.particle2].insert(e.particle1); } nonbondedMethod = force.getNonbondedMethod(); cutoffDistance = force.getCutoffDistance(); switchingDistance = force.getSwitchingDistance(); useSwitchingFunction = force.getUseSwitchingFunction(); if (nonbondedMethod != GayBerneForce::NoCutoff) neighborList = new CpuNeighborList(4); // Allocate workspace for calculations. s.resize(numParticles); A.resize(numParticles); B.resize(numParticles); G.resize(numParticles); // We can precompute the shape factors. for (int i = 0; i < numParticles; i++) { ParticleInfo& p = particles[i]; s[i] = (p.rx*p.ry + p.rz*p.rz)*sqrtf(p.rx*p.ry); } } CpuGayBerneForce::~CpuGayBerneForce() { if (neighborList != NULL) delete neighborList; } RealOpenMM CpuGayBerneForce::calculateForce(const vector& positions, std::vector& forces, std::vector >& threadForce, RealVec* boxVectors, CpuPlatform::PlatformData& data) { if (nonbondedMethod == GayBerneForce::CutoffPeriodic) { double minAllowedSize = 1.999999*cutoffDistance; if (boxVectors[0][0] < minAllowedSize || boxVectors[1][1] < minAllowedSize || boxVectors[2][2] < minAllowedSize) throw OpenMMException("The periodic box size has decreased to less than twice the nonbonded cutoff."); } // Build the neighbor list. int numParticles = particles.size(); if (nonbondedMethod != GayBerneForce::NoCutoff) neighborList->computeNeighborList(numParticles, data.posq, particleExclusions, boxVectors, nonbondedMethod == GayBerneForce::CutoffPeriodic, cutoffDistance, data.threads); // First find the orientations of the particles and compute the matrices we'll be needing. computeEllipsoidFrames(positions); // Record the parameters for the threads. ThreadPool& threads = data.threads; int numThreads = threads.getNumThreads(); this->positions = &positions[0]; this->threadForce = &threadForce; this->boxVectors = boxVectors; threadEnergy.resize(numThreads); threadTorque.resize(numThreads); gmx_atomic_t counter; gmx_atomic_set(&counter, 0); this->atomicCounter = &counter; // Signal the threads to compute the pairwise interactions. ComputeTask task(*this); threads.execute(task); threads.waitForThreads(); // Signal the threads to compute exceptions. gmx_atomic_set(&counter, 0); threads.resumeThreads(); threads.waitForThreads(); // Combine the energies from all the threads. double energy = 0; for (int i = 0; i < numThreads; i++) energy += threadEnergy[i]; // Apply torques. applyTorques(positions, forces); return energy; } void CpuGayBerneForce::threadComputeForce(ThreadPool& threads, int threadIndex) { int numParticles = particles.size(); int numThreads = threads.getNumThreads(); threadEnergy[threadIndex] = 0; float* forces = &(*threadForce)[threadIndex][0]; vector& torques = threadTorque[threadIndex]; torques.resize(numParticles); for (int i = 0; i < numParticles; i++) torques[i] = RealVec(); double energy = 0.0; // Compute this thread's subset of interactions. if (neighborList == NULL) { while (true) { int i = gmx_atomic_fetch_add(reinterpret_cast(atomicCounter), 1); if (i >= numParticles) break; if (particles[i].sqrtEpsilon == 0.0f) continue; for (int j = 0; j < i; j++) { if (particles[j].sqrtEpsilon == 0.0f) continue; if (particleExclusions[i].find(j) != particleExclusions[i].end()) continue; // This interaction will be handled by an exception. RealOpenMM sigma = particles[i].sigmaOver2+particles[j].sigmaOver2; RealOpenMM epsilon = particles[i].sqrtEpsilon*particles[j].sqrtEpsilon; energy += computeOneInteraction(i, j, sigma, epsilon, positions, forces, torques, boxVectors); } } } else { while (true) { int blockIndex = gmx_atomic_fetch_add(reinterpret_cast(atomicCounter), 1); if (blockIndex >= neighborList->getNumBlocks()) break; const int* blockAtom = &neighborList->getSortedAtoms()[4*blockIndex]; const vector& neighbors = neighborList->getBlockNeighbors(blockIndex); const vector& exclusions = neighborList->getBlockExclusions(blockIndex); for (int i = 0; i < (int) neighbors.size(); i++) { int first = neighbors[i]; if (particles[first].sqrtEpsilon == 0.0f) continue; for (int k = 0; k < 4; k++) { if ((exclusions[i] & (1<(atomicCounter), groupSize); if (start >= numExceptions) break; int end = min(start+groupSize, numExceptions); for (int i = start; i < end; i++) { ExceptionInfo& e = exceptions[i]; energy += computeOneInteraction(e.particle1, e.particle2, e.sigma, e.epsilon, positions, forces, torques, boxVectors); } } threadEnergy[threadIndex] = energy; } void CpuGayBerneForce::computeEllipsoidFrames(const vector& positions) { int numParticles = particles.size(); for (int particle = 0; particle < numParticles; particle++) { ParticleInfo& p = particles[particle]; // Compute the local coordinate system of the ellipsoid; RealVec xdir, ydir, zdir; if (p.xparticle == -1) { xdir = RealVec(1, 0, 0); ydir = RealVec(0, 1, 0); } else { xdir = positions[particle]-positions[p.xparticle]; xdir /= SQRT(xdir.dot(xdir)); if (p.yparticle == -1) { if (xdir[1] > -0.5 && xdir[1] < 0.5) ydir = RealVec(0, 1, 0); else ydir = RealVec(1, 0, 0); } else ydir = positions[particle]-positions[p.yparticle]; ydir -= xdir*(xdir.dot(ydir)); ydir /= SQRT(ydir.dot(ydir)); } zdir = xdir.cross(ydir); // Compute matrices we will need later. RealOpenMM (&a)[3][3] = A[particle].v; RealOpenMM (&b)[3][3] = B[particle].v; RealOpenMM (&g)[3][3] = G[particle].v; a[0][0] = xdir[0]; a[0][1] = xdir[1]; a[0][2] = xdir[2]; a[1][0] = ydir[0]; a[1][1] = ydir[1]; a[1][2] = ydir[2]; a[2][0] = zdir[0]; a[2][1] = zdir[1]; a[2][2] = zdir[2]; RealVec r2(p.rx*p.rx, p.ry*p.ry, p.rz*p.rz); RealVec e2(1/sqrt(p.ex), 1/sqrt(p.ey), 1/sqrt(p.ez)); for (int i = 0; i < 3; i++) for (int j = 0; j < 3; j++) { b[i][j] = 0; g[i][j] = 0; for (int k = 0; k < 3; k++) { b[i][j] += a[k][i]*e2[k]*a[k][j]; g[i][j] += a[k][i]*r2[k]*a[k][j]; } } } } void CpuGayBerneForce::applyTorques(const vector& positions, vector& forces) { int numParticles = particles.size(); int numThreads = threadTorque.size(); for (int particle = 0; particle < numParticles; particle++) { ParticleInfo& p = particles[particle]; RealVec pos = positions[particle]; if (p.xparticle != -1) { // Add up the torques from the individual threads. RealVec torque; for (int i = 0; i < numThreads; i++) torque += threadTorque[i][particle]; // Apply a force to the x particle. RealVec dx = positions[p.xparticle]-pos; double dx2 = dx.dot(dx); RealVec f = torque.cross(dx)/dx2; forces[p.xparticle] += f; forces[particle] -= f; if (p.yparticle != -1) { // Apply a force to the y particle. This is based on the component of the torque // that was not already applied to the x particle. RealVec dy = positions[p.yparticle]-pos; double dy2 = dy.dot(dy); RealVec torque2 = dx*(torque.dot(dx)/dx2); f = torque2.cross(dy)/dy2; forces[p.yparticle] += f; forces[particle] -= f; } } } } RealOpenMM CpuGayBerneForce::computeOneInteraction(int particle1, int particle2, RealOpenMM sigma, RealOpenMM epsilon, const RealVec* positions, float* forces, vector& torques, const RealVec* boxVectors) { // Compute the displacement and check against the cutoff. RealOpenMM deltaR[ReferenceForce::LastDeltaRIndex]; if (nonbondedMethod == GayBerneForce::CutoffPeriodic) ReferenceForce::getDeltaRPeriodic(positions[particle2], positions[particle1], boxVectors, deltaR); else ReferenceForce::getDeltaR(positions[particle2], positions[particle1], deltaR); RealOpenMM r = deltaR[ReferenceForce::RIndex]; if (nonbondedMethod != GayBerneForce::NoCutoff && r >= cutoffDistance) return 0; RealOpenMM rInv = 1/r; RealVec dr(deltaR[ReferenceForce::XIndex], deltaR[ReferenceForce::YIndex], deltaR[ReferenceForce::ZIndex]); RealVec drUnit = dr*rInv; // Compute the switching function. RealOpenMM switchValue = 1, switchDeriv = 0; if (useSwitchingFunction && r > switchingDistance) { RealOpenMM t = (r-switchingDistance)/(cutoffDistance-switchingDistance); switchValue = 1+t*t*t*(-10+t*(15-t*6)); switchDeriv = t*t*(-30+t*(60-t*30))/(cutoffDistance-switchingDistance); } // Interactions between two point particles can be computed more easily. if (particles[particle1].isPointParticle && particles[particle2].isPointParticle) { RealOpenMM sig = sigma*rInv; RealOpenMM sig2 = sig*sig; RealOpenMM sig6 = sig2*sig2*sig2; RealOpenMM energy = 4*epsilon*(sig6-1)*sig6; RealVec force = drUnit*(switchValue*4*epsilon*(12*sig6 - 6)*sig6*rInv - energy*switchDeriv); forces[4*particle1] += force[0]; forces[4*particle1+1] += force[1]; forces[4*particle1+2] += force[2]; forces[4*particle2] -= force[0]; forces[4*particle2+1] -= force[1]; forces[4*particle2+2] -= force[2]; return energy*switchValue; } // Compute vectors and matrices we'll be needing. Matrix B12 = B[particle1]+B[particle2]; Matrix G12 = G[particle1]+G[particle2]; Matrix B12inv = B12.inverse(); Matrix G12inv = G12.inverse(); RealOpenMM detG12 = G12.determinant(); // Estimate the distance between the ellipsoids and compute the first terms needed for the energy. RealOpenMM sigma12 = 1/SQRT(0.5*drUnit.dot(G12inv*drUnit)); RealOpenMM h12 = r - sigma12; RealOpenMM rho = sigma/(h12+sigma); RealOpenMM rho2 = rho*rho; RealOpenMM rho6 = rho2*rho2*rho2; RealOpenMM u = 4*epsilon*(rho6*rho6-rho6); RealOpenMM eta = SQRT(2*s[particle1]*s[particle2]/detG12); RealOpenMM chi = 2*drUnit.dot(B12inv*drUnit); chi *= chi; RealOpenMM energy = u*eta*chi; // Compute the terms needed for the force. RealVec kappa = G12inv*dr; RealVec iota = B12inv*dr; RealOpenMM rInv2 = rInv*rInv; RealOpenMM dUSLJdr = 24*epsilon*(2*rho6-1)*rho6*rho/sigma; RealOpenMM temp = 0.5*sigma12*sigma12*sigma12*rInv2; RealVec dudr = (drUnit + (kappa-drUnit*kappa.dot(drUnit))*temp)*dUSLJdr; RealVec dchidr = (iota-drUnit*iota.dot(drUnit))*(-8*rInv2*SQRT(chi)); RealVec force = (dchidr*u + dudr*chi)*(eta*switchValue) - drUnit*(energy*switchDeriv); forces[4*particle1] += force[0]; forces[4*particle1+1] += force[1]; forces[4*particle1+2] += force[2]; forces[4*particle2] -= force[0]; forces[4*particle2+1] -= force[1]; forces[4*particle2+2] -= force[2]; // Compute the terms needed for the torque. for (int j = 0; j < 2; j++) { int particle = (j == 0 ? particle1 : particle2); ParticleInfo& p = particles[particle]; if (p.isPointParticle) continue; RealVec dudq = (kappa*G[particle]).cross(kappa*(temp*dUSLJdr)); RealVec dchidq = (iota*B[particle]).cross(iota)*(-4*rInv2); RealOpenMM (&g12)[3][3] = G12.v; RealOpenMM (&a)[3][3] = A[particle].v; RealVec scale = RealVec(p.rx*p.rx, p.ry*p.ry, p.rz*p.rz)*(-0.5*eta/detG12); Matrix D; RealOpenMM (&d)[3][3] = D.v; d[0][0] = scale[0]*(2*a[0][0]*(g12[1][1]*g12[2][2] - g12[1][2]*g12[2][1]) + a[0][2]*(g12[1][2]*g12[0][1] + g12[1][0]*g12[2][1] - g12[1][1]*(g12[0][2] + g12[2][0])) + a[0][1]*(g12[0][2]*g12[2][1] + g12[2][0]*g12[1][2] - g12[2][2]*(g12[0][1] + g12[1][0]))); d[0][1] = scale[0]*( a[0][0]*(g12[0][2]*g12[2][1] + g12[2][0]*g12[1][2] - g12[2][2]*(g12[0][1] + g12[1][0])) + 2*a[0][1]*(g12[0][0]*g12[2][2] - g12[2][0]*g12[0][2]) + a[0][2]*(g12[1][0]*g12[0][2] + g12[2][0]*g12[0][1] - g12[0][0]*(g12[1][2] + g12[2][1]))); d[0][2] = scale[0]*( a[0][0]*(g12[0][1]*g12[1][2] + g12[1][0]*g12[2][1] - g12[1][1]*(g12[0][2] + g12[2][0])) + a[0][1]*(g12[1][0]*g12[0][2] + g12[2][0]*g12[0][1] - g12[0][0]*(g12[1][2] + g12[2][1])) + 2*a[0][2]*(g12[1][1]*g12[0][0] - g12[1][0]*g12[0][1])); d[1][0] = scale[1]*(2*a[1][0]*(g12[1][1]*g12[2][2] - g12[1][2]*g12[2][1]) + a[1][1]*(g12[0][2]*g12[2][1] + g12[2][0]*g12[1][2] - g12[2][2]*(g12[0][1] + g12[1][0])) + a[1][2]*(g12[1][2]*g12[0][1] + g12[1][0]*g12[2][1] - g12[1][1]*(g12[0][2] + g12[2][0]))); d[1][1] = scale[1]*( a[1][0]*(g12[0][2]*g12[2][1] + g12[2][0]*g12[1][2] - g12[2][2]*(g12[0][1] + g12[1][0])) + 2*a[1][1]*(g12[2][2]*g12[0][0] - g12[2][0]*g12[0][2]) + a[1][2]*(g12[1][0]*g12[0][2] + g12[0][1]*g12[2][0] - g12[0][0]*(g12[1][2] + g12[2][1]))); d[1][2] = scale[1]*( a[1][0]*(g12[0][1]*g12[1][2] + g12[1][0]*g12[2][1] - g12[1][1]*(g12[0][2] + g12[2][0])) + a[1][1]*(g12[1][0]*g12[0][2] + g12[0][1]*g12[2][0] - g12[0][0]*(g12[1][2] + g12[2][1])) + 2*a[1][2]*(g12[1][1]*g12[0][0] - g12[1][0]*g12[0][1])); d[2][0] = scale[2]*(2*a[2][0]*(g12[1][1]*g12[2][2] - g12[2][1]*g12[1][2]) + a[2][1]*(g12[0][2]*g12[2][1] + g12[1][2]*g12[2][0] - g12[2][2]*(g12[0][1] + g12[1][0])) + a[2][2]*(g12[0][1]*g12[1][2] + g12[2][1]*g12[1][0] - g12[1][1]*(g12[0][2] + g12[2][0]))); d[2][1] = scale[2]*( a[2][0]*(g12[0][2]*g12[2][1] + g12[1][2]*g12[2][0] - g12[2][2]*(g12[0][1] + g12[1][0])) + 2*a[2][1]*(g12[0][0]*g12[2][2] - g12[0][2]*g12[2][0]) + a[2][2]*(g12[1][0]*g12[0][2] + g12[0][1]*g12[2][0] - g12[0][0]*(g12[1][2] + g12[2][1]))); d[2][2] = scale[2]*( a[2][0]*(g12[0][1]*g12[1][2] + g12[2][1]*g12[1][0] - g12[1][1]*(g12[0][2] + g12[2][0])) + a[2][1]*(g12[1][0]*g12[0][2] + g12[2][0]*g12[0][1] - g12[0][0]*(g12[1][2] + g12[2][1])) + 2*a[2][2]*(g12[1][1]*g12[0][0] - g12[1][0]*g12[0][1])); RealVec detadq; for (int i = 0; i < 3; i++) detadq += RealVec(a[i][0], a[i][1], a[i][2]).cross(RealVec(d[i][0], d[i][1], d[i][2])); RealVec torque = (dchidq*(u*eta) + detadq*(u*chi) + dudq*(eta*chi))*switchValue; torques[particle] -= torque; } return switchValue*energy; }