/* -------------------------------------------------------------------------- * * OpenMM * * -------------------------------------------------------------------------- * * This is part of the OpenMM molecular simulation toolkit originating from * * Simbios, the NIH National Center for Physics-Based Simulation of * * Biological Structures at Stanford, funded under the NIH Roadmap for * * Medical Research, grant U54 GM072970. See https://simtk.org. * * * * Portions copyright (c) 2009 Stanford University and the Authors. * * Authors: Scott Le Grand, Peter Eastman * * Contributors: * * * * This program is free software: you can redistribute it and/or modify * * it under the terms of the GNU Lesser General Public License as published * * by the Free Software Foundation, either version 3 of the License, or * * (at your option) any later version. * * * * This program is distributed in the hope that it will be useful, * * but WITHOUT ANY WARRANTY; without even the implied warranty of * * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * * GNU Lesser General Public License for more details. * * * * You should have received a copy of the GNU Lesser General Public License * * along with this program. If not, see . * * -------------------------------------------------------------------------- */ /** * This file contains the kernel for evalauating nonbonded forces * using the Ewald summation method. */ #include /* Define complex multiply operations */ __device__ cuComplex ComplexMul(cuComplex a, cuComplex b) { cuComplex c; c.x = a.x * b.x - a.y * b.y; c.y = a.x * b.y + a.y * b.x; return c; } __device__ cuComplex ComplexConjMul(cuComplex a, cuComplex b) { cuComplex c; c.x = a.x*b.x + a.y*b.y; c.y = a.y*b.x - a.x*b.y; return c; } __device__ cuComplex FloatComplexMul(float r, cuComplex a) { cuComplex b; b.x = r*a.x; b.y = r*a.y; return b; } /* This kernel is under development */ __global__ void kCalculateCDLJEwaldForces_kernel(unsigned int* workUnit, int numWorkUnits) { // ******************************************************************* float alphaEwald = 3.123413f; float factorEwald = -1.0 / (4*alphaEwald*alphaEwald); float PI = 3.14159265358979323846f; float SQRT_PI = sqrt(PI); float TWO_PI = 2.0f * PI; float epsilon = 1.0f; /////############################################################################## float recipCoeff = 4.0*PI/(cSim.periodicBoxSizeX * cSim.periodicBoxSizeY * cSim.periodicBoxSizeZ) /epsilon; // setup reciprocal box float recipBoxSizeX = TWO_PI / cSim.periodicBoxSizeX; float recipBoxSizeY = TWO_PI / cSim.periodicBoxSizeY; float recipBoxSizeZ = TWO_PI / cSim.periodicBoxSizeZ; // setup K-vectors unsigned int numRx = 60+1; unsigned int numRy = 60+1; unsigned int numRz = 60+1; const int kmax = 61; unsigned int pos = threadIdx.x + blockIdx.x * blockDim.x; cuComplex eir[kmax][cSim.atoms][3]; cuComplex tab_xy[cSim.atoms]; cuComplex tab_qxyz[cSim.atoms]; while (pos < cSim.atoms) { float4 apos = cSim.pPosq[pos]; for(unsigned int m = 0; (m < 3); m++) { eir[0][pos][m].x = 1; eir[0][pos][m].y = 0; } eir[1][pos][0].x = cos(apos.x*recipBoxSizeX); eir[1][pos][0].y = sin(apos.x*recipBoxSizeX); eir[1][pos][1].x = cos(apos.y*recipBoxSizeY); eir[1][pos][1].y = sin(apos.y*recipBoxSizeY); eir[1][pos][2].x = cos(apos.z*recipBoxSizeZ); eir[1][pos][2].y = sin(apos.z*recipBoxSizeZ); for(unsigned int j=2; (j= 0) { while (pos < cSim.atoms) { tab_xy[pos] = ComplexMul (eir[rx][pos][0] , eir[ry][pos][1]); pos += blockDim.x * gridDim.x; } } else { while (pos < cSim.atoms) { tab_xy[pos]= ComplexConjMul (eir[rx][pos][0] , (eir[-ry][pos][1])); pos += blockDim.x * gridDim.x; } } for (int rz = lowrz; rz < numRz; rz++) { float kz = rz * recipBoxSizeZ; float k2 = kx * kx + ky * ky + kz * kz; float ak = exp(k2*factorEwald) / k2; float akv = 2.0 * ak * (1.0/k2 - factorEwald); if( rz >= 0) { while (pos < cSim.atoms) { float4 apos = cSim.pPosq[pos]; apos.w *= cSim.epsfac; tab_qxyz[pos] = FloatComplexMul ( apos.w * ComplexMul (tab_xy[pos] , eir[rz][pos][2])); pos += blockDim.x * gridDim.x; } } else { while (pos < cSim.atoms) { float4 apos = cSim.pPosq[pos]; apos.w *= cSim.epsfac; tab_qxyz[pos] = FloatComplexMul( apos.w * ComplexConjMul (tab_xy[pos] , conj(eir[-rz][pos][2])) ); pos += blockDim.x * gridDim.x; } } float cs = 0.0f; float ss = 0.0f; while (pos < cSim.atoms) { cs += tab_qxyz[pos].x; ss += tab_qxyz[pos].y; pos += blockDim.x * gridDim.x; } recipEnergy += ak * ( cs * cs + ss * ss); float vir = akv * ( cs * cs + ss * ss); while (pos < cSim.atoms) { float4 force = cSim.pForce4[pos]; float dEdR = ak * (cs * tab_qxyz[pos].y - ss * tab_qxyz[pos].x); force.x += 2.0 * recipCoeff * dEdR * kx ; force.y += 2.0 * recipCoeff * dEdR * ky ; force.z += 2.0 * recipCoeff * dEdR * kz ; } lowrz = 1 - numRz; } lowry = 1 - numRy; } } //########################################################################### //########################################################################### // END EWALD RECIP SPACE //########################################################################### }