#ifndef OPENMM_CPU_PME_KERNELS_H_ #define OPENMM_CPU_PME_KERNELS_H_ /* -------------------------------------------------------------------------- * * OpenMM * * -------------------------------------------------------------------------- * * This is part of the OpenMM molecular simulation toolkit originating from * * Simbios, the NIH National Center for Physics-Based Simulation of * * Biological Structures at Stanford, funded under the NIH Roadmap for * * Medical Research, grant U54 GM072970. See https://simtk.org. * * * * Portions copyright (c) 2013-2025 Stanford University and the Authors. * * Authors: Peter Eastman * * Contributors: Evan Pretti * * * * Permission is hereby granted, free of charge, to any person obtaining a * * copy of this software and associated documentation files (the "Software"), * * to deal in the Software without restriction, including without limitation * * the rights to use, copy, modify, merge, publish, distribute, sublicense, * * and/or sell copies of the Software, and to permit persons to whom the * * Software is furnished to do so, subject to the following conditions: * * * * The above copyright notice and this permission notice shall be included in * * all copies or substantial portions of the Software. * * * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * * THE AUTHORS, CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, * * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR * * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE * * USE OR OTHER DEALINGS IN THE SOFTWARE. * * -------------------------------------------------------------------------- */ #define NOMINMAX #include "internal/windowsExportPme.h" #include "openmm/kernels.h" #include "openmm/Vec3.h" #include "openmm/internal/ThreadPool.h" #include #include #include #include #include #include namespace OpenMM { /** * This is an optimized CPU implementation of CalcPmeReciprocalForceKernel. It is both * vectorized (requiring SSE 4.1) and multithreaded. It uses PocketFFT to perform the FFTs. */ class OPENMM_EXPORT_PME CpuCalcPmeReciprocalForceKernel : public CalcPmeReciprocalForceKernel { public: CpuCalcPmeReciprocalForceKernel(const std::string& name, const Platform& platform) : CalcPmeReciprocalForceKernel(name, platform), isDeleted(false) { } /** * Initialize the kernel. * * @param gridx the x size of the PME grid * @param gridy the y size of the PME grid * @param gridz the z size of the PME grid * @param numParticles the number of particles in the system * @param indices indices of particles to compute charge derivatives for * @param alpha the Ewald blending parameter * @param deterministic whether it should attempt to make the resulting forces deterministic */ void initialize(int xsize, int ysize, int zsize, int numParticles, const std::vector& indices, double alpha, bool deterministic); ~CpuCalcPmeReciprocalForceKernel(); /** * Begin computing the force and energy. * * @param io an object that coordinates data transfer * @param periodicBoxVectors the vectors defining the periodic box (measured in nm) * @param includeEnergy true if potential energy should be computed * @param includeForces true if forces should be computed * @param includeChargeDerivatives true if charge derivatives should be computed */ void beginComputation(IO& io, const Vec3* periodicBoxVectors, bool includeEnergy, bool includeForces, bool includeChargeDerivatives); /** * Finish computing the force and energy. * * @param io an object that coordinates data transfer * @return the potential energy due to the PME reciprocal space interactions */ double finishComputation(IO& io); /** * This routine contains the code executed by the main thread. */ void runMainThread(); /** * This routine contains the code executed by each worker thread. */ void runWorkerThread(ThreadPool& threads, int index); /** * Get whether the current CPU supports all features needed by this kernel. */ static bool isProcessorSupported(); /** * Get the parameters being used for PME. * * @param alpha the separation parameter * @param nx the number of grid points along the X axis * @param ny the number of grid points along the Y axis * @param nz the number of grid points along the Z axis */ void getPMEParameters(double& alpha, int& nx, int& ny, int& nz) const; private: /** * Select a size for one grid dimension that PocketFFT can handle efficiently. */ int findFFTDimension(int minimum); static bool hasInitializedThreads; static int numThreads; int gridx, gridy, gridz, numParticles, numIndices; double alpha; bool deterministic; bool isFinished, isDeleted; std::vector chargeIndices; std::vector force; std::vector chargeDerivatives; std::vector bsplineModuli[3]; std::vector recipEterm; Vec3 lastBoxVectors[3]; std::vector threadEnergy; std::vector > realGrids; std::vector > complexGrid; std::vector gridShape, fftAxes; std::vector realGridStride, complexGridStride; int waitCount; std::condition_variable startCondition, endCondition; std::mutex lock; std::thread mainThread; // The following variables are used to store information about the calculation currently being performed. IO* io; float energy; float* posq; Vec3 periodicBoxVectors[3], recipBoxVectors[3]; bool includeEnergy, includeForces, includeChargeDerivatives; std::atomic atomicCounter; }; /** * This is an optimized CPU implementation of CalcDispersionPmeReciprocalForceKernel. It is both * vectorized (requiring SSE 4.1) and multithreaded. It uses PocketFFT to perform the FFTs. */ class OPENMM_EXPORT_PME CpuCalcDispersionPmeReciprocalForceKernel : public CalcDispersionPmeReciprocalForceKernel { public: CpuCalcDispersionPmeReciprocalForceKernel(const std::string& name, const Platform& platform) : CalcDispersionPmeReciprocalForceKernel(name, platform), isDeleted(false) { } /** * Initialize the kernel. * * @param gridx the x size of the PME grid * @param gridy the y size of the PME grid * @param gridz the z size of the PME grid * @param numParticles the number of particles in the system * @param alpha the Ewald blending parameter * @param deterministic whether it should attempt to make the resulting forces deterministic */ void initialize(int xsize, int ysize, int zsize, int numParticles, double alpha, bool deterministic); ~CpuCalcDispersionPmeReciprocalForceKernel(); /** * Begin computing the force and energy. * * @param io an object that coordinates data transfer * @param periodicBoxVectors the vectors defining the periodic box (measured in nm) * @param includeEnergy true if potential energy should be computed */ void beginComputation(CalcPmeReciprocalForceKernel::IO& io, const Vec3* periodicBoxVectors, bool includeEnergy); /** * Finish computing the force and energy. * * @param io an object that coordinates data transfer * @return the potential energy due to the PME reciprocal space interactions */ double finishComputation(CalcPmeReciprocalForceKernel::IO& io); /** * This routine contains the code executed by the main thread. */ void runMainThread(); /** * This routine contains the code executed by each worker thread. */ void runWorkerThread(ThreadPool& threads, int index); /** * Get whether the current CPU supports all features needed by this kernel. */ static bool isProcessorSupported(); /** * Get the parameters being used for PME. * * @param alpha the separation parameter * @param nx the number of grid points along the X axis * @param ny the number of grid points along the Y axis * @param nz the number of grid points along the Z axis */ void getPMEParameters(double& alpha, int& nx, int& ny, int& nz) const; private: class ComputeTask; /** * Select a size for one grid dimension that PocketFFT can handle efficiently. */ int findFFTDimension(int minimum); static bool hasInitializedThreads; static int numThreads; int gridx, gridy, gridz, numParticles; double alpha; bool deterministic; bool isFinished, isDeleted; std::vector force; std::vector bsplineModuli[3]; std::vector recipEterm; Vec3 lastBoxVectors[3]; std::vector threadEnergy; std::vector > realGrids; std::vector > complexGrid; std::vector gridShape, fftAxes; std::vector realGridStride, complexGridStride; int waitCount; std::condition_variable startCondition, endCondition; std::mutex lock; std::thread mainThread; // The following variables are used to store information about the calculation currently being performed. CalcPmeReciprocalForceKernel::IO* io; float energy; float* posq; Vec3 periodicBoxVectors[3], recipBoxVectors[3]; bool includeEnergy; std::atomic atomicCounter; }; } // namespace OpenMM #endif /*OPENMM_CPU_PME_KERNELS_H_*/