/* -------------------------------------------------------------------------- * * OpenMM * * -------------------------------------------------------------------------- * * This is part of the OpenMM molecular simulation toolkit originating from * * Simbios, the NIH National Center for Physics-Based Simulation of * * Biological Structures at Stanford, funded under the NIH Roadmap for * * Medical Research, grant U54 GM072970. See https://simtk.org. * * * * Portions copyright (c) 2008-2025 Stanford University and the Authors. * * Authors: Peter Eastman * * Contributors: * * * * This program is free software: you can redistribute it and/or modify * * it under the terms of the GNU Lesser General Public License as published * * by the Free Software Foundation, either version 3 of the License, or * * (at your option) any later version. * * * * This program is distributed in the hope that it will be useful, * * but WITHOUT ANY WARRANTY; without even the implied warranty of * * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * * GNU Lesser General Public License for more details. * * * * You should have received a copy of the GNU Lesser General Public License * * along with this program. If not, see <http://www.gnu.org/licenses/>. 
* * -------------------------------------------------------------------------- */ #include "OpenCLContext.h" #include "OpenCLPlatform.h" #include "OpenCLKernelFactory.h" #include "OpenCLKernels.h" #include "openmm/Context.h" #include "openmm/System.h" #include "openmm/internal/ContextImpl.h" #include "openmm/internal/hardware.h" #include #include #include #ifdef __APPLE__ #include "sys/sysctl.h" #endif using namespace OpenMM; using namespace std; #ifdef OPENMM_COMMON_BUILDING_STATIC_LIBRARY extern "C" void registerOpenCLPlatform() { if (OpenCLPlatform::isPlatformSupported()) Platform::registerPlatform(new OpenCLPlatform()); } #else extern "C" OPENMM_EXPORT_COMMON void registerPlatforms() { if (OpenCLPlatform::isPlatformSupported()) Platform::registerPlatform(new OpenCLPlatform()); } #endif OpenCLPlatform::OpenCLPlatform() { deprecatedPropertyReplacements["OpenCLDeviceIndex"] = OpenCLDeviceIndex(); deprecatedPropertyReplacements["OpenCLDeviceName"] = OpenCLDeviceName(); deprecatedPropertyReplacements["OpenCLPrecision"] = OpenCLPrecision(); deprecatedPropertyReplacements["OpenCLUseCpuPme"] = OpenCLUseCpuPme(); deprecatedPropertyReplacements["OpenCLDisablePmeStream"] = OpenCLDisablePmeStream(); OpenCLKernelFactory* factory = new OpenCLKernelFactory(); registerKernelFactory(CalcForcesAndEnergyKernel::Name(), factory); registerKernelFactory(UpdateStateDataKernel::Name(), factory); registerKernelFactory(ApplyConstraintsKernel::Name(), factory); registerKernelFactory(VirtualSitesKernel::Name(), factory); registerKernelFactory(CalcHarmonicBondForceKernel::Name(), factory); registerKernelFactory(CalcCustomBondForceKernel::Name(), factory); registerKernelFactory(CalcHarmonicAngleForceKernel::Name(), factory); registerKernelFactory(CalcCustomAngleForceKernel::Name(), factory); registerKernelFactory(CalcPeriodicTorsionForceKernel::Name(), factory); registerKernelFactory(CalcRBTorsionForceKernel::Name(), factory); registerKernelFactory(CalcCMAPTorsionForceKernel::Name(), 
factory); registerKernelFactory(CalcCustomTorsionForceKernel::Name(), factory); registerKernelFactory(CalcNonbondedForceKernel::Name(), factory); registerKernelFactory(CalcConstantPotentialForceKernel::Name(), factory); registerKernelFactory(CalcCustomNonbondedForceKernel::Name(), factory); registerKernelFactory(CalcGBSAOBCForceKernel::Name(), factory); registerKernelFactory(CalcCustomGBForceKernel::Name(), factory); registerKernelFactory(CalcCustomExternalForceKernel::Name(), factory); registerKernelFactory(CalcCustomHbondForceKernel::Name(), factory); registerKernelFactory(CalcCustomCentroidBondForceKernel::Name(), factory); registerKernelFactory(CalcCustomCompoundBondForceKernel::Name(), factory); registerKernelFactory(CalcCustomCPPForceKernel::Name(), factory); registerKernelFactory(CalcCustomCVForceKernel::Name(), factory); registerKernelFactory(CalcATMForceKernel::Name(), factory); registerKernelFactory(CalcOrientationRestraintForceKernel::Name(), factory); registerKernelFactory(CalcRGForceKernel::Name(), factory); registerKernelFactory(CalcRMSDForceKernel::Name(), factory); registerKernelFactory(CalcCustomManyParticleForceKernel::Name(), factory); registerKernelFactory(CalcGayBerneForceKernel::Name(), factory); registerKernelFactory(IntegrateVerletStepKernel::Name(), factory); registerKernelFactory(IntegrateNoseHooverStepKernel::Name(), factory); registerKernelFactory(IntegrateLangevinMiddleStepKernel::Name(), factory); registerKernelFactory(IntegrateBrownianStepKernel::Name(), factory); registerKernelFactory(IntegrateVariableVerletStepKernel::Name(), factory); registerKernelFactory(IntegrateVariableLangevinStepKernel::Name(), factory); registerKernelFactory(IntegrateCustomStepKernel::Name(), factory); registerKernelFactory(IntegrateDPDStepKernel::Name(), factory); registerKernelFactory(IntegrateQTBStepKernel::Name(), factory); registerKernelFactory(ApplyAndersenThermostatKernel::Name(), factory); registerKernelFactory(ApplyMonteCarloBarostatKernel::Name(), 
factory); registerKernelFactory(RemoveCMMotionKernel::Name(), factory); platformProperties.push_back(OpenCLDeviceIndex()); platformProperties.push_back(OpenCLDeviceName()); platformProperties.push_back(OpenCLPlatformIndex()); platformProperties.push_back(OpenCLPlatformName()); platformProperties.push_back(OpenCLPrecision()); platformProperties.push_back(OpenCLUseCpuPme()); platformProperties.push_back(OpenCLDisablePmeStream()); setPropertyDefaultValue(OpenCLDeviceIndex(), ""); setPropertyDefaultValue(OpenCLDeviceName(), ""); setPropertyDefaultValue(OpenCLPlatformIndex(), ""); setPropertyDefaultValue(OpenCLPlatformName(), ""); setPropertyDefaultValue(OpenCLPrecision(), "single"); setPropertyDefaultValue(OpenCLUseCpuPme(), "false"); setPropertyDefaultValue(OpenCLDisablePmeStream(), "false"); } double OpenCLPlatform::getSpeed() const { return 50; } bool OpenCLPlatform::supportsDoublePrecision() const { return true; } bool OpenCLPlatform::isPlatformSupported() { // Return false for OpenCL implementations that are known // to be buggy (Apple OS X prior to 10.10). #ifdef __APPLE__ char str[256]; size_t size = sizeof(str); int ret = sysctlbyname("kern.osrelease", str, &size, NULL, 0); if (ret != 0) return false; int major, minor, micro; if (sscanf(str, "%d.%d.%d", &major, &minor, µ) != 3) return false; if (major < 14 || (major == 14 && minor < 3)) // 14.3.0 is the darwin release corresponding to OS X 10.10.3. Versions prior to that // contained a number of serious bugs in the Apple OpenCL libraries. // (See https://github.com/openmm/openmm/issues/395 for example.) return false; #endif // Make sure at least one OpenCL implementation is installed. std::vector platforms; try { cl::Platform::get(&platforms); if (platforms.size() == 0) return false; } catch (...) 
{ return false; } return true; } const string& OpenCLPlatform::getPropertyValue(const Context& context, const string& property) const { const ContextImpl& impl = getContextImpl(context); const PlatformData* data = reinterpret_cast(impl.getPlatformData()); string propertyName = property; if (deprecatedPropertyReplacements.find(property) != deprecatedPropertyReplacements.end()) propertyName = deprecatedPropertyReplacements.find(property)->second; map::const_iterator value = data->propertyValues.find(propertyName); if (value != data->propertyValues.end()) return value->second; return Platform::getPropertyValue(context, property); } void OpenCLPlatform::setPropertyValue(Context& context, const string& property, const string& value) const { } void OpenCLPlatform::contextCreated(ContextImpl& context, const map& properties) const { const string& platformPropValue = (properties.find(OpenCLPlatformIndex()) == properties.end() ? getPropertyDefaultValue(OpenCLPlatformIndex()) : properties.find(OpenCLPlatformIndex())->second); const string& devicePropValue = (properties.find(OpenCLDeviceIndex()) == properties.end() ? getPropertyDefaultValue(OpenCLDeviceIndex()) : properties.find(OpenCLDeviceIndex())->second); string precisionPropValue = (properties.find(OpenCLPrecision()) == properties.end() ? getPropertyDefaultValue(OpenCLPrecision()) : properties.find(OpenCLPrecision())->second); string cpuPmePropValue = (properties.find(OpenCLUseCpuPme()) == properties.end() ? getPropertyDefaultValue(OpenCLUseCpuPme()) : properties.find(OpenCLUseCpuPme())->second); string pmeStreamPropValue = (properties.find(OpenCLDisablePmeStream()) == properties.end() ? 
getPropertyDefaultValue(OpenCLDisablePmeStream()) : properties.find(OpenCLDisablePmeStream())->second); transform(precisionPropValue.begin(), precisionPropValue.end(), precisionPropValue.begin(), ::tolower); transform(cpuPmePropValue.begin(), cpuPmePropValue.end(), cpuPmePropValue.begin(), ::tolower); transform(pmeStreamPropValue.begin(), pmeStreamPropValue.end(), pmeStreamPropValue.begin(), ::tolower); vector pmeKernelName; pmeKernelName.push_back(CalcPmeReciprocalForceKernel::Name()); if (!supportsKernels(pmeKernelName)) cpuPmePropValue = "false"; int threads = getNumProcessors(); char* threadsEnv = getenv("OPENMM_CPU_THREADS"); if (threadsEnv != NULL) stringstream(threadsEnv) >> threads; context.setPlatformData(new PlatformData(context.getSystem(), &context, platformPropValue, devicePropValue, precisionPropValue, cpuPmePropValue, pmeStreamPropValue, threads, NULL)); } void OpenCLPlatform::linkedContextCreated(ContextImpl& context, ContextImpl& originalContext) const { Platform& platform = originalContext.getPlatform(); string platformPropValue = platform.getPropertyValue(originalContext.getOwner(), OpenCLPlatformIndex()); string devicePropValue = platform.getPropertyValue(originalContext.getOwner(), OpenCLDeviceIndex()); string precisionPropValue = platform.getPropertyValue(originalContext.getOwner(), OpenCLPrecision()); string cpuPmePropValue = platform.getPropertyValue(originalContext.getOwner(), OpenCLUseCpuPme()); string pmeStreamPropValue = platform.getPropertyValue(originalContext.getOwner(), OpenCLDisablePmeStream()); int threads = reinterpret_cast(originalContext.getPlatformData())->threads.getNumThreads(); context.setPlatformData(new PlatformData(context.getSystem(), &context, platformPropValue, devicePropValue, precisionPropValue, cpuPmePropValue, pmeStreamPropValue, threads, &originalContext)); } void OpenCLPlatform::contextDestroyed(ContextImpl& context) const { PlatformData* data = reinterpret_cast(context.getPlatformData()); delete data; } 
OpenCLPlatform::PlatformData::PlatformData(const System& system, ContextImpl* context, const string& platformPropValue, const string& deviceIndexProperty, const string& precisionProperty, const string& cpuPmeProperty, const string& pmeStreamProperty, int numThreads, ContextImpl* originalContext) : context(context), removeCM(false), stepCount(0), computeForceCount(0), time(0.0), hasInitializedContexts(false), threads(numThreads) { int platformIndex = -1; if (platformPropValue.length() > 0) stringstream(platformPropValue) >> platformIndex; vector devices; size_t searchPos = 0, nextPos; while ((nextPos = deviceIndexProperty.find_first_of(", ", searchPos)) != string::npos) { devices.push_back(deviceIndexProperty.substr(searchPos, nextPos-searchPos)); searchPos = nextPos+1; } devices.push_back(deviceIndexProperty.substr(searchPos)); PlatformData* originalData = NULL; if (originalContext != NULL) originalData = reinterpret_cast(originalContext->getPlatformData()); try { for (int i = 0; i < (int) devices.size(); i++) { if (devices[i].length() > 0) { int deviceIndex; stringstream(devices[i]) >> deviceIndex; contexts.push_back(new OpenCLContext(system, platformIndex, deviceIndex, precisionProperty, *this, (originalData == NULL ? NULL : originalData->contexts[i]))); } } if (contexts.size() == 0) contexts.push_back(new OpenCLContext(system, platformIndex, -1, precisionProperty, *this, (originalData == NULL ? NULL : originalData->contexts[0]))); } catch (...) { // If an exception was thrown, do our best to clean up memory. 
for (int i = 0; i < (int) contexts.size(); i++) delete contexts[i]; throw; } stringstream deviceIndex, deviceName; for (int i = 0; i < (int) contexts.size(); i++) { if (i > 0) { deviceIndex << ','; deviceName << ','; } deviceIndex << contexts[i]->getDeviceIndex(); deviceName << contexts[i]->getDevice().getInfo(); } platformIndex = contexts[0]->getPlatformIndex(); useCpuPme = (cpuPmeProperty == "true" && !contexts[0]->getUseDoublePrecision()); disablePmeStream = (pmeStreamProperty == "true"); propertyValues[OpenCLPlatform::OpenCLDeviceIndex()] = deviceIndex.str(); propertyValues[OpenCLPlatform::OpenCLDeviceName()] = deviceName.str(); propertyValues[OpenCLPlatform::OpenCLPlatformIndex()] = contexts[0]->intToString(platformIndex); std::vector platforms; cl::Platform::get(&platforms); propertyValues[OpenCLPlatform::OpenCLPlatformName()] = platforms[platformIndex].getInfo(); propertyValues[OpenCLPlatform::OpenCLPrecision()] = precisionProperty; propertyValues[OpenCLPlatform::OpenCLUseCpuPme()] = useCpuPme ? "true" : "false"; propertyValues[OpenCLPlatform::OpenCLDisablePmeStream()] = disablePmeStream ? "true" : "false"; contextEnergy.resize(contexts.size()); } OpenCLPlatform::PlatformData::~PlatformData() { for (int i = 0; i < (int) contexts.size(); i++) delete contexts[i]; } void OpenCLPlatform::PlatformData::initializeContexts(const System& system) { if (hasInitializedContexts) return; for (int i = 0; i < (int) contexts.size(); i++) contexts[i]->initialize(); hasInitializedContexts = true; } void OpenCLPlatform::PlatformData::syncContexts() { for (int i = 0; i < (int) contexts.size(); i++) contexts[i]->getWorkThread().flush(); }