#ifndef OPENMM_CPU_PME_KERNELS_H_
#define OPENMM_CPU_PME_KERNELS_H_

/* -------------------------------------------------------------------------- *
 *                                   OpenMM                                   *
 * -------------------------------------------------------------------------- *
 * This is part of the OpenMM molecular simulation toolkit originating from   *
 * Simbios, the NIH National Center for Physics-Based Simulation of           *
 * Biological Structures at Stanford, funded under the NIH Roadmap for        *
 * Medical Research, grant U54 GM072970. See https://simtk.org.               *
 *                                                                            *
 * Portions copyright (c) 2013 Stanford University and the Authors.           *
 * Authors: Peter Eastman                                                     *
 * Contributors:                                                              *
 *                                                                            *
 * Permission is hereby granted, free of charge, to any person obtaining a    *
 * copy of this software and associated documentation files (the "Software"), *
 * to deal in the Software without restriction, including without limitation  *
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,   *
 * and/or sell copies of the Software, and to permit persons to whom the      *
 * Software is furnished to do so, subject to the following conditions:       *
 *                                                                            *
 * The above copyright notice and this permission notice shall be included in *
 * all copies or substantial portions of the Software.                        *
 *                                                                            *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR *
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,   *
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL    *
 * THE AUTHORS, CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,    *
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR      *
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE  *
 * USE OR OTHER DEALINGS IN THE SOFTWARE.                                     *
 * -------------------------------------------------------------------------- */

#include "internal/windowsExportPme.h"
#include "openmm/kernels.h"
#include "openmm/Vec3.h"
#include <fftw3.h>
#include <pthread.h>
#include <vector>

namespace OpenMM {

/**
45
46
 * This is an optimized CPU implementation of CalcPmeReciprocalForceKernel.  It is both
 * vectorized (requiring SSE 4.1) and multithreaded.  It uses FFTW to perform the FFTs.
peastman's avatar
peastman committed
47
48
 */

49
class OPENMM_EXPORT_PME CpuCalcPmeReciprocalForceKernel : public CalcPmeReciprocalForceKernel {
peastman's avatar
peastman committed
50
public:
51
    class ThreadData;
52
53
54
    CpuCalcPmeReciprocalForceKernel(std::string name, const Platform& platform) : CalcPmeReciprocalForceKernel(name, platform),
            hasCreatedPlan(false), isDeleted(false), realGrid(NULL), complexGrid(NULL) {
    }
55
56
57
58
59
60
61
62
63
64
    /**
     * Initialize the kernel.
     * 
     * @param gridx        the x size of the PME grid
     * @param gridy        the y size of the PME grid
     * @param gridz        the z size of the PME grid
     * @param numParticles the number of particles in the system
     * @param alpha        the Ewald blending parameter
     */
    void initialize(int xsize, int ysize, int zsize, int numParticles, double alpha);
65
    ~CpuCalcPmeReciprocalForceKernel();
66
67
68
69
70
71
72
    /**
     * Begin computing the force and energy.
     * 
     * @param io               an object that coordinates data transfer
     * @param periodicBoxSize  the size of the periodic box (measured in nm)
     * @param includeEnergy    true if potential energy should be computed
     */
73
    void beginComputation(IO& io, Vec3 periodicBoxSize, bool includeEnergy);
74
75
76
77
78
79
    /**
     * Finish computing the force and energy.
     * 
     * @param io   an object that coordinates data transfer
     * @return the potential energy due to the PME reciprocal space interactions
     */
80
    double finishComputation(IO& io);
81
82
83
    /**
     * This routine contains the code executed by each thread.
     */
84
    void runThread(int index);
85
86
87
    /**
     * Get whether the current CPU supports all features needed by this kernel.
     */
88
    static bool isProcessorSupported();
peastman's avatar
peastman committed
89
private:
90
91
92
    /**
     * This is called by the worker threads to wait until the master thread instructs them to advance.
     */
93
    void threadWait();
94
95
96
    /**
     * This is called by the master thread to instruct all the worker threads to advance.
     */
97
    void advanceThreads();
98
99
100
101
    /**
     * Select a size for one grid dimension that FFTW can handle efficiently.
     */
    int findFFTDimension(int minimum);
102
103
    static bool hasInitializedThreads;
    static int numThreads;
peastman's avatar
peastman committed
104
105
    int gridx, gridy, gridz, numParticles;
    double alpha;
106
107
    bool hasCreatedPlan, isFinished, isDeleted;
    std::vector<float> force;
108
    std::vector<float> bsplineModuli[3];
109
110
    std::vector<float> recipEterm;
    Vec3 lastBoxSize;
111
112
113
    float* realGrid;
    fftwf_complex* complexGrid;
    fftwf_plan forwardFFT, backwardFFT;
114
115
    int waitCount;
    pthread_cond_t startCondition, endCondition;
116
    pthread_cond_t mainThreadStartCondition, mainThreadEndCondition;
117
    pthread_mutex_t lock;
118
    pthread_t mainThread;
peastman's avatar
peastman committed
119
    std::vector<pthread_t> thread;
120
121
    std::vector<ThreadData*> threadData;
    // The following variables are used to store information about the calculation currently being performed.
122
    IO* io;
123
124
125
126
    float energy;
    float* posq;
    Vec3 periodicBoxSize;
    bool includeEnergy;
peastman's avatar
peastman committed
127
128
129
130
};

} // namespace OpenMM

#endif /*OPENMM_CPU_PME_KERNELS_H_*/