OpenCLExpressionUtilities.cpp 18.3 KB
Newer Older
1
2
3
4
5
6
7
8
/* -------------------------------------------------------------------------- *
 *                                   OpenMM                                   *
 * -------------------------------------------------------------------------- *
 * This is part of the OpenMM molecular simulation toolkit originating from   *
 * Simbios, the NIH National Center for Physics-Based Simulation of           *
 * Biological Structures at Stanford, funded under the NIH Roadmap for        *
 * Medical Research, grant U54 GM072970. See https://simtk.org.               *
 *                                                                            *
 * Portions copyright (c) 2009-2011 Stanford University and the Authors.      *
 * Authors: Peter Eastman                                                     *
 * Contributors:                                                              *
 *                                                                            *
 * This program is free software: you can redistribute it and/or modify       *
 * it under the terms of the GNU Lesser General Public License as published   *
 * by the Free Software Foundation, either version 3 of the License, or       *
 * (at your option) any later version.                                        *
 *                                                                            *
 * This program is distributed in the hope that it will be useful,            *
 * but WITHOUT ANY WARRANTY; without even the implied warranty of             *
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the              *
 * GNU Lesser General Public License for more details.                        *
 *                                                                            *
 * You should have received a copy of the GNU Lesser General Public License   *
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.      *
 * -------------------------------------------------------------------------- */

#include "OpenCLExpressionUtilities.h"
#include "openmm/OpenMMException.h"
29
#include "openmm/internal/SplineFitter.h"
30
31
32
33
34
35
#include "lepton/Operation.h"

using namespace OpenMM;
using namespace Lepton;
using namespace std;

36
/**
 * Generate source code for evaluating a set of expressions, with the available variables
 * given by name.
 *
 * Each entry of "variables" maps a variable name to the text that is written into the
 * generated code wherever that variable is referenced.  The names are wrapped in Variable
 * nodes and the work is forwarded to the overload that takes expression tree nodes.
 *
 * @return the generated source code
 */
string OpenCLExpressionUtilities::createExpressions(const map<string, ParsedExpression>& expressions, const map<string, string>& variables,
        const vector<pair<string, string> >& functions, const string& prefix, const string& functionParams, const string& tempType) {
    vector<pair<ExpressionTreeNode, string> > nodesForVariables;
    map<string, string>::const_iterator entry = variables.begin();
    while (entry != variables.end()) {
        // The tree node takes the newly allocated Variable operation.
        nodesForVariables.push_back(make_pair(ExpressionTreeNode(new Operation::Variable(entry->first)), entry->second));
        ++entry;
    }
    return createExpressions(expressions, nodesForVariables, functions, prefix, functionParams, tempType);
}

/**
 * Generate source code for evaluating a set of expressions, with the available variables
 * given as expression tree nodes.
 *
 * For every entry of "expressions" the statements needed to evaluate it are emitted,
 * followed by one line consisting of the entry's key, the name of the temporary holding
 * the result, and ";".  Temporaries are shared between expressions, so a subexpression
 * that appears more than once is only computed once.
 *
 * @return the generated source code
 */
string OpenCLExpressionUtilities::createExpressions(const map<string, ParsedExpression>& expressions, const vector<pair<ExpressionTreeNode, string> >& variables,
        const vector<pair<string, string> >& functions, const string& prefix, const string& functionParams, const string& tempType) {
    typedef map<string, ParsedExpression>::const_iterator ExpressionIterator;

    // processExpression() needs to see every expression so it can spot related
    // subexpressions (tabulated function value/derivative pairs, integer powers).
    vector<ParsedExpression> everyExpression;
    for (ExpressionIterator it = expressions.begin(); it != expressions.end(); ++it)
        everyExpression.push_back(it->second);

    // The supplied variables act as the initial set of already-known values.
    vector<pair<ExpressionTreeNode, string> > knownTemps(variables);
    stringstream code;
    for (ExpressionIterator it = expressions.begin(); it != expressions.end(); ++it) {
        processExpression(code, it->second.getRootNode(), knownTemps, functions, prefix, functionParams, everyExpression, tempType);
        code << it->first << getTempName(it->second.getRootNode(), knownTemps) << ";\n";
    }
    return code.str();
}

58
void OpenCLExpressionUtilities::processExpression(stringstream& out, const ExpressionTreeNode& node, vector<pair<ExpressionTreeNode, string> >& temps,
59
        const vector<pair<string, string> >& functions, const string& prefix, const string& functionParams, const vector<ParsedExpression>& allExpressions, const string& tempType) {
60
61
62
63
    for (int i = 0; i < (int) temps.size(); i++)
        if (temps[i].first == node)
            return;
    for (int i = 0; i < (int) node.getChildren().size(); i++)
64
        processExpression(out, node.getChildren()[i], temps, functions, prefix, functionParams, allExpressions, tempType);
65
    string name = prefix+context.intToString(temps.size());
66
    bool hasRecordedNode = false;
67
    
68
    out << tempType << " " << name << " = ";
69
70
    switch (node.getOperation().getId()) {
        case Operation::CONSTANT:
71
            out << context.doubleToString(dynamic_cast<const Operation::Constant*>(&node.getOperation())->getValue());
72
            break;
73
        case Operation::VARIABLE:
74
            throw OpenMMException("Unknown variable in expression: "+node.getOperation().getName());
75
76
77
78
79
80
81
        case Operation::CUSTOM:
        {
            int i;
            for (i = 0; i < (int) functions.size() && functions[i].first != node.getOperation().getName(); i++)
                ;
            if (i == functions.size())
                throw OpenMMException("Unknown function in expression: "+node.getOperation().getName());
82
            bool isDeriv = (dynamic_cast<const Operation::Custom*>(&node.getOperation())->getDerivOrder()[0] == 1);
83
            out << "0.0f;\n";
84
85
86
87
88
89
90
91
92
93
94
95
96
            temps.push_back(make_pair(node, name));
            hasRecordedNode = true;

            // If both the value and derivative of the function are needed, it's faster to calculate them both
            // at once, so check to see if both are needed.

            const ExpressionTreeNode* valueNode = NULL;
            const ExpressionTreeNode* derivNode = NULL;
            for (int j = 0; j < (int) allExpressions.size(); j++)
                findRelatedTabulatedFunctions(node, allExpressions[j].getRootNode(), valueNode, derivNode);
            string valueName = name;
            string derivName = name;
            if (valueNode != NULL && derivNode != NULL) {
97
                string name2 = prefix+context.intToString(temps.size());
98
                out << tempType << " " << name2 << " = 0.0f;\n";
99
100
101
102
103
104
105
106
107
                if (isDeriv) {
                    valueName = name2;
                    temps.push_back(make_pair(*valueNode, name2));
                }
                else {
                    derivName = name2;
                    temps.push_back(make_pair(*derivNode, name2));
                }
            }
108
109
110
111
            out << "{\n";
            out << "float4 params = " << functionParams << "[" << i << "];\n";
            out << "float x = " << getTempName(node.getChildren()[0], temps) << ";\n";
            out << "if (x >= params.x && x <= params.y) {\n";
112
113
            out << "x = (x-params.x)*params.z;\n";
            out << "int index = (int) (floor(x));\n";
114
            out << "index = min(index, (int) params.w);\n";
115
            out << "float4 coeff = " << functions[i].second << "[index];\n";
116
117
            out << "float b = x-index;\n";
            out << "float a = 1.0f-b;\n";
118
            if (valueNode != NULL)
119
                out << valueName << " = a*coeff.x+b*coeff.y+((a*a*a-a)*coeff.z+(b*b*b-b)*coeff.w)/(params.z*params.z);\n";
120
            if (derivNode != NULL)
121
                out << derivName << " = (coeff.y-coeff.x)*params.z+((1.0f-3.0f*a*a)*coeff.z+(3.0f*b*b-1.0f)*coeff.w)/params.z;\n";
122
123
124
            out << "}\n";
            out << "}";
            break;
125
126
        }
        case Operation::ADD:
127
128
            out << getTempName(node.getChildren()[0], temps) << "+" << getTempName(node.getChildren()[1], temps);
            break;
129
        case Operation::SUBTRACT:
130
131
            out << getTempName(node.getChildren()[0], temps) << "-" << getTempName(node.getChildren()[1], temps);
            break;
132
        case Operation::MULTIPLY:
133
134
            out << getTempName(node.getChildren()[0], temps) << "*" << getTempName(node.getChildren()[1], temps);
            break;
135
        case Operation::DIVIDE:
136
137
138
139
140
141
142
143
144
        {
            bool haveReciprocal = false;
            for (int i = 0; i < (int) temps.size(); i++)
                if (temps[i].first.getOperation().getId() == Operation::RECIPROCAL && temps[i].first.getChildren()[0] == node.getChildren()[1]) {
                    haveReciprocal = true;
                    out << getTempName(node.getChildren()[0], temps) << "*" << temps[i].second;
                }
            if (!haveReciprocal)
                out << getTempName(node.getChildren()[0], temps) << "/" << getTempName(node.getChildren()[1], temps);
145
            break;
146
        }
147
        case Operation::POWER:
148
149
            out << "pow(" << getTempName(node.getChildren()[0], temps) << ", " << getTempName(node.getChildren()[1], temps) << ")";
            break;
150
        case Operation::NEGATE:
151
152
            out << "-" << getTempName(node.getChildren()[0], temps);
            break;
153
        case Operation::SQRT:
154
155
            out << "sqrt(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
156
        case Operation::EXP:
157
            out << "EXP(" << getTempName(node.getChildren()[0], temps) << ")";
158
            break;
159
        case Operation::LOG:
160
            out << "LOG(" << getTempName(node.getChildren()[0], temps) << ")";
161
            break;
162
        case Operation::SIN:
163
164
            out << "sin(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
165
        case Operation::COS:
166
167
            out << "cos(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
168
        case Operation::SEC:
169
170
            out << "1.0f/cos(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
171
        case Operation::CSC:
172
173
            out << "1.0f/sin(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
174
        case Operation::TAN:
175
176
            out << "tan(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
177
        case Operation::COT:
178
179
            out << "1.0f/tan(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
180
        case Operation::ASIN:
181
182
            out << "asin(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
183
        case Operation::ACOS:
184
185
            out << "acos(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
186
        case Operation::ATAN:
187
188
            out << "atan(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
189
190
191
192
193
194
195
196
197
        case Operation::SINH:
            out << "sinh(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
        case Operation::COSH:
            out << "cosh(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
        case Operation::TANH:
            out << "tanh(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
198
199
200
201
202
203
        case Operation::ERF:
            out << "erf(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
        case Operation::ERFC:
            out << "erfc(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
204
205
206
        case Operation::STEP:
            out << getTempName(node.getChildren()[0], temps) << " >= 0.0f ? 1.0f : 0.0f";
            break;
207
208
209
        case Operation::DELTA:
            out << getTempName(node.getChildren()[0], temps) << " == 0.0f ? 1.0f : 0.0f";
            break;
210
        case Operation::SQUARE:
211
212
213
214
215
        {
            string arg = getTempName(node.getChildren()[0], temps);
            out << arg << "*" << arg;
            break;
        }
216
        case Operation::CUBE:
217
218
219
220
221
        {
            string arg = getTempName(node.getChildren()[0], temps);
            out << arg << "*" << arg << "*" << arg;
            break;
        }
222
        case Operation::RECIPROCAL:
223
            out << "RECIP(" << getTempName(node.getChildren()[0], temps) << ")";
224
            break;
225
        case Operation::ADD_CONSTANT:
226
            out << context.doubleToString(dynamic_cast<const Operation::AddConstant*>(&node.getOperation())->getValue()) << "+" << getTempName(node.getChildren()[0], temps);
227
            break;
228
        case Operation::MULTIPLY_CONSTANT:
229
            out << context.doubleToString(dynamic_cast<const Operation::MultiplyConstant*>(&node.getOperation())->getValue()) << "*" << getTempName(node.getChildren()[0], temps);
230
            break;
231
        case Operation::POWER_CONSTANT:
232
233
234
235
236
237
        {
            double exponent = dynamic_cast<const Operation::PowerConstant*>(&node.getOperation())->getValue();
            if (exponent == 0.0)
                out << "1.0f";
            else if (exponent == (int) exponent) {
                out << "0.0f;\n";
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
                temps.push_back(make_pair(node, name));
                hasRecordedNode = true;

                // If multiple integral powers of the same base are needed, it's faster to calculate all of them
                // at once, so check to see if others are also needed.

                map<int, const ExpressionTreeNode*> powers;
                powers[(int) exponent] = &node;
                for (int j = 0; j < (int) allExpressions.size(); j++)
                    findRelatedPowers(node, allExpressions[j].getRootNode(), powers);
                vector<int> exponents;
                vector<string> names;
                vector<bool> hasAssigned(powers.size(), false);
                exponents.push_back((int) fabs(exponent));
                names.push_back(name);
                for (map<int, const ExpressionTreeNode*>::const_iterator iter = powers.begin(); iter != powers.end(); ++iter) {
                    if (iter->first != exponent) {
255
                        exponents.push_back(iter->first >= 0 ? iter->first : -iter->first);
256
                        string name2 = prefix+context.intToString(temps.size());
257
258
                        names.push_back(name2);
                        temps.push_back(make_pair(*iter->second, name2));
259
                        out << tempType << " " << name2 << " = 0.0f;\n";
260
261
                    }
                }
262
263
                out << "{\n";
                out << "float multiplier = " << (exponent < 0.0 ? "1.0f/" : "") << getTempName(node.getChildren()[0], temps) << ";\n";
264
265
266
                bool done = false;
                while (!done) {
                    done = true;
267
                    for (int i = 0; i < (int) exponents.size(); i++) {
268
269
270
271
272
273
274
275
276
277
                        if (exponents[i]%2 == 1) {
                            if (!hasAssigned[i])
                                out << names[i] << " = multiplier;\n";
                            else
                                out << names[i] << " *= multiplier;\n";
                            hasAssigned[i] = true;
                        }
                        exponents[i] >>= 1;
                        if (exponents[i] != 0)
                            done = false;
278
                    }
279
                    if (!done)
280
281
282
283
284
                        out << "multiplier *= multiplier;\n";
                }
                out << "}";
            }
            else
285
                out << "pow(" << getTempName(node.getChildren()[0], temps) << ", " << context.doubleToString(exponent) << ")";
286
            break;
287
        }
288
289
290
291
292
293
294
295
296
        case Operation::MIN:
            out << "min(" << getTempName(node.getChildren()[0], temps) << ", " << getTempName(node.getChildren()[1], temps) << ")";
            break;
        case Operation::MAX:
            out << "max(" << getTempName(node.getChildren()[0], temps) << ", " << getTempName(node.getChildren()[1], temps) << ")";
            break;
        case Operation::ABS:
            out << "fabs(" << getTempName(node.getChildren()[0], temps) << ")";
            break;
297
298
        default:
            throw OpenMMException("Internal error: Unknown operation in user-defined expression: "+node.getOperation().getName());
299
    }
300
    out << ";\n";
301
302
    if (!hasRecordedNode)
        temps.push_back(make_pair(node, name));
303
304
305
306
307
308
309
310
311
}

/**
 * Look up the text used to reference the value of an expression node.
 *
 * @param node   the node to look up
 * @param temps  the nodes whose values are available, paired with the text referencing them
 * @return the text paired with the first entry of "temps" that equals "node"
 * @throws OpenMMException if no entry matches
 */
string OpenCLExpressionUtilities::getTempName(const ExpressionTreeNode& node, const vector<pair<ExpressionTreeNode, string> >& temps) {
    typedef vector<pair<ExpressionTreeNode, string> >::const_iterator TempIterator;
    for (TempIterator entry = temps.begin(); entry != temps.end(); ++entry) {
        if (entry->first == node)
            return entry->second;
    }

    // Reaching this point means a node was referenced before it was processed.
    stringstream message;
    message << "Internal error: No temporary variable for expression node: " << node;
    throw OpenMMException(message.str());
}
313
314
315
316
317
318
319
320
321
322
323
324
325

void OpenCLExpressionUtilities::findRelatedTabulatedFunctions(const ExpressionTreeNode& node, const ExpressionTreeNode& searchNode,
            const ExpressionTreeNode*& valueNode, const ExpressionTreeNode*& derivNode) {
    if (searchNode.getOperation().getId() == Operation::CUSTOM && node.getChildren()[0] == searchNode.getChildren()[0]) {
        if (dynamic_cast<const Operation::Custom*>(&searchNode.getOperation())->getDerivOrder()[0] == 0)
            valueNode = &searchNode;
        else
            derivNode = &searchNode;
    }
    else
        for (int i = 0; i < (int) searchNode.getChildren().size(); i++)
            findRelatedTabulatedFunctions(node, searchNode.getChildren()[i], valueNode, derivNode);
}
326
327
328

void OpenCLExpressionUtilities::findRelatedPowers(const ExpressionTreeNode& node, const ExpressionTreeNode& searchNode, map<int, const ExpressionTreeNode*>& powers) {
    if (searchNode.getOperation().getId() == Operation::POWER_CONSTANT && node.getChildren()[0] == searchNode.getChildren()[0]) {
329
330
331
332
        double realPower = dynamic_cast<const Operation::PowerConstant*>(&searchNode.getOperation())->getValue();
        int power = (int) realPower;
        if (power != realPower)
            return; // We are only interested in integer powers.
333
334
335
336
337
338
339
340
341
342
        if (powers.find(power) != powers.end())
            return; // This power is already in the map.
        if (powers.begin()->first*power < 0)
            return; // All powers must have the same sign.
        powers[power] = &searchNode;
    }
    else
        for (int i = 0; i < (int) searchNode.getChildren().size(); i++)
            findRelatedPowers(node, searchNode.getChildren()[i], powers);
}
343

344
345
/**
 * Compute the spline coefficients for a tabulated function.
 *
 * The values are taken to be samples at equally spaced points from "min" to "max" inclusive.
 * A natural spline is fit through them, and one mm_float4 is produced per interval holding
 * (values[i], values[i+1], derivs[i]/6, derivs[i+1]/6), where "derivs" is the output of
 * SplineFitter::createNaturalSpline().
 *
 * @param values  the tabulated values; at least two are required
 * @param min     the x value corresponding to the first tabulated value
 * @param max     the x value corresponding to the last tabulated value
 * @return one set of coefficients for each of the values.size()-1 intervals
 * @throws OpenMMException if fewer than two values are supplied
 */
vector<mm_float4> OpenCLExpressionUtilities::computeFunctionCoefficients(const vector<double>& values, double min, double max) {
    // Fewer than two values would make the grid spacing a division by zero and the number of intervals non-positive.
    int numValues = (int) values.size();
    if (numValues < 2)
        throw OpenMMException("computeFunctionCoefficients: a tabulated function must have at least two values");

    // Compute the spline coefficients.

    vector<double> x(numValues), derivs;
    for (int i = 0; i < numValues; i++)
        x[i] = min+i*(max-min)/(numValues-1);
    SplineFitter::createNaturalSpline(x, values, derivs);
    vector<mm_float4> f(numValues-1);
    for (int i = 0; i < numValues-1; i++)
        f[i] = mm_float4((cl_float) values[i], (cl_float) values[i+1], (cl_float) (derivs[i]/6.0), (cl_float) (derivs[i+1]/6.0));
    return f;
}