c_api.h 20.6 KB
Newer Older
Guolin Ke's avatar
Guolin Ke committed
1
2
#ifndef LIGHTGBM_C_API_H_
#define LIGHTGBM_C_API_H_
3
4
5
#include <cstdint>
#include <exception>
#include <stdexcept>
wxchan's avatar
wxchan committed
6
#include <cstring>
7
#include <string>
wxchan's avatar
wxchan committed
8

9
10
11
/*!
* To avoid type conversion on large data, most of our exposed interfaces support both float_32 and float_64.
* Except following:
wxchan's avatar
wxchan committed
12
* 1. gradients and hessians.
13
* 2. Get current score for training data and validation
wxchan's avatar
wxchan committed
14
* The reason is that they are called frequently, so type conversion on them may be time-consuming.
15
16
*/

17
#include <LightGBM/export.h>
Guolin Ke's avatar
Guolin Ke committed
18

Guolin Ke's avatar
typo  
Guolin Ke committed
19
/*! \brief opaque handle to a dataset; produced through the `out` argument of the LGBM_DatasetCreateFrom* functions and released with LGBM_DatasetFree */
typedef void* DatasetHandle;
Guolin Ke's avatar
Guolin Ke committed
20
21
/*! \brief opaque handle to a booster; produced through the `out` argument of LGBM_BoosterCreate / LGBM_BoosterCreateFromModelfile and released with LGBM_BoosterFree */
typedef void* BoosterHandle;

Guolin Ke's avatar
Guolin Ke committed
22
23
24
25
26
27
28
29
/*!
* \brief element-type tags for the untyped (void*) buffers of this API.
*  They are passed in the *_type arguments (data_type, indptr_type, col_ptr_type, type)
*  and returned through out_type; each function documents which tags it accepts.
*/
#define C_API_DTYPE_FLOAT32 (0)
#define C_API_DTYPE_FLOAT64 (1)
#define C_API_DTYPE_INT32   (2)
#define C_API_DTYPE_INT64   (3)

/*!
* \brief values for the predict_type argument of the prediction functions:
*  C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*  C_API_PREDICT_RAW_SCORE: raw score
*  C_API_PREDICT_LEAF_INDEX: leaf index
*/
#define C_API_PREDICT_NORMAL     (0)
#define C_API_PREDICT_RAW_SCORE  (1)
#define C_API_PREDICT_LEAF_INDEX (2)
30

Guolin Ke's avatar
Guolin Ke committed
31
32
/*!
* \brief get string message of the last error
wxchan's avatar
wxchan committed
33
*  all functions in this file return 0 on success
Guolin Ke's avatar
Guolin Ke committed
34
35
36
*  and -1 when an error occurred
* \return const char* error information
*/
37
LIGHTGBM_C_EXPORT const char* LGBM_GetLastError();
Guolin Ke's avatar
Guolin Ke committed
38
39


Guolin Ke's avatar
Guolin Ke committed
40
// --- start Dataset interface
Guolin Ke's avatar
Guolin Ke committed
41
42
43
44

/*!
* \brief load a dataset from file, as the command-line LightGBM does
* \param filename the name of the file
Guolin Ke's avatar
Guolin Ke committed
45
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
46
47
* \param reference used to align bin mapper with another dataset, nullptr means not used
* \param out a loaded dataset
wxchan's avatar
wxchan committed
48
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
49
*/
50
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromFile(const char* filename,
Guolin Ke's avatar
Guolin Ke committed
51
  const char* parameters,
52
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
53
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
54
55
56
57

/*!
* \brief create a dataset from CSR format
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
58
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
59
60
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
61
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
62
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
63
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
64
* \param num_col number of columns
Guolin Ke's avatar
Guolin Ke committed
65
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
66
67
* \param reference used to align bin mapper with another dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
68
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
69
*/
70
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromCSR(const void* indptr,
71
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
72
  const int32_t* indices,
73
  const void* data,
74
75
76
77
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
78
  const char* parameters,
79
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
80
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
81
82
83
84

/*!
* \brief create a dataset from CSC format
* \param col_ptr pointer to col headers
wxchan's avatar
wxchan committed
85
* \param col_ptr_type type of col_ptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
86
87
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
88
89
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param ncol_ptr number of cols in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
90
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
91
* \param num_row number of rows
Guolin Ke's avatar
Guolin Ke committed
92
93
94
* \param parameters additional parameters
* \param reference used to align bin mapper with another dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
95
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
96
*/
97
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromCSC(const void* col_ptr,
98
  int col_ptr_type,
Guolin Ke's avatar
Guolin Ke committed
99
100
  const int32_t* indices,
  const void* data,
101
102
103
104
  int data_type,
  int64_t ncol_ptr,
  int64_t nelem,
  int64_t num_row,
Guolin Ke's avatar
Guolin Ke committed
105
  const char* parameters,
106
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
107
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
108
109
110
111

/*!
* \brief create dataset from dense matrix
* \param data pointer to the data space
wxchan's avatar
wxchan committed
112
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
113
114
* \param nrow number of rows
* \param ncol number of columns
115
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
116
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
117
118
* \param reference used to align bin mapper with another dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
119
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
120
*/
121
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromMat(const void* data,
122
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
123
124
  int32_t nrow,
  int32_t ncol,
125
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
126
  const char* parameters,
127
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
128
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
129

wxchan's avatar
wxchan committed
130
131
132
133
134
135
136
137
138
/*!
* \brief Create subset of a data
* \param handle handle of full dataset
* \param used_row_indices Indices used in subset
* \param num_used_row_indices len of used_row_indices
* \param parameters additional parameters
* \param out subset of data
* \return 0 when succeed, -1 when failure happens
*/
139
LIGHTGBM_C_EXPORT int LGBM_DatasetGetSubset(
140
  const DatasetHandle handle,
wxchan's avatar
wxchan committed
141
142
143
  const int32_t* used_row_indices,
  int32_t num_used_row_indices,
  const char* parameters,
Guolin Ke's avatar
typo  
Guolin Ke committed
144
  DatasetHandle* out);
wxchan's avatar
wxchan committed
145

Guolin Ke's avatar
Guolin Ke committed
146
147
148
149
150
151
152
/*!
* \brief save feature names to Dataset
* \param handle handle
* \param feature_names feature names
* \param num_feature_names number of feature names
* \return 0 when succeed, -1 when failure happens
*/
153
LIGHTGBM_C_EXPORT int LGBM_DatasetSetFeatureNames(
Guolin Ke's avatar
typo  
Guolin Ke committed
154
  DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
155
  const char** feature_names,
Guolin Ke's avatar
Guolin Ke committed
156
  int num_feature_names);
Guolin Ke's avatar
Guolin Ke committed
157

158
159
160
161
162
163
164
165

/*!
* \brief get feature names of Dataset
* \param handle handle
* \param feature_names feature names, should pre-allocate memory
* \param num_feature_names number of feature names
* \return 0 when succeed, -1 when failure happens
*/
166
LIGHTGBM_C_EXPORT int LGBM_DatasetGetFeatureNames(
167
168
  DatasetHandle handle,
  char** feature_names,
Guolin Ke's avatar
Guolin Ke committed
169
  int* num_feature_names);
170
171


Guolin Ke's avatar
Guolin Ke committed
172
173
/*!
* \brief free space for dataset
wxchan's avatar
wxchan committed
174
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
175
*/
176
LIGHTGBM_C_EXPORT int LGBM_DatasetFree(DatasetHandle handle);
Guolin Ke's avatar
Guolin Ke committed
177
178
179
180
181

/*!
* \brief save dataset to binary file
* \param handle an instance of dataset
* \param filename file name
wxchan's avatar
wxchan committed
182
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
183
*/
184
LIGHTGBM_C_EXPORT int LGBM_DatasetSaveBinary(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
185
186
187
188
  const char* filename);

/*!
* \brief set vector to a content in info
wxchan's avatar
wxchan committed
189
190
*        Note: group and group_id only work for C_API_DTYPE_INT32
*              label and weight only work for C_API_DTYPE_FLOAT32
Guolin Ke's avatar
Guolin Ke committed
191
* \param handle an instance of dataset
wxchan's avatar
wxchan committed
192
* \param field_name field name, can be label, weight, group, group_id
193
* \param field_data pointer to vector
Guolin Ke's avatar
Guolin Ke committed
194
* \param num_element number of element in field_data
wxchan's avatar
wxchan committed
195
196
* \param type C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
197
*/
198
LIGHTGBM_C_EXPORT int LGBM_DatasetSetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
199
200
  const char* field_name,
  const void* field_data,
Guolin Ke's avatar
Guolin Ke committed
201
  int num_element,
Guolin Ke's avatar
Guolin Ke committed
202
203
204
  int type);

/*!
205
* \brief get info vector from dataset
Guolin Ke's avatar
Guolin Ke committed
206
207
208
209
* \param handle an instance of data matrix
* \param field_name field name
* \param out_len used to set result length
* \param out_ptr pointer to the result
wxchan's avatar
wxchan committed
210
211
* \param out_type  C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
212
*/
213
LIGHTGBM_C_EXPORT int LGBM_DatasetGetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
214
  const char* field_name,
Guolin Ke's avatar
Guolin Ke committed
215
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
216
217
218
219
220
221
222
  const void** out_ptr,
  int* out_type);

/*!
* \brief get number of data.
* \param handle the handle to the dataset
* \param out The address to hold number of data
wxchan's avatar
wxchan committed
223
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
224
*/
225
LIGHTGBM_C_EXPORT int LGBM_DatasetGetNumData(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
226
  int* out);
Guolin Ke's avatar
Guolin Ke committed
227
228
229
230
231

/*!
* \brief get number of features
* \param handle the handle to the dataset
* \param out The output of number of features
wxchan's avatar
wxchan committed
232
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
233
*/
234
LIGHTGBM_C_EXPORT int LGBM_DatasetGetNumFeature(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
235
  int* out);
Guolin Ke's avatar
Guolin Ke committed
236
237
238
239
240

// --- start Booster interfaces

/*!
* \brief create a new boosting learner
Guolin Ke's avatar
Guolin Ke committed
241
* \param train_data training data set
Guolin Ke's avatar
Guolin Ke committed
242
243
* \param parameters format: 'key1=value1 key2=value2'
* \param out handle of created Booster
wxchan's avatar
wxchan committed
244
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
245
*/
246
LIGHTGBM_C_EXPORT int LGBM_BoosterCreate(const DatasetHandle train_data,
Guolin Ke's avatar
Guolin Ke committed
247
248
249
250
  const char* parameters,
  BoosterHandle* out);

/*!
Guolin Ke's avatar
Guolin Ke committed
251
* \brief load an existing boosting from model file
Guolin Ke's avatar
Guolin Ke committed
252
* \param filename filename of model
wxchan's avatar
wxchan committed
253
* \param out_num_iterations number of iterations of this booster
Guolin Ke's avatar
Guolin Ke committed
254
* \param out handle of created Booster
wxchan's avatar
wxchan committed
255
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
256
*/
257
LIGHTGBM_C_EXPORT int LGBM_BoosterCreateFromModelfile(
Guolin Ke's avatar
Guolin Ke committed
258
  const char* filename,
Guolin Ke's avatar
Guolin Ke committed
259
  int* out_num_iterations,
Guolin Ke's avatar
Guolin Ke committed
260
261
  BoosterHandle* out);

wxchan's avatar
wxchan committed
262

Guolin Ke's avatar
Guolin Ke committed
263
264
265
/*!
* \brief free obj in handle
* \param handle handle to be freed
wxchan's avatar
wxchan committed
266
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
267
*/
268
LIGHTGBM_C_EXPORT int LGBM_BoosterFree(BoosterHandle handle);
Guolin Ke's avatar
Guolin Ke committed
269

wxchan's avatar
wxchan committed
270
271
272
273
274
275
/*!
* \brief Merge model in two booster to first handle
* \param handle handle, will merge other handle to this
* \param other_handle handle of the booster whose model is merged into handle
* \return 0 when succeed, -1 when failure happens
*/
276
LIGHTGBM_C_EXPORT int LGBM_BoosterMerge(BoosterHandle handle,
wxchan's avatar
wxchan committed
277
278
279
280
281
282
283
284
  BoosterHandle other_handle);

/*!
* \brief Add new validation to booster
* \param handle handle
* \param valid_data validation data set
* \return 0 when succeed, -1 when failure happens
*/
285
LIGHTGBM_C_EXPORT int LGBM_BoosterAddValidData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
286
  const DatasetHandle valid_data);
wxchan's avatar
wxchan committed
287
288
289
290
291
292
293

/*!
* \brief Reset training data for booster
* \param handle handle
* \param train_data training data set
* \return 0 when succeed, -1 when failure happens
*/
294
LIGHTGBM_C_EXPORT int LGBM_BoosterResetTrainingData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
295
  const DatasetHandle train_data);
wxchan's avatar
wxchan committed
296
297
298
299
300
301
302

/*!
* \brief Reset config for current booster
* \param handle handle
* \param parameters format: 'key1=value1 key2=value2'
* \return 0 when succeed, -1 when failure happens
*/
303
LIGHTGBM_C_EXPORT int LGBM_BoosterResetParameter(BoosterHandle handle, const char* parameters);
wxchan's avatar
wxchan committed
304
305

/*!
Guolin Ke's avatar
Guolin Ke committed
306
* \brief Get number of class
wxchan's avatar
wxchan committed
307
308
309
310
* \param handle handle
* \param out_len number of class
* \return 0 when succeed, -1 when failure happens
*/
311
LIGHTGBM_C_EXPORT int LGBM_BoosterGetNumClasses(BoosterHandle handle, int* out_len);
wxchan's avatar
wxchan committed
312

Guolin Ke's avatar
Guolin Ke committed
313
314
315
/*!
* \brief update the model in one round
* \param handle handle
Guolin Ke's avatar
Guolin Ke committed
316
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
317
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
318
*/
319
LIGHTGBM_C_EXPORT int LGBM_BoosterUpdateOneIter(BoosterHandle handle, int* is_finished);
Guolin Ke's avatar
Guolin Ke committed
320
321
322
323
324
325
326

/*!
* \brief update the model, by directly specify gradient and second order gradient,
*       this can be used to support customized loss function
* \param handle handle
* \param grad gradient statistics
* \param hess second order gradient statistics
Guolin Ke's avatar
Guolin Ke committed
327
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
328
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
329
*/
330
LIGHTGBM_C_EXPORT int LGBM_BoosterUpdateOneIterCustom(BoosterHandle handle,
331
332
  const float* grad,
  const float* hess,
Guolin Ke's avatar
Guolin Ke committed
333
334
335
  int* is_finished);

/*!
wxchan's avatar
wxchan committed
336
* \brief Rollback one iteration
Guolin Ke's avatar
Guolin Ke committed
337
* \param handle handle
wxchan's avatar
wxchan committed
338
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
339
*/
340
LIGHTGBM_C_EXPORT int LGBM_BoosterRollbackOneIter(BoosterHandle handle);
wxchan's avatar
wxchan committed
341
342
343
344
345
346

/*!
* \brief Get iteration of current boosting rounds
* \param out_iteration iteration of boosting rounds
* \return 0 when succeed, -1 when failure happens
*/
347
LIGHTGBM_C_EXPORT int LGBM_BoosterGetCurrentIteration(BoosterHandle handle, int* out_iteration);
Guolin Ke's avatar
Guolin Ke committed
348

Guolin Ke's avatar
Guolin Ke committed
349
/*!
Guolin Ke's avatar
Guolin Ke committed
350
* \brief Get number of eval
wxchan's avatar
wxchan committed
351
352
353
* \param out_len total number of eval results
* \return 0 when succeed, -1 when failure happens
*/
354
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEvalCounts(BoosterHandle handle, int* out_len);
wxchan's avatar
wxchan committed
355
356
357
358

/*!
* \brief Get Name of eval
* \param out_len total number of eval results
Guolin Ke's avatar
typo  
Guolin Ke committed
359
* \param out_strs names of eval result, need to pre-allocate memory before call this
wxchan's avatar
wxchan committed
360
361
* \return 0 when succeed, -1 when failure happens
*/
362
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEvalNames(BoosterHandle handle, int* out_len, char** out_strs);
wxchan's avatar
wxchan committed
363
364
365

/*!
* \brief get evaluation for training data and validation data
Guolin Ke's avatar
Guolin Ke committed
366
367
Note: 1. you should call LGBM_BoosterGetEvalNames first to get the name of evaluation results
2. should pre-allocate memory for out_results, you can get its length by LGBM_BoosterGetEvalCounts
Guolin Ke's avatar
Guolin Ke committed
368
* \param handle handle
wxchan's avatar
wxchan committed
369
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
370
* \param out_len len of output result
wxchan's avatar
wxchan committed
371
372
* \param out_results double array that receives the results
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
373
*/
374
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEval(BoosterHandle handle,
wxchan's avatar
wxchan committed
375
  int data_idx,
Guolin Ke's avatar
Guolin Ke committed
376
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
377
378
379
380
381
382
383
384
385
386
387
  double* out_results);

/*!
* \brief Get number of predict for inner dataset
this can be used to support customized eval function
Note:  should pre-allocate memory for out_result, its length is equal to num_class * num_data
* \param handle handle
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
* \param out_len len of output result
* \return 0 when succeed, -1 when failure happens
*/
388
LIGHTGBM_C_EXPORT int LGBM_BoosterGetNumPredict(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
389
390
  int data_idx,
  int64_t* out_len);
Guolin Ke's avatar
Guolin Ke committed
391

Guolin Ke's avatar
Guolin Ke committed
392
/*!
Guolin Ke's avatar
Guolin Ke committed
393
* \brief Get prediction for training data and validation data
Guolin Ke's avatar
Guolin Ke committed
394
395
this can be used to support customized eval function
Note:  should pre-allocate memory for out_result, its length is equal to num_class * num_data
Guolin Ke's avatar
Guolin Ke committed
396
* \param handle handle
wxchan's avatar
wxchan committed
397
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
398
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
399
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
400
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
401
*/
402
LIGHTGBM_C_EXPORT int LGBM_BoosterGetPredict(BoosterHandle handle,
wxchan's avatar
wxchan committed
403
  int data_idx,
404
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
405
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
406

407
408
409
410
/*!
* \brief make prediction for file
* \param handle handle
* \param data_filename filename of data file
wxchan's avatar
wxchan committed
411
412
413
414
415
416
* \param data_has_header data file has header or not
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
417
* \param result_filename filename of result file
wxchan's avatar
wxchan committed
418
* \return 0 when succeed, -1 when failure happens
419
*/
420
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForFile(BoosterHandle handle,
421
  const char* data_filename,
wxchan's avatar
wxchan committed
422
423
  int data_has_header,
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
424
  int num_iteration,
425
426
  const char* result_filename);

Guolin Ke's avatar
Guolin Ke committed
427
428
429
/*!
* \brief Get number of prediction
* \param handle handle
Guolin Ke's avatar
Guolin Ke committed
430
* \param num_row
Guolin Ke's avatar
Guolin Ke committed
431
432
433
434
435
436
437
438
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len length of prediction
* \return 0 when succeed, -1 when failure happens
*/
439
LIGHTGBM_C_EXPORT int LGBM_BoosterCalcNumPredict(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
440
  int num_row,
Guolin Ke's avatar
Guolin Ke committed
441
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
442
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
443
444
  int64_t* out_len);

Guolin Ke's avatar
Guolin Ke committed
445
446
/*!
* \brief make prediction for a new data set
Guolin Ke's avatar
Guolin Ke committed
447
*        Note:  should pre-allocate memory for out_result,
wxchan's avatar
wxchan committed
448
449
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
450
451
* \param handle handle
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
452
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
453
454
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
455
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
456
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
457
458
459
* \param nelem number of nonzero elements in the matrix
* \param num_col number of columns; when it's set to 0, then guess from data
* \param predict_type
wxchan's avatar
wxchan committed
460
461
462
463
464
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
465
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
466
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
467
*/
468
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForCSR(BoosterHandle handle,
469
470
  const void* indptr,
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
471
  const int32_t* indices,
472
  const void* data,
473
474
475
476
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
477
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
478
  int num_iteration,
wxchan's avatar
wxchan committed
479
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
  double* out_result);

/*!
* \brief make prediction for a new data set
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
* \param handle handle
* \param col_ptr pointer to col headers
* \param col_ptr_type type of col_ptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
* \param indices findex
* \param data fvalue
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param ncol_ptr number of cols in the matrix + 1
* \param nelem number of nonzero elements in the matrix
* \param num_row number of rows
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
* \param out_result used to set a pointer to array, should allocate memory before call this function
* \return 0 when succeed, -1 when failure happens
*/
505
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForCSC(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
506
507
508
509
510
511
512
513
514
  const void* col_ptr,
  int col_ptr_type,
  const int32_t* indices,
  const void* data,
  int data_type,
  int64_t ncol_ptr,
  int64_t nelem,
  int64_t num_row,
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
515
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
516
517
  int64_t* out_len,
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
518
519
520

/*!
* \brief make prediction for a new data set
wxchan's avatar
wxchan committed
521
522
523
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
524
525
* \param handle handle
* \param data pointer to the data space
wxchan's avatar
wxchan committed
526
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
527
528
* \param nrow number of rows
* \param ncol number of columns
Guolin Ke's avatar
Guolin Ke committed
529
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
530
* \param predict_type
wxchan's avatar
wxchan committed
531
532
533
534
535
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
536
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
537
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
538
*/
539
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForMat(BoosterHandle handle,
540
  const void* data,
541
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
542
543
  int32_t nrow,
  int32_t ncol,
Guolin Ke's avatar
Guolin Ke committed
544
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
545
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
546
  int num_iteration,
wxchan's avatar
wxchan committed
547
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
548
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
549
550
551
552

/*!
* \brief save model into file
* \param handle handle
wxchan's avatar
wxchan committed
553
* \param num_iteration number of iterations to save, <= 0 means save all
Guolin Ke's avatar
Guolin Ke committed
554
* \param filename file name
wxchan's avatar
wxchan committed
555
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
556
*/
557
LIGHTGBM_C_EXPORT int LGBM_BoosterSaveModel(BoosterHandle handle,
wxchan's avatar
wxchan committed
558
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
559
560
  const char* filename);

wxchan's avatar
wxchan committed
561
562
563
/*!
* \brief dump model to json
* \param handle handle
564
* \param num_iteration number of iterations to dump, <= 0 means dump all
wxchan's avatar
wxchan committed
565
566
* \param buffer_len string buffer length, if buffer_len < out_len, re-allocate buffer
* \param out_len actual output length
Guolin Ke's avatar
typo  
Guolin Ke committed
567
* \param out_str json format string of model, need to pre-allocate memory before call this
wxchan's avatar
wxchan committed
568
569
* \return 0 when succeed, -1 when failure happens
*/
570
LIGHTGBM_C_EXPORT int LGBM_BoosterDumpModel(BoosterHandle handle,
571
  int num_iteration,
wxchan's avatar
wxchan committed
572
  int buffer_len,
Guolin Ke's avatar
Guolin Ke committed
573
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
574
  char* out_str);
575

Guolin Ke's avatar
Guolin Ke committed
576
/*!
Guolin Ke's avatar
Guolin Ke committed
577
* \brief Get leaf value
Guolin Ke's avatar
Guolin Ke committed
578
579
580
581
582
583
* \param handle handle
* \param tree_idx index of tree
* \param leaf_idx index of leaf
* \param out_val out result
* \return 0 when succeed, -1 when failure happens
*/
584
LIGHTGBM_C_EXPORT int LGBM_BoosterGetLeafValue(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
585
586
  int tree_idx,
  int leaf_idx,
Guolin Ke's avatar
Guolin Ke committed
587
  double* out_val);
Guolin Ke's avatar
Guolin Ke committed
588
589
590
591
592
593
594
595
596

/*!
* \brief Set leaf value
* \param handle handle
* \param tree_idx index of tree
* \param leaf_idx index of leaf
* \param val leaf value
* \return 0 when succeed, -1 when failure happens
*/
597
LIGHTGBM_C_EXPORT int LGBM_BoosterSetLeafValue(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
598
599
  int tree_idx,
  int leaf_idx,
Guolin Ke's avatar
Guolin Ke committed
600
  double val);
601

wxchan's avatar
wxchan committed
602
// exception handle and error msg

/*! \brief capacity in bytes (terminating NUL included) of the per-thread error buffer */
static const std::size_t kLastErrorMsgCapacity = 512;

/*!
* \brief access the last-error buffer of the calling thread
*  The buffer is thread-local and initially holds "Everything is fine".
*  Note: this function is `static`, so each translation unit that includes
*  this header gets its own copy of the function and of the buffer.
* \return pointer to a NUL-terminated buffer of kLastErrorMsgCapacity bytes
*/
#if defined(_MSC_VER)
static char* LastErrorMsg() { static __declspec(thread) char err_msg[kLastErrorMsgCapacity] = "Everything is fine"; return err_msg; }
#else
static char* LastErrorMsg() { static thread_local char err_msg[kLastErrorMsgCapacity] = "Everything is fine"; return err_msg; }
#endif

/*!
* \brief store msg as the last error message of the calling thread
*  Messages that do not fit are truncated to kLastErrorMsgCapacity - 1
*  characters instead of overrunning the buffer.
* \param msg NUL-terminated message; nullptr is stored as an empty message
*/
inline void LGBM_SetLastError(const char* msg) {
  char* buffer = LastErrorMsg();
  if (msg == nullptr) {
    buffer[0] = '\0';
    return;
  }
  std::size_t len = std::strlen(msg);
  if (len >= kLastErrorMsgCapacity) {
    // keep one byte for the terminating NUL
    len = kLastErrorMsgCapacity - 1;
  }
  // memmove rather than memcpy: msg may point into the buffer itself
  std::memmove(buffer, msg, len);
  buffer[len] = '\0';
}

/*!
* \brief record the message of a caught std::exception as the last error
* \param ex the caught exception; the text of ex.what() is stored
* \return always -1, the failure code of this API
*/
inline int LGBM_APIHandleException(const std::exception& ex) {
  LGBM_SetLastError(ex.what());
  return -1;
}

/*!
* \brief record a caught std::string as the last error
* \param ex the caught string; its contents are stored
* \return always -1, the failure code of this API
*/
inline int LGBM_APIHandleException(const std::string& ex) {
  LGBM_SetLastError(ex.c_str());
  return -1;
}

/*!
* \brief record a plain C string as the last error
*  This overload lets API_END's catch(...) branch pass its string literal
*  directly, without first building a temporary std::string (an allocation
*  that could itself throw inside the handler).
* \param msg NUL-terminated message to store
* \return always -1, the failure code of this API
*/
inline int LGBM_APIHandleException(const char* msg) {
  LGBM_SetLastError(msg);
  return -1;
}

/*!
* \brief open the try block that guards the body of a C API function;
*  every API_BEGIN() must be closed by a matching API_END()
*/
#define API_BEGIN() try {

/*!
* \brief close the try block opened by API_BEGIN()
*  A std::exception, a thrown std::string, or any other exception is handed
*  to LGBM_APIHandleException and its result is returned; if nothing was
*  thrown the enclosing function returns 0.
*/
#define API_END()                                                          \
  }                                                                        \
  catch (const std::exception& ex) { return LGBM_APIHandleException(ex); } \
  catch (const std::string& ex) { return LGBM_APIHandleException(ex); }    \
  catch (...) { return LGBM_APIHandleException("unknown exception"); }     \
  return 0;
629

Guolin Ke's avatar
Guolin Ke committed
630
#endif // LIGHTGBM_C_API_H_