c_api.h 21.4 KB
Newer Older
Guolin Ke's avatar
Guolin Ke committed
1
2
#ifndef LIGHTGBM_C_API_H_
#define LIGHTGBM_C_API_H_
3
4
5
#include <cstdint>
#include <exception>
#include <stdexcept>
wxchan's avatar
wxchan committed
6
#include <cstring>
7
#include <string>
wxchan's avatar
wxchan committed
8

9
10
11
/*!
* To avoid type conversion on large data, most of our exposed interfaces support both float_32 and float_64.
* Except the following:
wxchan's avatar
wxchan committed
12
* 1. gradients and hessians.
13
* 2. Get current score for training data and validation
wxchan's avatar
wxchan committed
14
* The reason is that they are called frequently, so type conversion on them may be time-consuming.
15
16
*/

17
#include <LightGBM/export.h>
Guolin Ke's avatar
Guolin Ke committed
18

Guolin Ke's avatar
typo  
Guolin Ke committed
19
/*! \brief opaque handle to a dataset; filled in through the `out` argument of the dataset creation functions declared in this file and released with LGBM_DatasetFree */
typedef void* DatasetHandle;
Guolin Ke's avatar
Guolin Ke committed
20
21
/*! \brief opaque handle to a booster; filled in through the `out` argument of the booster creation/loading functions declared in this file and released with LGBM_BoosterFree */
typedef void* BoosterHandle;

Guolin Ke's avatar
Guolin Ke committed
22
23
24
25
26
27
28
29
/*!
* \brief element-type tags passed in the type arguments of this API
*        (data_type accepts the FLOAT tags, indptr_type / col_ptr_type accept the INT tags)
*/
#define C_API_DTYPE_FLOAT32 (0)
#define C_API_DTYPE_FLOAT64 (1)
#define C_API_DTYPE_INT32   (2)
#define C_API_DTYPE_INT64   (3)

/*!
* \brief values accepted by the predict_type argument of the prediction functions:
*        NORMAL is the normal prediction, with transform (if needed);
*        RAW_SCORE is the raw score; LEAF_INDEX is the leaf index
*/
#define C_API_PREDICT_NORMAL     (0)
#define C_API_PREDICT_RAW_SCORE  (1)
#define C_API_PREDICT_LEAF_INDEX (2)
30

Guolin Ke's avatar
Guolin Ke committed
31
32
/*!
* \brief get string message of the last error
wxchan's avatar
wxchan committed
33
*  all functions in this file return 0 on success
Guolin Ke's avatar
Guolin Ke committed
34
35
36
*  and -1 when an error occurred,
* \return const char* error information
*/
37
LIGHTGBM_C_EXPORT const char* LGBM_GetLastError();
Guolin Ke's avatar
Guolin Ke committed
38
39


Guolin Ke's avatar
Guolin Ke committed
40
// --- start Dataset interface
Guolin Ke's avatar
Guolin Ke committed
41
42
43
44

/*!
* \brief load data set from file like the command_line LightGBM do
* \param filename the name of the file
Guolin Ke's avatar
Guolin Ke committed
45
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
46
47
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out a loaded dataset
wxchan's avatar
wxchan committed
48
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
49
*/
50
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromFile(const char* filename,
Guolin Ke's avatar
Guolin Ke committed
51
  const char* parameters,
52
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
53
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
54
55
56
57

/*!
* \brief create a dataset from CSR format
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
58
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
59
60
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
61
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
62
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
63
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
64
* \param num_col number of columns
Guolin Ke's avatar
Guolin Ke committed
65
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
66
67
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
68
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
69
*/
70
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromCSR(const void* indptr,
71
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
72
  const int32_t* indices,
73
  const void* data,
74
75
76
77
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
78
  const char* parameters,
79
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
80
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
81
82
83
84

/*!
* \brief create a dataset from CSC format
* \param col_ptr pointer to col headers
wxchan's avatar
wxchan committed
85
* \param col_ptr_type type of col_ptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
86
87
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
88
89
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param ncol_ptr number of cols in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
90
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
91
* \param num_row number of rows
Guolin Ke's avatar
Guolin Ke committed
92
93
94
* \param parameters additional parameters
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
95
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
96
*/
97
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromCSC(const void* col_ptr,
98
  int col_ptr_type,
Guolin Ke's avatar
Guolin Ke committed
99
100
  const int32_t* indices,
  const void* data,
101
102
103
104
  int data_type,
  int64_t ncol_ptr,
  int64_t nelem,
  int64_t num_row,
Guolin Ke's avatar
Guolin Ke committed
105
  const char* parameters,
106
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
107
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
108
109
110
111

/*!
* \brief create dataset from dense matrix
* \param data pointer to the data space
wxchan's avatar
wxchan committed
112
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
113
114
* \param nrow number of rows
* \param ncol number of columns
115
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
116
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
117
118
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
119
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
120
*/
121
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromMat(const void* data,
122
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
123
124
  int32_t nrow,
  int32_t ncol,
125
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
126
  const char* parameters,
127
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
128
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
129

wxchan's avatar
wxchan committed
130
131
132
133
134
135
136
137
138
/*!
* \brief Create subset of a data
* \param handle handle of full dataset
* \param used_row_indices Indices used in subset
* \param num_used_row_indices len of used_row_indices
* \param parameters additional parameters
* \param out subset of data
* \return 0 when succeed, -1 when failure happens
*/
139
LIGHTGBM_C_EXPORT int LGBM_DatasetGetSubset(
140
  const DatasetHandle handle,
wxchan's avatar
wxchan committed
141
142
143
  const int32_t* used_row_indices,
  int32_t num_used_row_indices,
  const char* parameters,
Guolin Ke's avatar
typo  
Guolin Ke committed
144
  DatasetHandle* out);
wxchan's avatar
wxchan committed
145

Guolin Ke's avatar
Guolin Ke committed
146
147
148
149
150
151
152
/*!
* \brief save feature names to Dataset
* \param handle handle
* \param feature_names feature names
* \param num_feature_names number of feature names
* \return 0 when succeed, -1 when failure happens
*/
153
LIGHTGBM_C_EXPORT int LGBM_DatasetSetFeatureNames(
Guolin Ke's avatar
typo  
Guolin Ke committed
154
  DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
155
  const char** feature_names,
Guolin Ke's avatar
Guolin Ke committed
156
  int num_feature_names);
Guolin Ke's avatar
Guolin Ke committed
157

158
159
160
161
162
163
164
165

/*!
* \brief get feature names of Dataset
* \param handle handle
* \param feature_names feature names, should pre-allocate memory
* \param num_feature_names number of feature names
* \return 0 when succeed, -1 when failure happens
*/
166
LIGHTGBM_C_EXPORT int LGBM_DatasetGetFeatureNames(
167
168
  DatasetHandle handle,
  char** feature_names,
Guolin Ke's avatar
Guolin Ke committed
169
  int* num_feature_names);
170
171


Guolin Ke's avatar
Guolin Ke committed
172
173
/*!
* \brief free space for dataset
wxchan's avatar
wxchan committed
174
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
175
*/
176
LIGHTGBM_C_EXPORT int LGBM_DatasetFree(DatasetHandle handle);
Guolin Ke's avatar
Guolin Ke committed
177
178
179
180
181

/*!
* \brief save dataset to binary file
* \param handle an instance of dataset
* \param filename file name
wxchan's avatar
wxchan committed
182
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
183
*/
184
LIGHTGBM_C_EXPORT int LGBM_DatasetSaveBinary(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
185
186
187
188
  const char* filename);

/*!
* \brief set vector to a content in info
wxchan's avatar
wxchan committed
189
190
*        Note: group and group_id only work for C_API_DTYPE_INT32
*              label and weight only work for C_API_DTYPE_FLOAT32
Guolin Ke's avatar
Guolin Ke committed
191
* \param handle a instance of dataset
wxchan's avatar
wxchan committed
192
* \param field_name field name, can be label, weight, group, group_id
193
* \param field_data pointer to vector
Guolin Ke's avatar
Guolin Ke committed
194
* \param num_element number of element in field_data
wxchan's avatar
wxchan committed
195
196
* \param type C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
197
*/
198
LIGHTGBM_C_EXPORT int LGBM_DatasetSetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
199
200
  const char* field_name,
  const void* field_data,
Guolin Ke's avatar
Guolin Ke committed
201
  int num_element,
Guolin Ke's avatar
Guolin Ke committed
202
203
204
  int type);

/*!
205
* \brief get info vector from dataset
Guolin Ke's avatar
Guolin Ke committed
206
207
208
209
* \param handle a instance of data matrix
* \param field_name field name
* \param out_len used to set result length
* \param out_ptr pointer to the result
wxchan's avatar
wxchan committed
210
211
* \param out_type  C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
212
*/
213
LIGHTGBM_C_EXPORT int LGBM_DatasetGetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
214
  const char* field_name,
Guolin Ke's avatar
Guolin Ke committed
215
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
216
217
218
219
220
221
222
  const void** out_ptr,
  int* out_type);

/*!
* \brief get number of data.
* \param handle the handle to the dataset
* \param out The address to hold number of data
wxchan's avatar
wxchan committed
223
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
224
*/
225
LIGHTGBM_C_EXPORT int LGBM_DatasetGetNumData(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
226
  int* out);
Guolin Ke's avatar
Guolin Ke committed
227
228
229
230
231

/*!
* \brief get number of features
* \param handle the handle to the dataset
* \param out The output of number of features
wxchan's avatar
wxchan committed
232
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
233
*/
234
LIGHTGBM_C_EXPORT int LGBM_DatasetGetNumFeature(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
235
  int* out);
Guolin Ke's avatar
Guolin Ke committed
236
237
238
239
240

// --- start Booster interfaces

/*!
* \brief create a new boosting learner
Guolin Ke's avatar
Guolin Ke committed
241
* \param train_data training data set
Guolin Ke's avatar
Guolin Ke committed
242
243
* \param parameters format: 'key1=value1 key2=value2'
* \param out handle of created Booster
wxchan's avatar
wxchan committed
244
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
245
*/
246
LIGHTGBM_C_EXPORT int LGBM_BoosterCreate(const DatasetHandle train_data,
Guolin Ke's avatar
Guolin Ke committed
247
248
249
250
  const char* parameters,
  BoosterHandle* out);

/*!
Guolin Ke's avatar
Guolin Ke committed
251
* \brief load an existing boosting from model file
Guolin Ke's avatar
Guolin Ke committed
252
* \param filename filename of model
wxchan's avatar
wxchan committed
253
* \param out_num_iterations number of iterations of this booster
Guolin Ke's avatar
Guolin Ke committed
254
* \param out handle of created Booster
wxchan's avatar
wxchan committed
255
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
256
*/
257
LIGHTGBM_C_EXPORT int LGBM_BoosterCreateFromModelfile(
Guolin Ke's avatar
Guolin Ke committed
258
  const char* filename,
Guolin Ke's avatar
Guolin Ke committed
259
  int* out_num_iterations,
Guolin Ke's avatar
Guolin Ke committed
260
261
  BoosterHandle* out);

262
263
264
265
266
267
268
269
270
271
272
/*!
* \brief load an existing boosting from string
* \param model_str model string
* \param out_num_iterations number of iterations of this booster
* \param out handle of created Booster
* \return 0 when succeed, -1 when failure happens
*/
LIGHTGBM_C_EXPORT int LGBM_BoosterLoadModelFromString(
  const char* model_str,
  int* out_num_iterations,
  BoosterHandle* out);
wxchan's avatar
wxchan committed
273

Guolin Ke's avatar
Guolin Ke committed
274
275
276
/*!
* \brief free obj in handle
* \param handle handle to be freed
wxchan's avatar
wxchan committed
277
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
278
*/
279
LIGHTGBM_C_EXPORT int LGBM_BoosterFree(BoosterHandle handle);
Guolin Ke's avatar
Guolin Ke committed
280

wxchan's avatar
wxchan committed
281
282
283
284
285
286
/*!
* \brief Merge model in two booster to first handle
* \param handle handle, will merge other handle to this
* \param other_handle
* \return 0 when succeed, -1 when failure happens
*/
287
LIGHTGBM_C_EXPORT int LGBM_BoosterMerge(BoosterHandle handle,
wxchan's avatar
wxchan committed
288
289
290
291
292
293
294
295
  BoosterHandle other_handle);

/*!
* \brief Add new validation to booster
* \param handle handle
* \param valid_data validation data set
* \return 0 when succeed, -1 when failure happens
*/
296
LIGHTGBM_C_EXPORT int LGBM_BoosterAddValidData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
297
  const DatasetHandle valid_data);
wxchan's avatar
wxchan committed
298
299
300
301
302
303
304

/*!
* \brief Reset training data for booster
* \param handle handle
* \param train_data training data set
* \return 0 when succeed, -1 when failure happens
*/
305
LIGHTGBM_C_EXPORT int LGBM_BoosterResetTrainingData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
306
  const DatasetHandle train_data);
wxchan's avatar
wxchan committed
307
308
309
310
311
312
313

/*!
* \brief Reset config for current booster
* \param handle handle
* \param parameters format: 'key1=value1 key2=value2'
* \return 0 when succeed, -1 when failure happens
*/
314
LIGHTGBM_C_EXPORT int LGBM_BoosterResetParameter(BoosterHandle handle, const char* parameters);
wxchan's avatar
wxchan committed
315
316

/*!
Guolin Ke's avatar
Guolin Ke committed
317
* \brief Get number of class
wxchan's avatar
wxchan committed
318
319
320
321
* \param handle handle
* \param out_len number of class
* \return 0 when succeed, -1 when failure happens
*/
322
LIGHTGBM_C_EXPORT int LGBM_BoosterGetNumClasses(BoosterHandle handle, int* out_len);
wxchan's avatar
wxchan committed
323

Guolin Ke's avatar
Guolin Ke committed
324
325
326
/*!
* \brief update the model in one round
* \param handle handle
Guolin Ke's avatar
Guolin Ke committed
327
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
328
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
329
*/
330
LIGHTGBM_C_EXPORT int LGBM_BoosterUpdateOneIter(BoosterHandle handle, int* is_finished);
Guolin Ke's avatar
Guolin Ke committed
331
332
333
334
335
336
337

/*!
* \brief update the model, by directly specify gradient and second order gradient,
*       this can be used to support customized loss function
* \param handle handle
* \param grad gradient statistics
* \param hess second order gradient statistics
Guolin Ke's avatar
Guolin Ke committed
338
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
339
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
340
*/
341
LIGHTGBM_C_EXPORT int LGBM_BoosterUpdateOneIterCustom(BoosterHandle handle,
342
343
  const float* grad,
  const float* hess,
Guolin Ke's avatar
Guolin Ke committed
344
345
346
  int* is_finished);

/*!
wxchan's avatar
wxchan committed
347
* \brief Rollback one iteration
Guolin Ke's avatar
Guolin Ke committed
348
* \param handle handle
wxchan's avatar
wxchan committed
349
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
350
*/
351
LIGHTGBM_C_EXPORT int LGBM_BoosterRollbackOneIter(BoosterHandle handle);
wxchan's avatar
wxchan committed
352
353
354
355
356
357

/*!
* \brief Get iteration of current boosting rounds
* \param out_iteration iteration of boosting rounds
* \return 0 when succeed, -1 when failure happens
*/
358
LIGHTGBM_C_EXPORT int LGBM_BoosterGetCurrentIteration(BoosterHandle handle, int* out_iteration);
Guolin Ke's avatar
Guolin Ke committed
359

Guolin Ke's avatar
Guolin Ke committed
360
/*!
Guolin Ke's avatar
Guolin Ke committed
361
* \brief Get number of eval
wxchan's avatar
wxchan committed
362
363
364
* \param out_len total number of eval results
* \return 0 when succeed, -1 when failure happens
*/
365
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEvalCounts(BoosterHandle handle, int* out_len);
wxchan's avatar
wxchan committed
366
367
368
369

/*!
* \brief Get Name of eval
* \param out_len total number of eval results
Guolin Ke's avatar
typo  
Guolin Ke committed
370
* \param out_strs names of eval result, need to pre-allocate memory before call this
wxchan's avatar
wxchan committed
371
372
* \return 0 when succeed, -1 when failure happens
*/
373
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEvalNames(BoosterHandle handle, int* out_len, char** out_strs);
wxchan's avatar
wxchan committed
374
375
376

/*!
* \brief get evaluation for training data and validation data
Guolin Ke's avatar
Guolin Ke committed
377
378
Note: 1. you should call LGBM_BoosterGetEvalNames first to get the name of evaluation results
2. should pre-allocate memory for out_results, you can get its length by LGBM_BoosterGetEvalCounts
Guolin Ke's avatar
Guolin Ke committed
379
* \param handle handle
wxchan's avatar
wxchan committed
380
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
381
* \param out_len len of output result
wxchan's avatar
wxchan committed
382
383
* \param out_results double array that receives the results
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
384
*/
385
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEval(BoosterHandle handle,
wxchan's avatar
wxchan committed
386
  int data_idx,
Guolin Ke's avatar
Guolin Ke committed
387
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
388
389
390
391
392
393
394
395
396
397
398
  double* out_results);

/*!
* \brief Get number of predict for inner dataset
this can be used to support customized eval function
Note:  should pre-allocate memory for out_result, its length is equal to num_class * num_data
* \param handle handle
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
* \param out_len len of output result
* \return 0 when succeed, -1 when failure happens
*/
399
LIGHTGBM_C_EXPORT int LGBM_BoosterGetNumPredict(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
400
401
  int data_idx,
  int64_t* out_len);
Guolin Ke's avatar
Guolin Ke committed
402

Guolin Ke's avatar
Guolin Ke committed
403
/*!
Guolin Ke's avatar
Guolin Ke committed
404
* \brief Get prediction for training data and validation data
Guolin Ke's avatar
Guolin Ke committed
405
406
this can be used to support customized eval function
Note:  should pre-allocate memory for out_result, its length is equal to num_class * num_data
Guolin Ke's avatar
Guolin Ke committed
407
* \param handle handle
wxchan's avatar
wxchan committed
408
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
409
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
410
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
411
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
412
*/
413
LIGHTGBM_C_EXPORT int LGBM_BoosterGetPredict(BoosterHandle handle,
wxchan's avatar
wxchan committed
414
  int data_idx,
415
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
416
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
417

418
419
420
421
/*!
* \brief make prediction for file
* \param handle handle
* \param data_filename filename of data file
wxchan's avatar
wxchan committed
422
423
424
425
426
427
* \param data_has_header data file has header or not
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
428
* \param result_filename filename of result file
wxchan's avatar
wxchan committed
429
* \return 0 when succeed, -1 when failure happens
430
*/
431
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForFile(BoosterHandle handle,
432
  const char* data_filename,
wxchan's avatar
wxchan committed
433
434
  int data_has_header,
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
435
  int num_iteration,
436
437
  const char* result_filename);

Guolin Ke's avatar
Guolin Ke committed
438
439
440
/*!
* \brief Get number of prediction
* \param handle handle
Guolin Ke's avatar
Guolin Ke committed
441
* \param num_row
Guolin Ke's avatar
Guolin Ke committed
442
443
444
445
446
447
448
449
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len length of prediction
* \return 0 when succeed, -1 when failure happens
*/
450
LIGHTGBM_C_EXPORT int LGBM_BoosterCalcNumPredict(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
451
  int num_row,
Guolin Ke's avatar
Guolin Ke committed
452
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
453
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
454
455
  int64_t* out_len);

Guolin Ke's avatar
Guolin Ke committed
456
457
/*!
* \brief make prediction for a new data set
Guolin Ke's avatar
Guolin Ke committed
458
*        Note:  should pre-allocate memory for out_result,
wxchan's avatar
wxchan committed
459
460
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
461
462
* \param handle handle
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
463
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
464
465
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
466
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
467
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
468
469
470
* \param nelem number of nonzero elements in the matrix
* \param num_col number of columns; when it's set to 0, then guess from data
* \param predict_type
wxchan's avatar
wxchan committed
471
472
473
474
475
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
476
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
477
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
478
*/
479
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForCSR(BoosterHandle handle,
480
481
  const void* indptr,
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
482
  const int32_t* indices,
483
  const void* data,
484
485
486
487
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
488
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
489
  int num_iteration,
wxchan's avatar
wxchan committed
490
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
  double* out_result);

/*!
* \brief make prediction for a new data set
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
* \param handle handle
* \param col_ptr pointer to col headers
* \param col_ptr_type type of col_ptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
* \param indices findex
* \param data fvalue
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param ncol_ptr number of cols in the matrix + 1
* \param nelem number of nonzero elements in the matrix
* \param num_row number of rows
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
* \param out_result used to set a pointer to array, should allocate memory before call this function
* \return 0 when succeed, -1 when failure happens
*/
516
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForCSC(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
517
518
519
520
521
522
523
524
525
  const void* col_ptr,
  int col_ptr_type,
  const int32_t* indices,
  const void* data,
  int data_type,
  int64_t ncol_ptr,
  int64_t nelem,
  int64_t num_row,
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
526
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
527
528
  int64_t* out_len,
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
529
530
531

/*!
* \brief make prediction for a new data set
wxchan's avatar
wxchan committed
532
533
534
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
535
536
* \param handle handle
* \param data pointer to the data space
wxchan's avatar
wxchan committed
537
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
538
539
* \param nrow number of rows
* \param ncol number of columns
Guolin Ke's avatar
Guolin Ke committed
540
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
541
* \param predict_type
wxchan's avatar
wxchan committed
542
543
544
545
546
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
547
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
548
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
549
*/
550
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForMat(BoosterHandle handle,
551
  const void* data,
552
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
553
554
  int32_t nrow,
  int32_t ncol,
Guolin Ke's avatar
Guolin Ke committed
555
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
556
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
557
  int num_iteration,
wxchan's avatar
wxchan committed
558
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
559
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
560
561
562
563

/*!
* \brief save model into file
* \param handle handle
wxchan's avatar
wxchan committed
564
* \param num_iteration number of iterations to save, <= 0 means save all
Guolin Ke's avatar
Guolin Ke committed
565
* \param filename file name
wxchan's avatar
wxchan committed
566
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
567
*/
568
LIGHTGBM_C_EXPORT int LGBM_BoosterSaveModel(BoosterHandle handle,
wxchan's avatar
wxchan committed
569
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
570
571
  const char* filename);

572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
/*!
* \brief save model to string
* \param handle handle
* \param num_iteration number of iterations to save, <= 0 means save all
* \param buffer_len string buffer length, if buffer_len < out_len, re-allocate buffer
* \param out_len actual output length
* \param out_str string of model, need to pre-allocate memory before call this
* \return 0 when succeed, -1 when failure happens
*/
LIGHTGBM_C_EXPORT int LGBM_BoosterSaveModelToString(BoosterHandle handle,
  int num_iteration,
  int buffer_len,
  int* out_len,
  char* out_str);

wxchan's avatar
wxchan committed
587
588
589
/*!
* \brief dump model to json
* \param handle handle
590
* \param num_iteration number of iterations to dump, <= 0 means save all
wxchan's avatar
wxchan committed
591
592
* \param buffer_len string buffer length, if buffer_len < out_len, re-allocate buffer
* \param out_len actual output length
Guolin Ke's avatar
typo  
Guolin Ke committed
593
* \param out_str json format string of model, need to pre-allocate memory before call this
wxchan's avatar
wxchan committed
594
595
* \return 0 when succeed, -1 when failure happens
*/
596
LIGHTGBM_C_EXPORT int LGBM_BoosterDumpModel(BoosterHandle handle,
597
  int num_iteration,
wxchan's avatar
wxchan committed
598
  int buffer_len,
Guolin Ke's avatar
Guolin Ke committed
599
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
600
  char* out_str);
601

Guolin Ke's avatar
Guolin Ke committed
602
/*!
Guolin Ke's avatar
Guolin Ke committed
603
* \brief Get leaf value
Guolin Ke's avatar
Guolin Ke committed
604
605
606
607
608
609
* \param handle handle
* \param tree_idx index of tree
* \param leaf_idx index of leaf
* \param out_val out result
* \return 0 when succeed, -1 when failure happens
*/
610
LIGHTGBM_C_EXPORT int LGBM_BoosterGetLeafValue(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
611
612
  int tree_idx,
  int leaf_idx,
Guolin Ke's avatar
Guolin Ke committed
613
  double* out_val);
Guolin Ke's avatar
Guolin Ke committed
614
615
616
617
618
619
620
621
622

/*!
* \brief Set leaf value
* \param handle handle
* \param tree_idx index of tree
* \param leaf_idx index of leaf
* \param val leaf value
* \return 0 when succeed, -1 when failure happens
*/
623
LIGHTGBM_C_EXPORT int LGBM_BoosterSetLeafValue(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
624
625
  int tree_idx,
  int leaf_idx,
Guolin Ke's avatar
Guolin Ke committed
626
  double val);
627

wxchan's avatar
wxchan committed
628
// exception handle and error msg

/*! \brief size in bytes of the per-thread error buffer, terminating NUL included */
enum { LGBM_LAST_ERROR_BUF_LEN = 512 };

/*!
* \brief access the thread-local buffer that holds the last error message
*        Note: the function is `static`, so every translation unit that includes
*              this header gets its own copy of the function and of the buffer.
* \return pointer to a writable buffer of LGBM_LAST_ERROR_BUF_LEN bytes,
*         initialised to "Everything is fine"
*/
#if defined(_MSC_VER)
static char* LastErrorMsg() { static __declspec(thread) char err_msg[LGBM_LAST_ERROR_BUF_LEN] = "Everything is fine"; return err_msg; }
#else
static char* LastErrorMsg() { static thread_local char err_msg[LGBM_LAST_ERROR_BUF_LEN] = "Everything is fine"; return err_msg; }
#endif

/*!
* \brief store msg as the last error message of the calling thread
*        Messages longer than LGBM_LAST_ERROR_BUF_LEN - 1 characters are truncated
*        instead of being written past the end of the buffer.
* \param msg NUL-terminated message text
*/
inline void LGBM_SetLastError(const char* msg) {
  char* buf = LastErrorMsg();
  const std::size_t max_len = static_cast<std::size_t>(LGBM_LAST_ERROR_BUF_LEN) - 1;
  std::size_t len = std::strlen(msg);
  if (len > max_len) {
    len = max_len;
  }
  // memmove rather than memcpy: stays well-defined even if msg points into buf
  std::memmove(buf, msg, len);
  buf[len] = '\0';
}

/*!
* \brief record the text of a caught std::exception as the last error
* \param ex exception whose what() text is passed to LGBM_SetLastError
* \return always -1
*/
inline int LGBM_APIHandleException(const std::exception& ex) {
  const char* what_text = ex.what();
  LGBM_SetLastError(what_text);
  return -1;
}
/*!
* \brief record a caught std::string as the last error
* \param ex string whose contents are passed to LGBM_SetLastError
* \return always -1
*/
inline int LGBM_APIHandleException(const std::string& ex) {
  const char* text = ex.c_str();
  LGBM_SetLastError(text);
  return -1;
}

/*!
* \brief opens the try block of an API function body; must be closed by API_END()
*/
#define API_BEGIN() try {

/*!
* \brief closes the try block opened by API_BEGIN()
*        A std::exception or std::string thrown inside the block is forwarded to
*        LGBM_APIHandleException and its result is returned; any other exception is
*        reported as "unknown exception". When nothing is thrown the enclosing
*        function returns 0.
*/
#define API_END() } \
catch(const std::exception& ex) { return LGBM_APIHandleException(ex); } \
catch(const std::string& ex) { return LGBM_APIHandleException(ex); } \
catch(...) { return LGBM_APIHandleException("unknown exception"); } \
return 0;
655

Guolin Ke's avatar
Guolin Ke committed
656
#endif // LIGHTGBM_C_API_H_