c_api.h 24.7 KB
Newer Older
Guolin Ke's avatar
Guolin Ke committed
1
2
#ifndef LIGHTGBM_C_API_H_
#define LIGHTGBM_C_API_H_
3
4
5
#include <cstdint>
#include <exception>
#include <stdexcept>
wxchan's avatar
wxchan committed
6
#include <cstring>
7
#include <string>
wxchan's avatar
wxchan committed
8

9
10
11
/*!
* To avoid type conversion on large data, most of our exposed interfaces support both float_32 and float_64.
* Except following:
wxchan's avatar
wxchan committed
12
* 1. gradients and hessians.
13
* 2. Get current score for training data and validation
wxchan's avatar
wxchan committed
14
* The reason is that they are called frequently, so type conversion on them may be costly.
15
16
*/

17
#include <LightGBM/export.h>
Guolin Ke's avatar
Guolin Ke committed
18

Guolin Ke's avatar
typo  
Guolin Ke committed
19
typedef void* DatasetHandle;
Guolin Ke's avatar
Guolin Ke committed
20
21
typedef void* BoosterHandle;

Guolin Ke's avatar
Guolin Ke committed
22
23
24
25
26
27
28
29
#define C_API_DTYPE_FLOAT32 (0)
#define C_API_DTYPE_FLOAT64 (1)
#define C_API_DTYPE_INT32   (2)
#define C_API_DTYPE_INT64   (3)

#define C_API_PREDICT_NORMAL     (0)
#define C_API_PREDICT_RAW_SCORE  (1)
#define C_API_PREDICT_LEAF_INDEX (2)
30

Guolin Ke's avatar
Guolin Ke committed
31
32
/*!
* \brief get string message of the last error
wxchan's avatar
wxchan committed
33
*  all functions in this file return 0 on success
Guolin Ke's avatar
Guolin Ke committed
34
35
36
*  and -1 when an error occurred,
* \return const char* error information
*/
37
LIGHTGBM_C_EXPORT const char* LGBM_GetLastError();
Guolin Ke's avatar
Guolin Ke committed
38
39


Guolin Ke's avatar
Guolin Ke committed
40
// --- start Dataset interface
Guolin Ke's avatar
Guolin Ke committed
41
42
43
44

/*!
* \brief load a dataset from file, the same way the command-line LightGBM does
* \param filename the name of the file
Guolin Ke's avatar
Guolin Ke committed
45
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
46
47
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out a loaded dataset
wxchan's avatar
wxchan committed
48
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
49
*/
50
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromFile(const char* filename,
Guolin Ke's avatar
Guolin Ke committed
51
  const char* parameters,
52
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
53
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
54

Guolin Ke's avatar
Guolin Ke committed
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135

/*!
* \brief create an empty dataset from sampled rows given in CSR format.
*        If the number of sampled rows equals num_total_row, the dataset is constructed as well.
* \param indptr pointer to row headers
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
* \param indices feature indices of the nonzero elements (findex)
* \param data values of the nonzero elements (fvalue)
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param nindptr number of rows in the sampled matrix + 1
* \param n_sample_elem number of nonzero elements in the sampled matrix
* \param num_col number of columns
* \param num_total_row total number of rows of the dataset being created
* \param parameters additional parameters
* \param out created dataset
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromSampledCSR(const void* indptr,
  int indptr_type,
  const int32_t* indices,
  const void* data,
  int data_type,
  int64_t nindptr,
  int64_t n_sample_elem,
  int64_t num_col,
  int64_t num_total_row,
  const char* parameters,
  DatasetHandle* out);

/*!
* \brief create an empty dataset aligned with a reference Dataset
* \param reference dataset used to align the bin mapper
* \param num_total_row total number of rows
* \param out created dataset
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateByReference(const DatasetHandle reference,
  int64_t num_total_row,
  DatasetHandle* out);

/*!
* \brief push rows of data into an existing dataset;
*        when nrow + start_row == num_total_row, dataset->FinishLoad is called
* \note NOTE(review): the memory layout of data (row major vs. column major) is not
*       stated in this header - confirm against the implementation.
* \param dataset handle of dataset
* \param data pointer to the data space
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param nrow number of rows
* \param ncol number of columns
* \param start_row row start index
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_DatasetPushRows(DatasetHandle dataset,
  const void* data,
  int data_type,
  int32_t nrow,
  int32_t ncol,
  int32_t start_row);

/*!
* \brief push rows given in CSR format into an existing dataset;
*        when nrow + start_row == num_total_row, dataset->FinishLoad is called
*        (nrow is not a parameter here; per the nindptr description it is nindptr - 1)
* \param dataset handle of dataset
* \param indptr pointer to row headers
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
* \param indices feature indices of the nonzero elements (findex)
* \param data values of the nonzero elements (fvalue)
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param nindptr number of rows in the matrix + 1
* \param nelem number of nonzero elements in the matrix
* \param num_col number of columns
* \param start_row row start index
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_DatasetPushRowsByCSR(DatasetHandle dataset,
  const void* indptr,
  int indptr_type,
  const int32_t* indices,
  const void* data,
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
  int64_t start_row);

Guolin Ke's avatar
Guolin Ke committed
136
137
138
/*!
* \brief create a dataset from CSR format
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
139
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
140
141
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
142
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
143
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
144
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
145
* \param num_col number of columns
Guolin Ke's avatar
Guolin Ke committed
146
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
147
148
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
149
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
150
*/
151
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromCSR(const void* indptr,
152
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
153
  const int32_t* indices,
154
  const void* data,
155
156
157
158
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
159
  const char* parameters,
160
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
161
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
162
163
164
165

/*!
* \brief create a dataset from CSC format
* \param col_ptr pointer to col headers
wxchan's avatar
wxchan committed
166
* \param col_ptr_type type of col_ptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
167
168
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
169
170
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param ncol_ptr number of cols in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
171
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
172
* \param num_row number of rows
Guolin Ke's avatar
Guolin Ke committed
173
174
175
* \param parameters additional parameters
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
176
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
177
*/
178
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromCSC(const void* col_ptr,
179
  int col_ptr_type,
Guolin Ke's avatar
Guolin Ke committed
180
181
  const int32_t* indices,
  const void* data,
182
183
184
185
  int data_type,
  int64_t ncol_ptr,
  int64_t nelem,
  int64_t num_row,
Guolin Ke's avatar
Guolin Ke committed
186
  const char* parameters,
187
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
188
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
189
190
191
192

/*!
* \brief create dataset from dense matrix
* \param data pointer to the data space
wxchan's avatar
wxchan committed
193
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
194
195
* \param nrow number of rows
* \param ncol number of columns
196
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
197
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
198
199
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
200
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
201
*/
202
LIGHTGBM_C_EXPORT int LGBM_DatasetCreateFromMat(const void* data,
203
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
204
205
  int32_t nrow,
  int32_t ncol,
206
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
207
  const char* parameters,
208
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
209
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
210

wxchan's avatar
wxchan committed
211
212
213
214
215
216
217
218
219
/*!
* \brief Create subset of a data
* \param handle handle of full dataset
* \param used_row_indices Indices used in subset
* \param num_used_row_indices len of used_row_indices
* \param parameters additional parameters
* \param out subset of data
* \return 0 when succeed, -1 when failure happens
*/
220
LIGHTGBM_C_EXPORT int LGBM_DatasetGetSubset(
221
  const DatasetHandle handle,
wxchan's avatar
wxchan committed
222
223
224
  const int32_t* used_row_indices,
  int32_t num_used_row_indices,
  const char* parameters,
Guolin Ke's avatar
typo  
Guolin Ke committed
225
  DatasetHandle* out);
wxchan's avatar
wxchan committed
226

Guolin Ke's avatar
Guolin Ke committed
227
228
229
230
231
232
233
/*!
* \brief save feature names to Dataset
* \param handle handle
* \param feature_names feature names
* \param num_feature_names number of feature names
* \return 0 when succeed, -1 when failure happens
*/
234
LIGHTGBM_C_EXPORT int LGBM_DatasetSetFeatureNames(
Guolin Ke's avatar
typo  
Guolin Ke committed
235
  DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
236
  const char** feature_names,
Guolin Ke's avatar
Guolin Ke committed
237
  int num_feature_names);
Guolin Ke's avatar
Guolin Ke committed
238

239
240
241
242
243
244
245
246

/*!
* \brief get feature names of Dataset
* \param handle handle
* \param feature_names feature names, should pre-allocate memory
* \param num_feature_names number of feature names
* \return 0 when succeed, -1 when failure happens
*/
247
LIGHTGBM_C_EXPORT int LGBM_DatasetGetFeatureNames(
248
249
  DatasetHandle handle,
  char** feature_names,
Guolin Ke's avatar
Guolin Ke committed
250
  int* num_feature_names);
251
252


Guolin Ke's avatar
Guolin Ke committed
253
254
/*!
* \brief free space for dataset
wxchan's avatar
wxchan committed
255
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
256
*/
257
LIGHTGBM_C_EXPORT int LGBM_DatasetFree(DatasetHandle handle);
Guolin Ke's avatar
Guolin Ke committed
258
259
260
261
262

/*!
* \brief save dataset to binary file
* \param handle an instance of dataset
* \param filename file name
wxchan's avatar
wxchan committed
263
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
264
*/
265
LIGHTGBM_C_EXPORT int LGBM_DatasetSaveBinary(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
266
267
268
269
  const char* filename);

/*!
* \brief set vector to a content in info
wxchan's avatar
wxchan committed
270
271
*        Note: group and group_id only work for C_API_DTYPE_INT32
*              label and weight only work for C_API_DTYPE_FLOAT32
Guolin Ke's avatar
Guolin Ke committed
272
* \param handle a instance of dataset
wxchan's avatar
wxchan committed
273
* \param field_name field name, can be label, weight, group, group_id
274
* \param field_data pointer to vector
Guolin Ke's avatar
Guolin Ke committed
275
* \param num_element number of element in field_data
wxchan's avatar
wxchan committed
276
277
* \param type C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
278
*/
279
LIGHTGBM_C_EXPORT int LGBM_DatasetSetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
280
281
  const char* field_name,
  const void* field_data,
Guolin Ke's avatar
Guolin Ke committed
282
  int num_element,
Guolin Ke's avatar
Guolin Ke committed
283
284
285
  int type);

/*!
286
* \brief get info vector from dataset
Guolin Ke's avatar
Guolin Ke committed
287
288
289
290
* \param handle a instance of data matrix
* \param field_name field name
* \param out_len used to set result length
* \param out_ptr pointer to the result
wxchan's avatar
wxchan committed
291
292
* \param out_type  C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
293
*/
294
LIGHTGBM_C_EXPORT int LGBM_DatasetGetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
295
  const char* field_name,
Guolin Ke's avatar
Guolin Ke committed
296
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
297
298
299
300
301
302
303
  const void** out_ptr,
  int* out_type);

/*!
* \brief get number of data.
* \param handle the handle to the dataset
* \param out The address to hold number of data
wxchan's avatar
wxchan committed
304
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
305
*/
306
LIGHTGBM_C_EXPORT int LGBM_DatasetGetNumData(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
307
  int* out);
Guolin Ke's avatar
Guolin Ke committed
308
309
310
311
312

/*!
* \brief get number of features
* \param handle the handle to the dataset
* \param out The output of number of features
wxchan's avatar
wxchan committed
313
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
314
*/
315
LIGHTGBM_C_EXPORT int LGBM_DatasetGetNumFeature(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
316
  int* out);
Guolin Ke's avatar
Guolin Ke committed
317
318
319
320
321

// --- start Booster interfaces

/*!
* \brief create a new boosting learner
Guolin Ke's avatar
Guolin Ke committed
322
* \param train_data training data set
Guolin Ke's avatar
Guolin Ke committed
323
324
* \param parameters format: 'key1=value1 key2=value2'
* \param out handle of created Booster
wxchan's avatar
wxchan committed
325
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
326
*/
327
LIGHTGBM_C_EXPORT int LGBM_BoosterCreate(const DatasetHandle train_data,
Guolin Ke's avatar
Guolin Ke committed
328
329
330
331
  const char* parameters,
  BoosterHandle* out);

/*!
Guolin Ke's avatar
Guolin Ke committed
332
* \brief load an existing boosting from model file
Guolin Ke's avatar
Guolin Ke committed
333
* \param filename filename of model
wxchan's avatar
wxchan committed
334
* \param out_num_iterations number of iterations of this booster
Guolin Ke's avatar
Guolin Ke committed
335
* \param out handle of created Booster
wxchan's avatar
wxchan committed
336
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
337
*/
338
LIGHTGBM_C_EXPORT int LGBM_BoosterCreateFromModelfile(
Guolin Ke's avatar
Guolin Ke committed
339
  const char* filename,
Guolin Ke's avatar
Guolin Ke committed
340
  int* out_num_iterations,
Guolin Ke's avatar
Guolin Ke committed
341
342
  BoosterHandle* out);

343
344
345
346
347
348
349
350
351
352
353
/*!
* \brief load an existing booster from a model string
* \param model_str model string
* \param out_num_iterations number of iterations of this booster
* \param out handle of created Booster
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_BoosterLoadModelFromString(
  const char* model_str,
  int* out_num_iterations,
  BoosterHandle* out);
wxchan's avatar
wxchan committed
354

Guolin Ke's avatar
Guolin Ke committed
355
356
357
/*!
* \brief free obj in handle
* \param handle handle to be freed
wxchan's avatar
wxchan committed
358
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
359
*/
360
LIGHTGBM_C_EXPORT int LGBM_BoosterFree(BoosterHandle handle);
Guolin Ke's avatar
Guolin Ke committed
361

wxchan's avatar
wxchan committed
362
363
364
365
366
367
/*!
* \brief Merge the model of another booster into the first handle
* \param handle handle, will merge other handle to this
* \param other_handle handle of the booster that is merged into handle
* \return 0 when succeed, -1 when failure happens
*/
368
LIGHTGBM_C_EXPORT int LGBM_BoosterMerge(BoosterHandle handle,
wxchan's avatar
wxchan committed
369
370
371
372
373
374
375
376
  BoosterHandle other_handle);

/*!
* \brief Add new validation to booster
* \param handle handle
* \param valid_data validation data set
* \return 0 when succeed, -1 when failure happens
*/
377
LIGHTGBM_C_EXPORT int LGBM_BoosterAddValidData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
378
  const DatasetHandle valid_data);
wxchan's avatar
wxchan committed
379
380
381
382
383
384
385

/*!
* \brief Reset training data for booster
* \param handle handle
* \param train_data training data set
* \return 0 when succeed, -1 when failure happens
*/
386
LIGHTGBM_C_EXPORT int LGBM_BoosterResetTrainingData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
387
  const DatasetHandle train_data);
wxchan's avatar
wxchan committed
388
389
390
391
392
393
394

/*!
* \brief Reset config for current booster
* \param handle handle
* \param parameters format: 'key1=value1 key2=value2'
* \return 0 when succeed, -1 when failure happens
*/
395
LIGHTGBM_C_EXPORT int LGBM_BoosterResetParameter(BoosterHandle handle, const char* parameters);
wxchan's avatar
wxchan committed
396
397

/*!
Guolin Ke's avatar
Guolin Ke committed
398
* \brief Get number of class
wxchan's avatar
wxchan committed
399
400
401
402
* \param handle handle
* \param out_len number of class
* \return 0 when succeed, -1 when failure happens
*/
403
LIGHTGBM_C_EXPORT int LGBM_BoosterGetNumClasses(BoosterHandle handle, int* out_len);
wxchan's avatar
wxchan committed
404

Guolin Ke's avatar
Guolin Ke committed
405
406
407
/*!
* \brief update the model in one round
* \param handle handle
Guolin Ke's avatar
Guolin Ke committed
408
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
409
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
410
*/
411
LIGHTGBM_C_EXPORT int LGBM_BoosterUpdateOneIter(BoosterHandle handle, int* is_finished);
Guolin Ke's avatar
Guolin Ke committed
412
413
414
415
416
417
418

/*!
* \brief update the model, by directly specify gradient and second order gradient,
*       this can be used to support customized loss function
* \param handle handle
* \param grad gradient statistics
* \param hess second order gradient statistics
Guolin Ke's avatar
Guolin Ke committed
419
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
420
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
421
*/
422
LIGHTGBM_C_EXPORT int LGBM_BoosterUpdateOneIterCustom(BoosterHandle handle,
423
424
  const float* grad,
  const float* hess,
Guolin Ke's avatar
Guolin Ke committed
425
426
427
  int* is_finished);

/*!
wxchan's avatar
wxchan committed
428
* \brief Rollback one iteration
Guolin Ke's avatar
Guolin Ke committed
429
* \param handle handle
wxchan's avatar
wxchan committed
430
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
431
*/
432
LIGHTGBM_C_EXPORT int LGBM_BoosterRollbackOneIter(BoosterHandle handle);
wxchan's avatar
wxchan committed
433
434
435
436
437
438

/*!
* \brief Get iteration of current boosting rounds
* \param out_iteration iteration of boosting rounds
* \return 0 when succeed, -1 when failure happens
*/
439
LIGHTGBM_C_EXPORT int LGBM_BoosterGetCurrentIteration(BoosterHandle handle, int* out_iteration);
Guolin Ke's avatar
Guolin Ke committed
440

Guolin Ke's avatar
Guolin Ke committed
441
/*!
Guolin Ke's avatar
Guolin Ke committed
442
* \brief Get number of eval
wxchan's avatar
wxchan committed
443
444
445
* \param out_len total number of eval results
* \return 0 when succeed, -1 when failure happens
*/
446
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEvalCounts(BoosterHandle handle, int* out_len);
wxchan's avatar
wxchan committed
447
448

/*!
wxchan's avatar
wxchan committed
449
* \brief Get name of eval
wxchan's avatar
wxchan committed
450
* \param out_len total number of eval results
Guolin Ke's avatar
typo  
Guolin Ke committed
451
* \param out_strs names of eval result, need to pre-allocate memory before call this
wxchan's avatar
wxchan committed
452
453
* \return 0 when succeed, -1 when failure happens
*/
454
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEvalNames(BoosterHandle handle, int* out_len, char** out_strs);
wxchan's avatar
wxchan committed
455

wxchan's avatar
wxchan committed
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
/*!
* \brief Get names of features
* \param handle handle of the booster
* \param out_len total number of features
* \param out_strs names of features; memory must be pre-allocated before calling this
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_BoosterGetFeatureNames(BoosterHandle handle, int* out_len, char** out_strs);

/*!
* \brief Get number of features
* \param handle handle of the booster
* \param out_len total number of features
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_BoosterGetNumFeature(BoosterHandle handle, int* out_len);

wxchan's avatar
wxchan committed
471
472
/*!
* \brief get evaluation for training data and validation data
Guolin Ke's avatar
Guolin Ke committed
473
474
Note: 1. you should call LGBM_BoosterGetEvalNames first to get the name of evaluation results
2. should pre-allocate memory for out_results, you can get its length by LGBM_BoosterGetEvalCounts
Guolin Ke's avatar
Guolin Ke committed
475
* \param handle handle
wxchan's avatar
wxchan committed
476
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
477
* \param out_len len of output result
wxchan's avatar
wxchan committed
478
479
* \param out_results double array that receives the results
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
480
*/
481
LIGHTGBM_C_EXPORT int LGBM_BoosterGetEval(BoosterHandle handle,
wxchan's avatar
wxchan committed
482
  int data_idx,
Guolin Ke's avatar
Guolin Ke committed
483
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
484
485
486
487
488
489
490
491
492
493
494
  double* out_results);

/*!
* \brief Get number of predictions for inner dataset
this can be used to support customized eval function
Note:  should pre-allocate memory for out_result, its length is equal to num_class * num_data
* \param handle handle
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
* \param out_len len of output result
* \return 0 when succeed, -1 when failure happens
*/
495
LIGHTGBM_C_EXPORT int LGBM_BoosterGetNumPredict(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
496
497
  int data_idx,
  int64_t* out_len);
Guolin Ke's avatar
Guolin Ke committed
498

Guolin Ke's avatar
Guolin Ke committed
499
/*!
Guolin Ke's avatar
Guolin Ke committed
500
* \brief Get prediction for training data and validation data
Guolin Ke's avatar
Guolin Ke committed
501
502
this can be used to support customized eval function
Note:  should pre-allocate memory for out_result, its length is equal to num_class * num_data
Guolin Ke's avatar
Guolin Ke committed
503
* \param handle handle
wxchan's avatar
wxchan committed
504
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
505
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
506
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
507
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
508
*/
509
LIGHTGBM_C_EXPORT int LGBM_BoosterGetPredict(BoosterHandle handle,
wxchan's avatar
wxchan committed
510
  int data_idx,
511
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
512
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
513

514
515
516
517
/*!
* \brief make prediction for file
* \param handle handle
* \param data_filename filename of data file
wxchan's avatar
wxchan committed
518
519
520
521
522
523
* \param data_has_header data file has header or not
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
524
* \param result_filename filename of result file
wxchan's avatar
wxchan committed
525
* \return 0 when succeed, -1 when failure happens
526
*/
527
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForFile(BoosterHandle handle,
528
  const char* data_filename,
wxchan's avatar
wxchan committed
529
530
  int data_has_header,
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
531
  int num_iteration,
532
533
  const char* result_filename);

Guolin Ke's avatar
Guolin Ke committed
534
535
536
/*!
* \brief Get number of prediction
* \param handle handle
Guolin Ke's avatar
Guolin Ke committed
537
* \param num_row
Guolin Ke's avatar
Guolin Ke committed
538
539
540
541
542
543
544
545
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len length of prediction
* \return 0 when succeed, -1 when failure happens
*/
546
LIGHTGBM_C_EXPORT int LGBM_BoosterCalcNumPredict(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
547
  int num_row,
Guolin Ke's avatar
Guolin Ke committed
548
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
549
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
550
551
  int64_t* out_len);

Guolin Ke's avatar
Guolin Ke committed
552
553
/*!
* \brief make prediction for a new data set
Guolin Ke's avatar
Guolin Ke committed
554
*        Note:  should pre-allocate memory for out_result,
wxchan's avatar
wxchan committed
555
556
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
557
558
* \param handle handle
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
559
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
560
561
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
562
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
563
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
564
565
566
* \param nelem number of nonzero elements in the matrix
* \param num_col number of columns; when it's set to 0, then guess from data
* \param predict_type
wxchan's avatar
wxchan committed
567
568
569
570
571
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
572
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
573
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
574
*/
575
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForCSR(BoosterHandle handle,
576
577
  const void* indptr,
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
578
  const int32_t* indices,
579
  const void* data,
580
581
582
583
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
584
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
585
  int num_iteration,
wxchan's avatar
wxchan committed
586
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
  double* out_result);

/*!
* \brief make prediction for a new data set
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
* \param handle handle
* \param col_ptr pointer to col headers
* \param col_ptr_type type of col_ptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
* \param indices findex
* \param data fvalue
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param ncol_ptr number of cols in the matrix + 1
* \param nelem number of nonzero elements in the matrix
* \param num_row number of rows
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
* \param out_result used to set a pointer to array, should allocate memory before call this function
* \return 0 when succeed, -1 when failure happens
*/
612
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForCSC(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
613
614
615
616
617
618
619
620
621
  const void* col_ptr,
  int col_ptr_type,
  const int32_t* indices,
  const void* data,
  int data_type,
  int64_t ncol_ptr,
  int64_t nelem,
  int64_t num_row,
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
622
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
623
624
  int64_t* out_len,
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
625
626
627

/*!
* \brief make prediction for a new data set
wxchan's avatar
wxchan committed
628
629
630
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
631
632
* \param handle handle
* \param data pointer to the data space
wxchan's avatar
wxchan committed
633
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
634
635
* \param nrow number of rows
* \param ncol number columns
Guolin Ke's avatar
Guolin Ke committed
636
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
637
* \param predict_type
wxchan's avatar
wxchan committed
638
639
640
641
642
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
643
* \param out_result used to set a pointer to array, should allocate memory before call this function
wxchan's avatar
wxchan committed
644
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
645
*/
646
LIGHTGBM_C_EXPORT int LGBM_BoosterPredictForMat(BoosterHandle handle,
647
  const void* data,
648
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
649
650
  int32_t nrow,
  int32_t ncol,
Guolin Ke's avatar
Guolin Ke committed
651
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
652
  int predict_type,
Guolin Ke's avatar
Guolin Ke committed
653
  int num_iteration,
wxchan's avatar
wxchan committed
654
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
655
  double* out_result);
Guolin Ke's avatar
Guolin Ke committed
656
657
658
659

/*!
* \brief save model into file
* \param handle handle
wxchan's avatar
wxchan committed
660
* \param num_iteration, <= 0 means save all
Guolin Ke's avatar
Guolin Ke committed
661
* \param filename file name
wxchan's avatar
wxchan committed
662
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
663
*/
664
LIGHTGBM_C_EXPORT int LGBM_BoosterSaveModel(BoosterHandle handle,
wxchan's avatar
wxchan committed
665
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
666
667
  const char* filename);

668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
/*!
* \brief Save the model to a string
* \param handle booster handle
* \param num_iteration iteration limit, <= 0 means save all
* \param buffer_len length of the string buffer; if buffer_len < out_len the buffer has to be re-allocated
* \param out_len actual output length
* \param out_str string of the model; its memory must be pre-allocated before calling this function
* \return 0 on success, -1 on failure
*/
LIGHTGBM_C_EXPORT int LGBM_BoosterSaveModelToString(
    BoosterHandle handle,
    int num_iteration,
    int buffer_len,
    int* out_len,
    char* out_str);

wxchan's avatar
wxchan committed
683
684
685
/*!
* \brief dump model to json
* \param handle handle
686
* \param num_iteration, <= 0 means save all
wxchan's avatar
wxchan committed
687
688
* \param buffer_len string buffer length, if buffer_len < out_len, re-allocate buffer
* \param out_len actual output length
Guolin Ke's avatar
typo  
Guolin Ke committed
689
* \param out_str json format string of model, need to pre-allocate memory before call this
wxchan's avatar
wxchan committed
690
691
* \return 0 when succeed, -1 when failure happens
*/
692
LIGHTGBM_C_EXPORT int LGBM_BoosterDumpModel(BoosterHandle handle,
693
  int num_iteration,
wxchan's avatar
wxchan committed
694
  int buffer_len,
Guolin Ke's avatar
Guolin Ke committed
695
  int* out_len,
Guolin Ke's avatar
Guolin Ke committed
696
  char* out_str);
697

Guolin Ke's avatar
Guolin Ke committed
698
/*!
Guolin Ke's avatar
Guolin Ke committed
699
* \brief Get leaf value
Guolin Ke's avatar
Guolin Ke committed
700
701
702
703
704
705
* \param handle handle
* \param tree_idx index of tree
* \param leaf_idx index of leaf
* \param out_val out result
* \return 0 when succeed, -1 when failure happens
*/
706
LIGHTGBM_C_EXPORT int LGBM_BoosterGetLeafValue(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
707
708
  int tree_idx,
  int leaf_idx,
Guolin Ke's avatar
Guolin Ke committed
709
  double* out_val);
Guolin Ke's avatar
Guolin Ke committed
710
711
712
713
714
715
716
717
718

/*!
* \brief Set leaf value
* \param handle handle
* \param tree_idx index of tree
* \param leaf_idx index of leaf
* \param val leaf value
* \return 0 when succeed, -1 when failure happens
*/
719
LIGHTGBM_C_EXPORT int LGBM_BoosterSetLeafValue(BoosterHandle handle,
Guolin Ke's avatar
Guolin Ke committed
720
721
  int tree_idx,
  int leaf_idx,
Guolin Ke's avatar
Guolin Ke committed
722
  double val);
723

wxchan's avatar
wxchan committed
724
// exception handle and error msg
//
// LastErrorMsg() returns a pointer to a 512-byte, thread-local character
// buffer that holds the last error message; the buffer initially contains
// "Everything is fine". MSVC builds use __declspec(thread), all other
// compilers use thread_local.
// NOTE(review): the function is `static`, so each translation unit that
// includes this header gets its own buffer -- confirm this is intended.
#if defined(_MSC_VER)
static char* LastErrorMsg() {
  static __declspec(thread) char err_msg[512] = "Everything is fine";
  return err_msg;
}
#else
static char* LastErrorMsg() {
  static thread_local char err_msg[512] = "Everything is fine";
  return err_msg;
}
#endif
730
731

inline void LGBM_SetLastError(const char* msg) {
wxchan's avatar
wxchan committed
732
  std::strcpy(LastErrorMsg(), msg);
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
}

/*!
* \brief Record the message of a std::exception as the last error
* \param ex exception whose what() text is stored
* \return always -1
*/
inline int LGBM_APIHandleException(const std::exception& ex) {
  const char* what = ex.what();
  LGBM_SetLastError(what);
  return -1;
}
/*!
* \brief Record a string as the last error
* \param ex error text to store
* \return always -1
*/
inline int LGBM_APIHandleException(const std::string& ex) {
  const char* text = ex.c_str();
  LGBM_SetLastError(text);
  return -1;
}

// API_BEGIN() opens a try block; it must be paired with API_END().
#define API_BEGIN() try {

// API_END() closes the try block opened by API_BEGIN(). A caught
// std::exception, std::string or any other exception is passed to
// LGBM_APIHandleException and its result is returned; when nothing was
// thrown the enclosing function returns 0.
#define API_END() } \
  catch(std::exception& err) { return LGBM_APIHandleException(err); } \
  catch(std::string& err) { return LGBM_APIHandleException(err); } \
  catch(...) { return LGBM_APIHandleException("unknown exception"); } \
  return 0;
751

Guolin Ke's avatar
Guolin Ke committed
752
#endif // LIGHTGBM_C_API_H_