c_api.h 17.9 KB
Newer Older
Guolin Ke's avatar
Guolin Ke committed
1
2
#ifndef LIGHTGBM_C_API_H_
#define LIGHTGBM_C_API_H_
3
4
5
#include <cstdint>
#include <exception>
#include <stdexcept>
wxchan's avatar
wxchan committed
6
#include <cstring>
7
#include <string>
wxchan's avatar
wxchan committed
8

9
10
11
/*!
* To avoid type conversion on large data, most of our exposed interfaces support both float_32 and float_64.
* Except the following:
wxchan's avatar
wxchan committed
12
* 1. gradients and hessians.
13
* 2. Get current score for training data and validation data
wxchan's avatar
wxchan committed
14
* The reason is that they are called frequently, so type conversion on them may be time-consuming.
15
16
*/

Guolin Ke's avatar
Guolin Ke committed
17
18
19
20
21
22
23
24
25
26
27
28
#ifdef __cplusplus
#define DLL_EXTERN_C extern "C"
#else
#define DLL_EXTERN_C
#endif

#ifdef _MSC_VER
#define DllExport DLL_EXTERN_C __declspec(dllexport)
#else
#define DllExport DLL_EXTERN_C
#endif

Guolin Ke's avatar
typo  
Guolin Ke committed
29
typedef void* DatasetHandle;
Guolin Ke's avatar
Guolin Ke committed
30
31
typedef void* BoosterHandle;

Guolin Ke's avatar
Guolin Ke committed
32
33
34
35
36
37
38
39
#define C_API_DTYPE_FLOAT32 (0)
#define C_API_DTYPE_FLOAT64 (1)
#define C_API_DTYPE_INT32   (2)
#define C_API_DTYPE_INT64   (3)

#define C_API_PREDICT_NORMAL     (0)
#define C_API_PREDICT_RAW_SCORE  (1)
#define C_API_PREDICT_LEAF_INDEX (2)
40

Guolin Ke's avatar
Guolin Ke committed
41
42
/*!
* \brief get string message of the last error
wxchan's avatar
wxchan committed
43
*  all functions in this file will return 0 when they succeed
Guolin Ke's avatar
Guolin Ke committed
44
45
46
47
48
49
*  and -1 when an error occurred,
* \return const char* error information
*/
DllExport const char* LGBM_GetLastError();


Guolin Ke's avatar
Guolin Ke committed
50
// --- start Dataset interface
Guolin Ke's avatar
Guolin Ke committed
51
52
53
54

/*!
* \brief load a dataset from a file, like the command-line LightGBM does
* \param filename the name of the file
Guolin Ke's avatar
Guolin Ke committed
55
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
56
57
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out a loaded dataset
wxchan's avatar
wxchan committed
58
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
59
*/
wxchan's avatar
wxchan committed
60
DllExport int LGBM_DatasetCreateFromFile(const char* filename,
Guolin Ke's avatar
Guolin Ke committed
61
  const char* parameters,
62
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
63
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
64
65
66
67

/*!
* \brief create a dataset from CSR format
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
68
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
69
70
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
71
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
72
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
73
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
74
* \param num_col number of columns
Guolin Ke's avatar
Guolin Ke committed
75
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
76
77
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
78
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
79
*/
wxchan's avatar
wxchan committed
80
DllExport int LGBM_DatasetCreateFromCSR(const void* indptr,
81
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
82
  const int32_t* indices,
83
  const void* data,
84
85
86
87
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
88
  const char* parameters,
89
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
90
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
91
92
93
94

/*!
* \brief create a dataset from CSC format
* \param col_ptr pointer to col headers
wxchan's avatar
wxchan committed
95
* \param col_ptr_type type of col_ptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
96
97
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
98
99
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
* \param ncol_ptr number of cols in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
100
* \param nelem number of nonzero elements in the matrix
wxchan's avatar
wxchan committed
101
* \param num_row number of rows
Guolin Ke's avatar
Guolin Ke committed
102
103
104
* \param parameters additional parameters
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
105
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
106
*/
wxchan's avatar
wxchan committed
107
DllExport int LGBM_DatasetCreateFromCSC(const void* col_ptr,
108
  int col_ptr_type,
Guolin Ke's avatar
Guolin Ke committed
109
110
  const int32_t* indices,
  const void* data,
111
112
113
114
  int data_type,
  int64_t ncol_ptr,
  int64_t nelem,
  int64_t num_row,
Guolin Ke's avatar
Guolin Ke committed
115
  const char* parameters,
116
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
117
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
118
119
120
121

/*!
* \brief create dataset from dense matrix
* \param data pointer to the data space
wxchan's avatar
wxchan committed
122
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
123
124
* \param nrow number of rows
* \param ncol number of columns
125
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
126
* \param parameters additional parameters
Guolin Ke's avatar
Guolin Ke committed
127
128
* \param reference used to align bin mapper with other dataset, nullptr means not used
* \param out created dataset
wxchan's avatar
wxchan committed
129
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
130
*/
wxchan's avatar
wxchan committed
131
DllExport int LGBM_DatasetCreateFromMat(const void* data,
132
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
133
134
  int32_t nrow,
  int32_t ncol,
135
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
136
  const char* parameters,
137
  const DatasetHandle reference,
Guolin Ke's avatar
typo  
Guolin Ke committed
138
  DatasetHandle* out);
Guolin Ke's avatar
Guolin Ke committed
139

wxchan's avatar
wxchan committed
140
141
142
143
144
145
146
147
148
149
/*!
* \brief Create subset of a data
* \param handle handle of full dataset
* \param used_row_indices Indices used in subset
* \param num_used_row_indices len of used_row_indices
* \param parameters additional parameters
* \param out subset of data
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_DatasetGetSubset(
150
  const DatasetHandle handle,
wxchan's avatar
wxchan committed
151
152
153
  const int32_t* used_row_indices,
  int32_t num_used_row_indices,
  const char* parameters,
Guolin Ke's avatar
typo  
Guolin Ke committed
154
  DatasetHandle* out);
wxchan's avatar
wxchan committed
155

Guolin Ke's avatar
Guolin Ke committed
156
157
158
159
160
161
162
163
/*!
* \brief save feature names to Dataset
* \param handle handle
* \param feature_names feature names
* \param num_feature_names number of feature names
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_DatasetSetFeatureNames(
Guolin Ke's avatar
typo  
Guolin Ke committed
164
  DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
165
166
167
  const char** feature_names,
  int64_t num_feature_names);

Guolin Ke's avatar
Guolin Ke committed
168
169
/*!
* \brief free space for dataset
* \param handle handle of the dataset to be freed
wxchan's avatar
wxchan committed
170
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
171
*/
Guolin Ke's avatar
typo  
Guolin Ke committed
172
DllExport int LGBM_DatasetFree(DatasetHandle handle);
Guolin Ke's avatar
Guolin Ke committed
173
174
175
176
177

/*!
* \brief save dataset to binary file
* \param handle an instance of dataset
* \param filename file name
wxchan's avatar
wxchan committed
178
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
179
*/
Guolin Ke's avatar
typo  
Guolin Ke committed
180
DllExport int LGBM_DatasetSaveBinary(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
181
182
183
184
  const char* filename);

/*!
* \brief set vector to a content in info
wxchan's avatar
wxchan committed
185
186
*        Note: group and group_id only work for C_API_DTYPE_INT32
*              label and weight only work for C_API_DTYPE_FLOAT32
Guolin Ke's avatar
Guolin Ke committed
187
* \param handle an instance of dataset
wxchan's avatar
wxchan committed
188
* \param field_name field name, can be label, weight, group, group_id
189
* \param field_data pointer to vector
Guolin Ke's avatar
Guolin Ke committed
190
* \param num_element number of elements in field_data
wxchan's avatar
wxchan committed
191
192
* \param type C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
193
*/
Guolin Ke's avatar
typo  
Guolin Ke committed
194
DllExport int LGBM_DatasetSetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
195
196
  const char* field_name,
  const void* field_data,
197
  int64_t num_element,
Guolin Ke's avatar
Guolin Ke committed
198
199
200
  int type);

/*!
201
* \brief get info vector from dataset
Guolin Ke's avatar
Guolin Ke committed
202
203
204
205
* \param handle an instance of dataset
* \param field_name field name
* \param out_len used to set result length
* \param out_ptr pointer to the result
wxchan's avatar
wxchan committed
206
207
* \param out_type  C_API_DTYPE_FLOAT32 or C_API_DTYPE_INT32
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
208
*/
Guolin Ke's avatar
typo  
Guolin Ke committed
209
DllExport int LGBM_DatasetGetField(DatasetHandle handle,
Guolin Ke's avatar
Guolin Ke committed
210
  const char* field_name,
211
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
212
213
214
215
216
217
218
  const void** out_ptr,
  int* out_type);

/*!
* \brief get number of data.
* \param handle the handle to the dataset
* \param out The address to hold number of data
wxchan's avatar
wxchan committed
219
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
220
*/
Guolin Ke's avatar
typo  
Guolin Ke committed
221
DllExport int LGBM_DatasetGetNumData(DatasetHandle handle,
222
  int64_t* out);
Guolin Ke's avatar
Guolin Ke committed
223
224
225
226
227

/*!
* \brief get number of features
* \param handle the handle to the dataset
* \param out The output of number of features
wxchan's avatar
wxchan committed
228
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
229
*/
Guolin Ke's avatar
typo  
Guolin Ke committed
230
DllExport int LGBM_DatasetGetNumFeature(DatasetHandle handle,
231
  int64_t* out);
Guolin Ke's avatar
Guolin Ke committed
232
233
234
235
236

// --- start Booster interfaces

/*!
* \brief create a new boosting learner
Guolin Ke's avatar
Guolin Ke committed
237
* \param train_data training data set
Guolin Ke's avatar
Guolin Ke committed
238
239
* \param parameters format: 'key1=value1 key2=value2'
* \param out handle of created Booster
wxchan's avatar
wxchan committed
240
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
241
*/
Guolin Ke's avatar
typo  
Guolin Ke committed
242
DllExport int LGBM_BoosterCreate(const DatasetHandle train_data,
Guolin Ke's avatar
Guolin Ke committed
243
244
245
246
  const char* parameters,
  BoosterHandle* out);

/*!
Guolin Ke's avatar
Guolin Ke committed
247
* \brief load an existing boosting from model file
Guolin Ke's avatar
Guolin Ke committed
248
* \param filename filename of model
wxchan's avatar
wxchan committed
249
* \param out_num_iterations number of iterations of this booster
Guolin Ke's avatar
Guolin Ke committed
250
* \param out handle of created Booster
wxchan's avatar
wxchan committed
251
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
252
*/
wxchan's avatar
wxchan committed
253
DllExport int LGBM_BoosterCreateFromModelfile(
Guolin Ke's avatar
Guolin Ke committed
254
  const char* filename,
wxchan's avatar
wxchan committed
255
  int64_t* out_num_iterations,
Guolin Ke's avatar
Guolin Ke committed
256
257
  BoosterHandle* out);

wxchan's avatar
wxchan committed
258

Guolin Ke's avatar
Guolin Ke committed
259
260
261
/*!
* \brief free obj in handle
* \param handle handle to be freed
wxchan's avatar
wxchan committed
262
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
263
264
265
*/
DllExport int LGBM_BoosterFree(BoosterHandle handle);

wxchan's avatar
wxchan committed
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
/*!
* \brief Merge the models of two boosters into the first handle
* \param handle handle, will merge other handle to this
* \param other_handle handle of the booster whose model is merged into handle
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterMerge(BoosterHandle handle,
  BoosterHandle other_handle);

/*!
* \brief Add new validation to booster
* \param handle handle
* \param valid_data validation data set
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterAddValidData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
282
  const DatasetHandle valid_data);
wxchan's avatar
wxchan committed
283
284
285
286
287
288
289
290

/*!
* \brief Reset training data for booster
* \param handle handle
* \param train_data training data set
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterResetTrainingData(BoosterHandle handle,
Guolin Ke's avatar
typo  
Guolin Ke committed
291
  const DatasetHandle train_data);
wxchan's avatar
wxchan committed
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308

/*!
* \brief Reset config for current booster
* \param handle handle
* \param parameters format: 'key1=value1 key2=value2'
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterResetParameter(BoosterHandle handle, const char* parameters);

/*!
* \brief Get number of classes
* \param handle handle
* \param out_len number of classes
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterGetNumClasses(BoosterHandle handle, int64_t* out_len);

Guolin Ke's avatar
Guolin Ke committed
309
310
311
/*!
* \brief update the model in one round
* \param handle handle
Guolin Ke's avatar
Guolin Ke committed
312
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
313
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
314
315
316
317
318
319
320
321
322
*/
DllExport int LGBM_BoosterUpdateOneIter(BoosterHandle handle, int* is_finished);

/*!
* \brief update the model by directly specifying the gradient and second order gradient,
*       this can be used to support customized loss function
* \param handle handle
* \param grad gradient statistics
* \param hess second order gradient statistics
Guolin Ke's avatar
Guolin Ke committed
323
* \param is_finished 1 means finished (cannot split any more)
wxchan's avatar
wxchan committed
324
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
325
326
*/
DllExport int LGBM_BoosterUpdateOneIterCustom(BoosterHandle handle,
327
328
  const float* grad,
  const float* hess,
Guolin Ke's avatar
Guolin Ke committed
329
330
331
  int* is_finished);

/*!
wxchan's avatar
wxchan committed
332
* \brief Rollback one iteration
Guolin Ke's avatar
Guolin Ke committed
333
* \param handle handle
wxchan's avatar
wxchan committed
334
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
335
*/
wxchan's avatar
wxchan committed
336
337
338
339
340
341
342
343
DllExport int LGBM_BoosterRollbackOneIter(BoosterHandle handle);

/*!
* \brief Get iteration of current boosting rounds
* \param handle handle
* \param out_iteration iteration of boosting rounds
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterGetCurrentIteration(BoosterHandle handle, int64_t* out_iteration);
Guolin Ke's avatar
Guolin Ke committed
344

Guolin Ke's avatar
Guolin Ke committed
345
/*!
wxchan's avatar
wxchan committed
346
347
348
349
350
351
352
353
354
* \brief Get number of eval results
* \param handle handle
* \param out_len total number of eval results
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterGetEvalCounts(BoosterHandle handle, int64_t* out_len);

/*!
* \brief Get names of eval results
* \param handle handle
* \param out_len total number of eval results
Guolin Ke's avatar
typo  
Guolin Ke committed
355
* \param out_strs names of eval result, need to pre-allocate memory before calling this
wxchan's avatar
wxchan committed
356
357
358
359
360
361
362
363
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterGetEvalNames(BoosterHandle handle, int64_t* out_len, char** out_strs);

/*!
* \brief get evaluation for training data and validation data
         Note: 1. you should call LGBM_BoosterGetEvalNames first to get the name of evaluation results
         2. should pre-allocate memory for out_results, you can get its length by LGBM_BoosterGetEvalCounts
Guolin Ke's avatar
Guolin Ke committed
364
* \param handle handle
wxchan's avatar
wxchan committed
365
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
366
* \param out_len len of output result
wxchan's avatar
wxchan committed
367
368
* \param out_results float array containing the results
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
369
*/
wxchan's avatar
wxchan committed
370
371
DllExport int LGBM_BoosterGetEval(BoosterHandle handle,
  int data_idx,
372
  int64_t* out_len,
wxchan's avatar
wxchan committed
373
  float* out_results);
Guolin Ke's avatar
Guolin Ke committed
374

Guolin Ke's avatar
Guolin Ke committed
375
/*!
Guolin Ke's avatar
Guolin Ke committed
376
* \brief Get prediction for training data and validation data
wxchan's avatar
wxchan committed
377
378
         this can be used to support customized eval function
         Note:  should pre-allocate memory for out_result, its length is equal to num_class * num_data 
Guolin Ke's avatar
Guolin Ke committed
379
* \param handle handle
wxchan's avatar
wxchan committed
380
* \param data_idx 0:training data, 1: 1st valid data, 2:2nd valid data ...
Guolin Ke's avatar
Guolin Ke committed
381
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
382
* \param out_result used to set a pointer to array, should allocate memory before calling this function
wxchan's avatar
wxchan committed
383
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
384
*/
Guolin Ke's avatar
Guolin Ke committed
385
DllExport int LGBM_BoosterGetPredict(BoosterHandle handle,
wxchan's avatar
wxchan committed
386
  int data_idx,
387
  int64_t* out_len,
Guolin Ke's avatar
Guolin Ke committed
388
  float* out_result);
Guolin Ke's avatar
Guolin Ke committed
389

390
391
392
393
/*!
* \brief make prediction for file
* \param handle handle
* \param data_filename filename of data file
wxchan's avatar
wxchan committed
394
395
396
397
398
399
* \param data_has_header data file has header or not
* \param predict_type
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
400
* \param result_filename filename of result file
wxchan's avatar
wxchan committed
401
* \return 0 when succeed, -1 when failure happens
402
403
404
*/
DllExport int LGBM_BoosterPredictForFile(BoosterHandle handle,
  const char* data_filename,
wxchan's avatar
wxchan committed
405
406
407
  int data_has_header,
  int predict_type,
  int64_t num_iteration,
408
409
  const char* result_filename);

Guolin Ke's avatar
Guolin Ke committed
410
411
/*!
* \brief make prediction for a new data set
wxchan's avatar
wxchan committed
412
413
414
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
415
416
* \param handle handle
* \param indptr pointer to row headers
wxchan's avatar
wxchan committed
417
* \param indptr_type type of indptr, can be C_API_DTYPE_INT32 or C_API_DTYPE_INT64
Guolin Ke's avatar
Guolin Ke committed
418
419
* \param indices findex
* \param data fvalue
wxchan's avatar
wxchan committed
420
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
421
* \param nindptr number of rows in the matrix + 1
Guolin Ke's avatar
Guolin Ke committed
422
423
424
* \param nelem number of nonzero elements in the matrix
* \param num_col number of columns; when it's set to 0, then guess from data
* \param predict_type
wxchan's avatar
wxchan committed
425
426
427
428
429
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
430
* \param out_result used to set a pointer to array, should allocate memory before calling this function
wxchan's avatar
wxchan committed
431
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
432
433
*/
DllExport int LGBM_BoosterPredictForCSR(BoosterHandle handle,
434
435
  const void* indptr,
  int indptr_type,
Guolin Ke's avatar
Guolin Ke committed
436
  const int32_t* indices,
437
  const void* data,
438
439
440
441
  int data_type,
  int64_t nindptr,
  int64_t nelem,
  int64_t num_col,
Guolin Ke's avatar
Guolin Ke committed
442
  int predict_type,
wxchan's avatar
wxchan committed
443
444
445
  int64_t num_iteration,
  int64_t* out_len,
  float* out_result);
Guolin Ke's avatar
Guolin Ke committed
446
447
448

/*!
* \brief make prediction for a new data set
wxchan's avatar
wxchan committed
449
450
451
*        Note:  should pre-allocate memory for out_result,
*               for normal and raw score: its length is equal to num_class * num_data
*               for leaf index, its length is equal to num_class * num_data * num_iteration
Guolin Ke's avatar
Guolin Ke committed
452
453
* \param handle handle
* \param data pointer to the data space
wxchan's avatar
wxchan committed
454
* \param data_type type of data pointer, can be C_API_DTYPE_FLOAT32 or C_API_DTYPE_FLOAT64
Guolin Ke's avatar
Guolin Ke committed
455
456
* \param nrow number of rows
* \param ncol number of columns
Guolin Ke's avatar
Guolin Ke committed
457
* \param is_row_major 1 for row major, 0 for column major
Guolin Ke's avatar
Guolin Ke committed
458
* \param predict_type
wxchan's avatar
wxchan committed
459
460
461
462
463
*          C_API_PREDICT_NORMAL: normal prediction, with transform (if needed)
*          C_API_PREDICT_RAW_SCORE: raw score
*          C_API_PREDICT_LEAF_INDEX: leaf index
* \param num_iteration number of iteration for prediction, <= 0 means no limit
* \param out_len len of output result
Guolin Ke's avatar
Guolin Ke committed
464
* \param out_result used to set a pointer to array, should allocate memory before calling this function
wxchan's avatar
wxchan committed
465
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
466
467
*/
DllExport int LGBM_BoosterPredictForMat(BoosterHandle handle,
468
  const void* data,
469
  int data_type,
Guolin Ke's avatar
Guolin Ke committed
470
471
  int32_t nrow,
  int32_t ncol,
Guolin Ke's avatar
Guolin Ke committed
472
  int is_row_major,
Guolin Ke's avatar
Guolin Ke committed
473
  int predict_type,
wxchan's avatar
wxchan committed
474
475
476
  int64_t num_iteration,
  int64_t* out_len,
  float* out_result);
Guolin Ke's avatar
Guolin Ke committed
477
478
479
480

/*!
* \brief save model into file
* \param handle handle
wxchan's avatar
wxchan committed
481
* \param num_iteration number of iterations to save, <= 0 means save all
Guolin Ke's avatar
Guolin Ke committed
482
* \param filename file name
wxchan's avatar
wxchan committed
483
* \return 0 when succeed, -1 when failure happens
Guolin Ke's avatar
Guolin Ke committed
484
485
*/
DllExport int LGBM_BoosterSaveModel(BoosterHandle handle,
wxchan's avatar
wxchan committed
486
  int num_iteration,
Guolin Ke's avatar
Guolin Ke committed
487
488
  const char* filename);

wxchan's avatar
wxchan committed
489
490
491
492
493
/*!
* \brief dump model to json
* \param handle handle
* \param buffer_len string buffer length, if buffer_len < out_len, re-allocate buffer
* \param out_len actual output length
Guolin Ke's avatar
typo  
Guolin Ke committed
494
* \param out_str json format string of model, need to pre-allocate memory before calling this
wxchan's avatar
wxchan committed
495
496
497
498
499
500
* \return 0 when succeed, -1 when failure happens
*/
DllExport int LGBM_BoosterDumpModel(BoosterHandle handle,
  int buffer_len,
  int64_t* out_len,
  char** out_str);
501

Guolin Ke's avatar
Guolin Ke committed
502
503
// some help functions used to convert data

504
505
506
507
508
509
510
/*!
* \brief declaration only; builds a callable that maps a row index to a std::vector<double>
*        NOTE(review): presumably the values of that row of the dense matrix, and the parameters
*        presumably follow LGBM_DatasetCreateFromMat (data_type = C_API_DTYPE_FLOAT32/FLOAT64,
*        is_row_major = 1 for row major) - confirm against the implementation
* \param data pointer to the matrix data
* \param num_row number of rows
* \param num_col number of columns
* \param data_type type of data pointer
* \param is_row_major memory layout flag
* \return callable taking row_idx and returning std::vector<double>
*/
std::function<std::vector<double>(int row_idx)>
RowFunctionFromDenseMatric(const void* data, int num_row, int num_col, int data_type, int is_row_major);

/*!
* \brief declaration only; builds a callable that maps a row index to a vector of (int, double) pairs
*        NOTE(review): presumably (column index, value) pairs of that row of the dense matrix,
*        with parameters following LGBM_DatasetCreateFromMat - confirm against the implementation
* \param data pointer to the matrix data
* \param num_row number of rows
* \param num_col number of columns
* \param data_type type of data pointer
* \param is_row_major memory layout flag
* \return callable taking row_idx and returning std::vector<std::pair<int, double>>
*/
std::function<std::vector<std::pair<int, double>>(int row_idx)>
RowPairFunctionFromDenseMatric(const void* data, int num_row, int num_col, int data_type, int is_row_major);

/*!
* \brief declaration only; builds a callable that maps an index to a vector of (int, double) pairs
*        NOTE(review): presumably idx is a row index and the pairs are (column index, value) entries
*        of that CSR row, with parameters following LGBM_DatasetCreateFromCSR - confirm against the implementation
* \param indptr pointer to row headers
* \param indptr_type type of indptr
* \param indices findex
* \param data fvalue
* \param data_type type of data pointer
* \param nindptr length of indptr
* \param nelem number of elements in data
* \return callable taking idx and returning std::vector<std::pair<int, double>>
*/
std::function<std::vector<std::pair<int, double>>(int idx)>
wxchan's avatar
wxchan committed
511
RowFunctionFromCSR(const void* indptr, int indptr_type, const int32_t* indices,
512
513
514
  const void* data, int data_type, int64_t nindptr, int64_t nelem);

/*!
* \brief declaration only; builds a callable that maps an index to a vector of (int, double) pairs
*        NOTE(review): presumably idx is a column index and the pairs are (row index, value) entries
*        of that CSC column, with parameters following LGBM_DatasetCreateFromCSC - confirm against the implementation
* \param col_ptr pointer to col headers
* \param col_ptr_type type of col_ptr
* \param indices findex
* \param data fvalue
* \param data_type type of data pointer
* \param ncol_ptr length of col_ptr
* \param nelem number of elements in data
* \return callable taking idx and returning std::vector<std::pair<int, double>>
*/
std::function<std::vector<std::pair<int, double>>(int idx)>
wxchan's avatar
wxchan committed
515
ColumnFunctionFromCSC(const void* col_ptr, int col_ptr_type, const int32_t* indices,
516
517
  const void* data, int data_type, int64_t ncol_ptr, int64_t nelem);

wxchan's avatar
wxchan committed
518
/*!
* \brief declaration only; produces a std::vector<double> from one column's (int, double) pairs and a list of indices
*        NOTE(review): presumably picks the column values at the given sampled row indices - confirm against the implementation
* \param data (int, double) pairs of one column
* \param indices indices used for sampling
* \return vector of double values
*/
std::vector<double>
519
SampleFromOneColumn(const std::vector<std::pair<int, double>>& data, const std::vector<int>& indices);
520

wxchan's avatar
wxchan committed
521
// exception handling and error message

/*! \brief capacity in bytes of the per-thread error buffer, including the terminating '\0' */
const int kLastErrorMsgBufferSize = 512;

/*!
* \brief get the error message buffer of the calling thread
*  The buffer is thread-local, holds kLastErrorMsgBufferSize bytes and initially contains "Everything is fine".
*  NOTE(review): this function is static, so every translation unit that includes this header
*  gets its own buffer; confirm that the writer and the reader of the message share one translation unit.
* \return pointer to the writable, null-terminated buffer
*/
#if defined(_MSC_VER)
static char* LastErrorMsg() { static __declspec(thread) char err_msg[kLastErrorMsgBufferSize] = "Everything is fine"; return err_msg; }
#else
static char* LastErrorMsg() { static thread_local char err_msg[kLastErrorMsgBufferSize] = "Everything is fine"; return err_msg; }
#endif

/*!
* \brief store msg as the last error message of the calling thread
*  Messages that do not fit are truncated to kLastErrorMsgBufferSize - 1 characters
*  instead of being written past the end of the buffer.
* \param msg null-terminated message; nullptr is stored as an empty message
*/
inline void LGBM_SetLastError(const char* msg) {
  char* buffer = LastErrorMsg();
  if (msg == nullptr) {
    buffer[0] = '\0';
    return;
  }
  // strncpy leaves the destination unterminated when the source is too long,
  // so copy at most size - 1 characters and always terminate explicitly
  std::strncpy(buffer, msg, kLastErrorMsgBufferSize - 1);
  buffer[kLastErrorMsgBufferSize - 1] = '\0';
}

/*!
* \brief record the message of a caught std::exception as the last error
* \param ex exception whose what() text is passed to LGBM_SetLastError
* \return always -1
*/
inline int LGBM_APIHandleException(const std::exception& ex) {
  const char* const message = ex.what();
  LGBM_SetLastError(message);
  return -1;
}
/*!
* \brief record a caught std::string as the last error
* \param ex message whose contents are passed to LGBM_SetLastError
* \return always -1
*/
inline int LGBM_APIHandleException(const std::string& ex) {
  const int failure_code = -1;
  LGBM_SetLastError(ex.c_str());
  return failure_code;
}

/*!
* \brief API_BEGIN() / API_END() wrap the body of a function returning int:
*  the body runs inside a try block; a std::exception or std::string thrown from it is
*  passed to LGBM_APIHandleException and that result is returned, any other exception is
*  reported as "unknown exception", and 0 is returned when nothing was thrown.
*  Exceptions are caught by const reference because the handlers only read them.
*/
#define API_BEGIN() try {

#define API_END() } \
catch(const std::exception& ex) { return LGBM_APIHandleException(ex); } \
catch(const std::string& ex) { return LGBM_APIHandleException(ex); } \
catch(...) { return LGBM_APIHandleException("unknown exception"); } \
return 0;
548

Guolin Ke's avatar
Guolin Ke committed
549
#endif // LIGHTGBM_C_API_H_