// score_updater.hpp
#ifndef LIGHTGBM_BOOSTING_SCORE_UPDATER_HPP_
#define LIGHTGBM_BOOSTING_SCORE_UPDATER_HPP_

#include <LightGBM/meta.h>
#include <LightGBM/dataset.h>
#include <LightGBM/tree.h>
#include <LightGBM/tree_learner.h>

#include <cstring>

namespace LightGBM {
/*!
* \brief Used to store and update score for data
*/
class ScoreUpdater {
public:
  /*!
  * \brief Constructor, will pass a const pointer of dataset
  * \param data This class will bind with this data set
  */
Guolin Ke's avatar
Guolin Ke committed
21
  ScoreUpdater(const Dataset* data, int num_class) : data_(data) {
Guolin Ke's avatar
Guolin Ke committed
22
    num_data_ = data->num_data();
Guolin Ke's avatar
Guolin Ke committed
23
    int64_t total_size = static_cast<int64_t>(num_data_) * num_class;
24
    score_.resize(total_size);
Guolin Ke's avatar
Guolin Ke committed
25
    // default start score is zero
Guolin Ke's avatar
Guolin Ke committed
26
27
28
29
30
#pragma omp parallel for schedule(static)
    for (int64_t i = 0; i < total_size; ++i) {
      score_[i] = 0.0f;
    }
    const double* init_score = data->metadata().init_score();
Guolin Ke's avatar
Guolin Ke committed
31
32
    // if exists initial score, will start from it
    if (init_score != nullptr) {
33
34
35
36
      if ((data->metadata().num_init_score() % num_data_) != 0 
        || (data->metadata().num_init_score() / num_data_) != num_class) {
        Log::Fatal("number of class for initial score error");
      }
Guolin Ke's avatar
Guolin Ke committed
37
38
#pragma omp parallel for schedule(static)
      for (int64_t i = 0; i < total_size; ++i) {
Guolin Ke's avatar
Guolin Ke committed
39
40
41
42
43
44
        score_[i] = init_score[i];
      }
    }
  }
  /*! \brief Destructor */
  ~ScoreUpdater() {
Guolin Ke's avatar
Guolin Ke committed
45

Guolin Ke's avatar
Guolin Ke committed
46
47
  }
  /*!
Qiwei Ye's avatar
Qiwei Ye committed
48
49
  * \brief Using tree model to get prediction number, then adding to scores for all data
  *        Note: this function generally will be used on validation data too.
Guolin Ke's avatar
Guolin Ke committed
50
  * \param tree Trained tree model
51
  * \param curr_class Current class for multiclass training
Guolin Ke's avatar
Guolin Ke committed
52
  */
53
  inline void AddScore(const Tree* tree, int curr_class) {
Guolin Ke's avatar
Guolin Ke committed
54
    tree->AddPredictionToScore(data_, num_data_, score_.data() + curr_class * num_data_);
Guolin Ke's avatar
Guolin Ke committed
55
56
  }
  /*!
Qiwei Ye's avatar
Qiwei Ye committed
57
58
59
  * \brief Adding prediction score, only used for training data.
  *        The training data is partitioned into tree leaves after training
  *        Based on which We can get prediction quckily.
Guolin Ke's avatar
Guolin Ke committed
60
  * \param tree_learner
61
  * \param curr_class Current class for multiclass training
Guolin Ke's avatar
Guolin Ke committed
62
  */
63
  inline void AddScore(const TreeLearner* tree_learner, int curr_class) {
Guolin Ke's avatar
Guolin Ke committed
64
    tree_learner->AddPredictionToScore(score_.data() + curr_class * num_data_);
Guolin Ke's avatar
Guolin Ke committed
65
66
  }
  /*!
Qiwei Ye's avatar
Qiwei Ye committed
67
68
  * \brief Using tree model to get prediction number, then adding to scores for parts of data
  *        Used for prediction of training out-of-bag data
Guolin Ke's avatar
Guolin Ke committed
69
  * \param tree Trained tree model
Hui Xue's avatar
Hui Xue committed
70
71
  * \param data_indices Indices of data that will be proccessed
  * \param data_cnt Number of data that will be proccessed
72
  * \param curr_class Current class for multiclass training
Guolin Ke's avatar
Guolin Ke committed
73
74
  */
  inline void AddScore(const Tree* tree, const data_size_t* data_indices,
75
                                                  data_size_t data_cnt, int curr_class) {
Guolin Ke's avatar
Guolin Ke committed
76
    tree->AddPredictionToScore(data_, data_indices, data_cnt, score_.data() + curr_class * num_data_);
Guolin Ke's avatar
Guolin Ke committed
77
78
  }
  /*! \brief Pointer of score */
79
  inline const double* score() const { return score_.data(); }
Guolin Ke's avatar
Guolin Ke committed
80
81
82
83
84
85
  inline const data_size_t num_data() const { return num_data_; }

  /*! \brief Disable copy */
  ScoreUpdater& operator=(const ScoreUpdater&) = delete;
  /*! \brief Disable copy */
  ScoreUpdater(const ScoreUpdater&) = delete;
Guolin Ke's avatar
Guolin Ke committed
86
87
88
89
90
private:
  /*! \brief Number of total data */
  data_size_t num_data_;
  /*! \brief Pointer of data set */
  const Dataset* data_;
91
  /*! \brief Scores for data set */
92
  std::vector<double> score_;
Guolin Ke's avatar
Guolin Ke committed
93
94
95
};

}  // namespace LightGBM
#endif   // LIGHTGBM_BOOSTING_SCORE_UPDATER_HPP_