Commit 6757a6aa authored by Guolin Ke's avatar Guolin Ke
Browse files

Limit the maximum tree output; change the Hessian in the multi-class objective.

parent 3beee91d
...@@ -10,6 +10,7 @@ ...@@ -10,6 +10,7 @@
namespace LightGBM { namespace LightGBM {
#define kMaxTreeOutput (100)
/*! /*!
* \brief Tree model * \brief Tree model
...@@ -101,9 +102,11 @@ public: ...@@ -101,9 +102,11 @@ public:
* \param rate The factor of shrinkage * \param rate The factor of shrinkage
*/ */
inline void Shrinkage(double rate) { inline void Shrinkage(double rate) {
#pragma omp parallel for schedule(static) #pragma omp parallel for schedule(static)
for (int i = 0; i < num_leaves_; ++i) { for (int i = 0; i < num_leaves_; ++i) {
leaf_value_[i] *= rate; leaf_value_[i] *= rate;
if (leaf_value_[i] > kMaxTreeOutput) { leaf_value_[i] = kMaxTreeOutput; }
else if (leaf_value_[i] < -kMaxTreeOutput) { leaf_value_[i] = -kMaxTreeOutput; }
} }
shrinkage_ *= rate; shrinkage_ *= rate;
} }
......
...@@ -37,10 +37,6 @@ public: ...@@ -37,10 +37,6 @@ public:
} }
} }
Log::Info("Number of positive: %d, number of negative: %d", cnt_positive, cnt_negative); Log::Info("Number of positive: %d, number of negative: %d", cnt_positive, cnt_negative);
// cannot continue if all sample are same class
if (cnt_positive == 0 || cnt_negative == 0) {
Log::Fatal("Training data only contains one class");
}
// use -1 for negative class, and 1 for positive class // use -1 for negative class, and 1 for positive class
label_val_[0] = -1; label_val_[0] = -1;
label_val_[1] = 1; label_val_[1] = 1;
...@@ -48,7 +44,7 @@ public: ...@@ -48,7 +44,7 @@ public:
label_weights_[0] = 1.0f; label_weights_[0] = 1.0f;
label_weights_[1] = 1.0f; label_weights_[1] = 1.0f;
// if using unbalance, change the labels weight // if using unbalance, change the labels weight
if (is_unbalance_) { if (is_unbalance_ && cnt_positive > 0 && cnt_negative > 0) {
if (cnt_positive > cnt_negative) { if (cnt_positive > cnt_negative) {
label_weights_[1] = 1.0f; label_weights_[1] = 1.0f;
label_weights_[0] = static_cast<double>(cnt_positive) / cnt_negative; label_weights_[0] = static_cast<double>(cnt_positive) / cnt_negative;
......
...@@ -61,10 +61,10 @@ public: ...@@ -61,10 +61,10 @@ public:
size_t idx = static_cast<size_t>(num_data_) * k + i; size_t idx = static_cast<size_t>(num_data_) * k + i;
if (label_int_[i] == k) { if (label_int_[i] == k) {
gradients[idx] = static_cast<score_t>(p - 1.0f) * label_pos_weights_[k]; gradients[idx] = static_cast<score_t>(p - 1.0f) * label_pos_weights_[k];
hessians[idx] = static_cast<score_t>(2.0f * p * (1.0f - p))* label_pos_weights_[k]; hessians[idx] = static_cast<score_t>(p * (1.0f - p))* label_pos_weights_[k];
} else { } else {
gradients[idx] = static_cast<score_t>(p); gradients[idx] = static_cast<score_t>(p);
hessians[idx] = static_cast<score_t>(2.0f * p * (1.0f - p)); hessians[idx] = static_cast<score_t>(p * (1.0f - p));
} }
} }
} }
...@@ -82,10 +82,10 @@ public: ...@@ -82,10 +82,10 @@ public:
size_t idx = static_cast<size_t>(num_data_) * k + i; size_t idx = static_cast<size_t>(num_data_) * k + i;
if (label_int_[i] == k) { if (label_int_[i] == k) {
gradients[idx] = static_cast<score_t>((p - 1.0f) * weights_[i]) * label_pos_weights_[k]; gradients[idx] = static_cast<score_t>((p - 1.0f) * weights_[i]) * label_pos_weights_[k];
hessians[idx] = static_cast<score_t>(2.0f * p * (1.0f - p) * weights_[i]) * label_pos_weights_[k]; hessians[idx] = static_cast<score_t>(p * (1.0f - p) * weights_[i]) * label_pos_weights_[k];
} else { } else {
gradients[idx] = static_cast<score_t>(p * weights_[i]); gradients[idx] = static_cast<score_t>(p * weights_[i]);
hessians[idx] = static_cast<score_t>(2.0f * p * (1.0f - p) * weights_[i]); hessians[idx] = static_cast<score_t>(p * (1.0f - p) * weights_[i]);
} }
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment