fix ranking tasks consistency (#1739)

* fix ndcg consistency.
* more stable sorts
* Update gbdt_model_text.cpp
* Update dataset.cpp
* Update gbdt_model_text.cpp

fix ranking tasks consistency (#1739)
* fix ndcg consistency.
* more stable sorts
* Update gbdt_model_text.cpp
* Update dataset.cpp
* Update gbdt_model_text.cpp
496a07d1 · Guolin Ke · GitHub · ac6951d3 · 496a07d1 · 496a07d1
Unverified Commit 496a07d1 authored Oct 10, 2018 by Guolin Ke Committed by GitHub Oct 10, 2018
9 changed files
--- a/include/LightGBM/utils/common.h
+++ b/include/LightGBM/utils/common.h
@@ -625,11 +625,11 @@ inline static void SortForPair(std::vector<T1>& keys, std::vector<T2>& values, s
    arr.emplace_back(keys[i], values[i]);
  }
  if (!is_reverse) {
-    std::sort(arr.begin(), arr.end(), [](const std::pair<T1, T2>& a, const std::pair<T1, T2>& b) {
+    std::stable_sort(arr.begin(), arr.end(), [](const std::pair<T1, T2>& a, const std::pair<T1, T2>& b) {
      return a.first < b.first;
    });
  } else {
-    std::sort(arr.begin(), arr.end(), [](const std::pair<T1, T2>& a, const std::pair<T1, T2>& b) {
+    std::stable_sort(arr.begin(), arr.end(), [](const std::pair<T1, T2>& a, const std::pair<T1, T2>& b) {
      return a.first > b.first;
    });
  }

--- a/src/boosting/gbdt_model_text.cpp
+++ b/src/boosting/gbdt_model_text.cpp
@@ -304,9 +304,9 @@ std::string GBDT::SaveModelToString(int start_iteration, int num_iteration) cons
    }
  }
  // sort the importance
-  std::sort(pairs.begin(), pairs.end(),
+  std::stable_sort(pairs.begin(), pairs.end(),
-            [](const std::pair<size_t, std::string>& lhs,
+                   [](const std::pair<size_t, std::string>& lhs,
-               const std::pair<size_t, std::string>& rhs) {
+                      const std::pair<size_t, std::string>& rhs) {
    return lhs.first > rhs.first;
  });
  ss << '\n' << "feature importances:" << '\n';

--- a/src/io/bin.cpp
+++ b/src/io/bin.cpp
@@ -235,7 +235,7 @@ namespace LightGBM {
    std::vector<double> distinct_values;
    std::vector<int> counts;
-    std::sort(values, values + num_sample_values);
+    std::stable_sort(values, values + num_sample_values);
    // push zero in the front
    if (num_sample_values == 0 || (values[0] > 0.0f && zero_cnt > 0)) {

--- a/src/io/dataset.cpp
+++ b/src/io/dataset.cpp
@@ -162,8 +162,8 @@ std::vector<std::vector<int>> FastFeatureBundling(std::vector<std::unique_ptr<Bi
    sorted_idx.emplace_back(i);
  }
  // sort by non zero cnt, bigger first
-  std::sort(sorted_idx.begin(), sorted_idx.end(),
+  std::stable_sort(sorted_idx.begin(), sorted_idx.end(),
-            [&feature_non_zero_cnt](int a, int b) {
+                   [&feature_non_zero_cnt](int a, int b) {
    return feature_non_zero_cnt[a] > feature_non_zero_cnt[b];
  });

--- a/src/metric/dcg_calculator.cpp
+++ b/src/metric/dcg_calculator.cpp
@@ -44,7 +44,7 @@ void DCGCalculator::Init(const std::vector<double>& input_label_gain) {
  }
  discount_.resize(kMaxPosition);
  for (data_size_t i = 0; i < kMaxPosition; ++i) {
-    discount_[i] = 1.0f / std::log2(2.0f + i);
+    discount_[i] = 1.0 / std::log2(2.0 + i);
  }
 }
@@ -111,8 +111,8 @@ double DCGCalculator::CalDCGAtK(data_size_t k, const label_t* label,
  for (data_size_t i = 0; i < num_data; ++i) {
    sorted_idx[i] = i;
  }
-  std::sort(sorted_idx.begin(), sorted_idx.end(),
+  std::stable_sort(sorted_idx.begin(), sorted_idx.end(),
-           [score](data_size_t a, data_size_t b) {return score[a] > score[b]; });
+                   [score](data_size_t a, data_size_t b) {return score[a] > score[b]; });
  if (k > num_data) { k = num_data; }
  double dcg = 0.0f;
@@ -131,8 +131,8 @@ void DCGCalculator::CalDCG(const std::vector<data_size_t>& ks, const label_t* la
  for (data_size_t i = 0; i < num_data; ++i) {
    sorted_idx[i] = i;
  }
-  std::sort(sorted_idx.begin(), sorted_idx.end(),
+  std::stable_sort(sorted_idx.begin(), sorted_idx.end(),
-            [score](data_size_t a, data_size_t b) {return score[a] > score[b]; });
+                   [score](data_size_t a, data_size_t b) {return score[a] > score[b]; });
  double cur_result = 0.0f;
  data_size_t cur_left = 0;

--- a/src/metric/map_metric.hpp
+++ b/src/metric/map_metric.hpp
@@ -79,8 +79,8 @@ public:
    for (data_size_t i = 0; i < num_data; ++i) {
      sorted_idx.emplace_back(i);
    }
-    std::sort(sorted_idx.begin(), sorted_idx.end(),
+    std::stable_sort(sorted_idx.begin(), sorted_idx.end(),
-              [score](data_size_t a, data_size_t b) {return score[a] > score[b]; });
+                     [score](data_size_t a, data_size_t b) {return score[a] > score[b]; });
    int num_hit = 0;
    double sum_ap = 0.0f;

--- a/src/objective/rank_objective.hpp
+++ b/src/objective/rank_objective.hpp
@@ -100,8 +100,8 @@ public:
    for (data_size_t i = 0; i < cnt; ++i) {
      sorted_idx.emplace_back(i);
    }
-    std::sort(sorted_idx.begin(), sorted_idx.end(),
+    std::stable_sort(sorted_idx.begin(), sorted_idx.end(),
-             [score](data_size_t a, data_size_t b) { return score[a] > score[b]; });
+                     [score](data_size_t a, data_size_t b) { return score[a] > score[b]; });
    // get best and worst score
    const double best_score = score[sorted_idx[0]];
    data_size_t worst_idx = cnt - 1;

--- a/src/objective/regression_objective.hpp
+++ b/src/objective/regression_objective.hpp
@@ -40,7 +40,7 @@ namespace LightGBM {
  for (data_size_t i = 0; i < cnt_data; ++i) {\
    sorted_idx[i] = i;\
  }\
-  std::sort(sorted_idx.begin(), sorted_idx.end(), [=](data_size_t a, data_size_t b) {return data_reader(a) < data_reader(b); });\
+  std::stable_sort(sorted_idx.begin(), sorted_idx.end(), [=](data_size_t a, data_size_t b) {return data_reader(a) < data_reader(b); });\
  std::vector<double> weighted_cdf(cnt_data);\
  weighted_cdf[0] = weight_reader(sorted_idx[0]);\
  for (data_size_t i = 1; i < cnt_data; ++i) {\

--- a/tests/python_package_test/test_sklearn.py
+++ b/tests/python_package_test/test_sklearn.py
@@ -65,6 +65,9 @@ class TestSklearn(unittest.TestCase):
        gbm.fit(X_train, y_train, group=q_train, eval_set=[(X_test, y_test)],
                eval_group=[q_test], eval_at=[1, 3], early_stopping_rounds=5, verbose=False,
                callbacks=[lgb.reset_parameter(learning_rate=lambda x: 0.95 ** x * 0.1)])
+        self.assertLessEqual(gbm.best_iteration_, 12)
+        self.assertGreater(gbm.best_score_['valid_0']['ndcg@1'], 0.65)
+        self.assertGreater(gbm.best_score_['valid_0']['ndcg@3'], 0.65)
    def test_regression_with_custom_objective(self):
        def objective_ls(y_true, y_pred):