Commit 6219df7a authored by Tsukasa OMOTO's avatar Tsukasa OMOTO Committed by Guolin Ke
Browse files

Add L1 objective function (#175)

* Add L1 objective function

* fix hessians

* update
parent a6f47d00
...@@ -16,9 +16,11 @@ The parameter format is ```key1=value1 key2=value2 ... ``` . And parameters can ...@@ -16,9 +16,11 @@ The parameter format is ```key1=value1 key2=value2 ... ``` . And parameters can
* ```task```, default=```train```, type=enum, options=```train```,```prediction```
  * ```train``` for training
  * ```prediction``` for prediction.
* ```application```, default=```regression```, type=enum, options=```regression```,```regression_l1```,```huber```,```binary```,```lambdarank```,```multiclass```, alias=```objective```,```app```
  * ```regression```, regression application
    * ```regression_l2```, L2 loss, alias=```mean_squared_error```,```mse```
    * ```regression_l1```, L1 loss, alias=```mean_absolute_error```,```mae```
    * ```huber```, [Huber loss](https://en.wikipedia.org/wiki/Huber_loss "Huber loss - Wikipedia")
  * ```binary```, binary classification application
  * ```lambdarank```, lambdarank application
  * ```multiclass```, multi-class classification application, should set ```num_class``` as well
......
...@@ -400,6 +400,24 @@ inline void SortForPair(std::vector<T1>& keys, std::vector<T2>& values, size_t s ...@@ -400,6 +400,24 @@ inline void SortForPair(std::vector<T1>& keys, std::vector<T2>& values, size_t s
} }
/*
* Approximates the hessian of the absolute (L1) loss with a Gaussian function.
* cf. https://en.wikipedia.org/wiki/Gaussian_function
*
* y is the prediction.
* t means the true target.
* w means the weight (defaults to 1.0).
*
* The second derivative of |y - t| is zero everywhere except at y == t, where
* it is a Dirac delta of area a; we smooth that spike with a Gaussian:
*   f(x) = a / (c * sqrt(2 * pi)) * exp(-(x - b)^2 / (2 * c^2))
*/
inline static double ApproximateHessianWithGaussian(double y, double t, double w = 1.0) {
  const double diff = y - t;
  const double pi = M_PI;
  // Avoid evaluating exactly on the smoothed singularity when y == t.
  const double x = (std::fabs(diff) > 0.0) ? std::fabs(diff) : 1.0e-6;
  // a: jump of the first derivative of w * |y - t| across zero, from -w to +w.
  const double a = 2.0 * w;
  const double b = 0.0;
  // c: peak width, scaled to the magnitude of the inputs. Floored so the
  // divisions below cannot hit zero when y == t == 0.
  const double raw_c = (std::fabs(y) + std::fabs(t)) / 1.0e3;
  const double c = (raw_c > 1.0e-6) ? raw_c : 1.0e-6;
  // Precedence fix: the exponent must divide by (2 * c * c) and the
  // normalization by (sqrt(2 * pi) * c); the original `/ 2.0 * c * c` and
  // `/ std::sqrt(2.0 * pi) * c` multiplied by c instead.
  // NOTE(review): the leading w makes the result scale as w^2, since a
  // already contains w — preserved from the original; verify intent.
  return w * std::exp(-(x - b) * (x - b) / (2.0 * c * c)) * a / (std::sqrt(2.0 * pi) * c);
}
} // namespace Common } // namespace Common
} // namespace LightGBM } // namespace LightGBM
......
...@@ -7,8 +7,11 @@ ...@@ -7,8 +7,11 @@
namespace LightGBM { namespace LightGBM {
ObjectiveFunction* ObjectiveFunction::CreateObjectiveFunction(const std::string& type, const ObjectiveConfig& config) { ObjectiveFunction* ObjectiveFunction::CreateObjectiveFunction(const std::string& type, const ObjectiveConfig& config) {
if (type == std::string("regression")) { if (type == std::string("regression") || type == std::string("regression_l2")
|| type == std::string("mean_squared_error") || type == std::string("mse")) {
return new RegressionL2loss(config); return new RegressionL2loss(config);
} else if (type == std::string("regression_l1") || type == std::string("mean_absolute_error") || type == std::string("mae")) {
return new RegressionL1loss(config);
} else if (type == std::string("huber")) { } else if (type == std::string("huber")) {
return new RegressionLHuberLoss(config); return new RegressionLHuberLoss(config);
} else if (type == std::string("binary")) { } else if (type == std::string("binary")) {
......
...@@ -2,6 +2,7 @@ ...@@ -2,6 +2,7 @@
#define LIGHTGBM_OBJECTIVE_REGRESSION_OBJECTIVE_HPP_ #define LIGHTGBM_OBJECTIVE_REGRESSION_OBJECTIVE_HPP_
#include <LightGBM/objective_function.h> #include <LightGBM/objective_function.h>
#include <LightGBM/utils/common.h>
namespace LightGBM { namespace LightGBM {
/*! /*!
...@@ -51,6 +52,60 @@ private: ...@@ -51,6 +52,60 @@ private:
const float* weights_; const float* weights_;
}; };
class RegressionL1loss: public ObjectiveFunction {
public:
explicit RegressionL1loss(const ObjectiveConfig& config) {}
~RegressionL1loss() {}
void Init(const Metadata& metadata, data_size_t num_data) override {
num_data_ = num_data;
label_ = metadata.label();
weights_ = metadata.weights();
}
void GetGradients(const score_t* score, score_t* gradients,
score_t* hessians) const override {
if (weights_ == nullptr) {
#pragma omp parallel for schedule(static)
for (data_size_t i = 0; i < num_data_; ++i) {
const double diff = score[i] - label_[i];
if (diff >= 0.0) {
gradients[i] = 1.0;
} else {
gradients[i] = -1.0;
}
hessians[i] = Common::ApproximateHessianWithGaussian(score[i], label_[i]);
}
} else {
#pragma omp parallel for schedule(static)
for (data_size_t i = 0; i < num_data_; ++i) {
const double diff = score[i] - label_[i];
if (diff >= 0.0) {
gradients[i] = weights_[i];
} else {
gradients[i] = -weights_[i];
}
hessians[i] = Common::ApproximateHessianWithGaussian(score[i], label_[i], weights_[i]);
}
}
}
const char* GetName() const override {
return "regression_l1";
}
private:
/*! \brief Number of data */
data_size_t num_data_;
/*! \brief Pointer of label */
const float* label_;
/*! \brief Pointer of weights */
const float* weights_;
};
class RegressionLHuberLoss: public ObjectiveFunction { class RegressionLHuberLoss: public ObjectiveFunction {
public: public:
explicit RegressionLHuberLoss(const ObjectiveConfig& config) { explicit RegressionLHuberLoss(const ObjectiveConfig& config) {
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment