Skip to content

Commit 7025754

Browse files
committed
Avoid using mean intercept for rmsle.
1 parent e17f16a commit 7025754

File tree

3 files changed

+90
-48
lines changed

3 files changed

+90
-48
lines changed

src/objective/quantile_obj.cu

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/**
2-
* Copyright 2023-2024, XGBoost contributors
2+
* Copyright 2023-2025, XGBoost contributors
33
*/
44
#include <array> // std::array
55
#include <cstddef> // std::size_t
@@ -10,15 +10,13 @@
1010
#include "../common/quantile_loss_utils.h" // QuantileLossParam
1111
#include "../common/stats.h" // Quantile,WeightedQuantile
1212
#include "adaptive.h" // UpdateTreeLeaf
13-
#include "dmlc/parameter.h" // DMLC_DECLARE_PARAMETER
1413
#include "init_estimation.h" // CheckInitInputs
1514
#include "xgboost/base.h" // GradientPair,XGBOOST_DEVICE,bst_target_t
1615
#include "xgboost/data.h" // MetaInfo
1716
#include "xgboost/host_device_vector.h" // HostDeviceVector
1817
#include "xgboost/json.h" // Json,String,ToJson,FromJson
1918
#include "xgboost/linalg.h" // Tensor,MakeTensorView,MakeVec
2019
#include "xgboost/objective.h" // ObjFunction
21-
#include "xgboost/parameter.h" // XGBoostParameter
2220

2321
#if defined(XGBOOST_USE_CUDA)
2422

src/objective/regression_loss.h

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/**
2-
* Copyright 2017-2023 by XGBoost contributors
2+
* Copyright 2017-2025, XGBoost contributors
33
*/
44
#ifndef XGBOOST_OBJECTIVE_REGRESSION_LOSS_H_
55
#define XGBOOST_OBJECTIVE_REGRESSION_LOSS_H_
@@ -9,7 +9,6 @@
99
#include <cmath>
1010

1111
#include "../common/math.h"
12-
#include "xgboost/data.h" // MetaInfo
1312
#include "xgboost/logging.h"
1413
#include "xgboost/task.h" // ObjInfo
1514

src/objective/regression_obj.cu

Lines changed: 88 additions & 43 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/**
2-
* Copyright 2015-2024, XGBoost Contributors
2+
* Copyright 2015-2025, XGBoost Contributors
33
* \file regression_obj.cu
44
* \brief Definition of single-value regression and classification objectives.
55
* \author Tianqi Chen, Kailong Chen
@@ -9,7 +9,6 @@
99
#include <algorithm>
1010
#include <cmath>
1111
#include <cstdint> // std::int32_t
12-
#include <memory>
1312
#include <vector>
1413

1514
#include "../common/common.h"
@@ -53,54 +52,55 @@ void CheckRegInputs(MetaInfo const& info, HostDeviceVector<bst_float> const& pre
5352
CheckInitInputs(info);
5453
CHECK_EQ(info.labels.Size(), preds.Size()) << "Invalid shape of labels.";
5554
}
55+
56+
template <typename Loss>
57+
void ValidateLabel(Context const* ctx, MetaInfo const& info) {
58+
auto label = info.labels.View(ctx->Device());
59+
auto valid = ctx->DispatchDevice(
60+
[&] {
61+
return std::all_of(linalg::cbegin(label), linalg::cend(label),
62+
[](float y) -> bool { return Loss::CheckLabel(y); });
63+
},
64+
[&] {
65+
#if defined(XGBOOST_USE_CUDA)
66+
auto cuctx = ctx->CUDACtx();
67+
auto it = dh::MakeTransformIterator<bool>(
68+
thrust::make_counting_iterator(0ul), [=] XGBOOST_DEVICE(std::size_t i) -> bool {
69+
auto [m, n] = linalg::UnravelIndex(i, label.Shape());
70+
return Loss::CheckLabel(label(m, n));
71+
});
72+
return dh::Reduce(cuctx->CTP(), it, it + label.Size(), true, thrust::logical_and<>{});
73+
#else
74+
common::AssertGPUSupport();
75+
return false;
76+
#endif // defined(XGBOOST_USE_CUDA)
77+
},
78+
[&] {
79+
#if defined(XGBOOST_USE_SYCL)
80+
return sycl::linalg::Validate(ctx->Device(), label,
81+
[](float y) -> bool { return Loss::CheckLabel(y); });
82+
#else
83+
common::AssertSYCLSupport();
84+
return false;
85+
#endif // defined(XGBOOST_USE_SYCL)
86+
});
87+
if (!valid) {
88+
LOG(FATAL) << Loss::LabelErrorMsg();
89+
}
90+
}
5691
} // anonymous namespace
5792

5893
#if defined(XGBOOST_USE_CUDA)
5994
DMLC_REGISTRY_FILE_TAG(regression_obj_gpu);
6095
#endif // defined(XGBOOST_USE_CUDA)
6196

62-
63-
6497
template<typename Loss>
6598
class RegLossObj : public FitInterceptGlmLike {
6699
protected:
67100
HostDeviceVector<float> additional_input_;
68101

69102
public:
70-
void ValidateLabel(MetaInfo const& info) {
71-
auto label = info.labels.View(ctx_->Device());
72-
auto valid = ctx_->DispatchDevice(
73-
[&] {
74-
return std::all_of(linalg::cbegin(label), linalg::cend(label),
75-
[](float y) -> bool { return Loss::CheckLabel(y); });
76-
},
77-
[&] {
78-
#if defined(XGBOOST_USE_CUDA)
79-
auto cuctx = ctx_->CUDACtx();
80-
auto it = dh::MakeTransformIterator<bool>(
81-
thrust::make_counting_iterator(0ul), [=] XGBOOST_DEVICE(std::size_t i) -> bool {
82-
auto [m, n] = linalg::UnravelIndex(i, label.Shape());
83-
return Loss::CheckLabel(label(m, n));
84-
});
85-
return dh::Reduce(cuctx->CTP(), it, it + label.Size(), true, thrust::logical_and<>{});
86-
#else
87-
common::AssertGPUSupport();
88-
return false;
89-
#endif // defined(XGBOOST_USE_CUDA)
90-
},
91-
[&] {
92-
#if defined(XGBOOST_USE_SYCL)
93-
return sycl::linalg::Validate(ctx_->Device(), label,
94-
[](float y) -> bool { return Loss::CheckLabel(y); });
95-
#else
96-
common::AssertSYCLSupport();
97-
return false;
98-
#endif // defined(XGBOOST_USE_SYCL)
99-
});
100-
if (!valid) {
101-
LOG(FATAL) << Loss::LabelErrorMsg();
102-
}
103-
}
103+
104104
// 0 - scale_pos_weight, 1 - is_null_weight
105105
RegLossObj(): additional_input_(2) {}
106106

@@ -117,7 +117,7 @@ class RegLossObj : public FitInterceptGlmLike {
117117
std::int32_t iter, linalg::Matrix<GradientPair>* out_gpair) override {
118118
CheckRegInputs(info, preds);
119119
if (iter == 0) {
120-
ValidateLabel(info);
120+
ValidateLabel<Loss>(this->ctx_, info);
121121
}
122122

123123
size_t const ndata = preds.Size();
@@ -224,10 +224,6 @@ XGBOOST_REGISTER_OBJECTIVE(SquaredLossRegression, LinearSquareLoss::Name())
224224
.describe("Regression with squared error.")
225225
.set_body([]() { return new RegLossObj<LinearSquareLoss>(); });
226226

227-
XGBOOST_REGISTER_OBJECTIVE(SquareLogError, SquaredLogError::Name())
228-
.describe("Regression with root mean squared logarithmic error.")
229-
.set_body([]() { return new RegLossObj<SquaredLogError>(); });
230-
231227
XGBOOST_REGISTER_OBJECTIVE(LogisticRegression, LogisticRegression::Name())
232228
.describe("Logistic regression for probability regression task.")
233229
.set_body([]() { return new RegLossObj<LogisticRegression>(); });
@@ -253,6 +249,55 @@ XGBOOST_REGISTER_OBJECTIVE(LinearRegression, "reg:linear")
253249
return new RegLossObj<LinearSquareLoss>(); });
254250
// End deprecated
255251

252+
class SquaredLogErrorRegression : public FitIntercept {
253+
public:
254+
static auto Name() { return SquaredLogError::Name(); }
255+
256+
void Configure(Args const&) override {}
257+
[[nodiscard]] ObjInfo Task() const override { return ObjInfo::kRegression; }
258+
[[nodiscard]] bst_target_t Targets(MetaInfo const& info) const override {
259+
return std::max(static_cast<std::size_t>(1), info.labels.Shape(1));
260+
}
261+
void GetGradient(HostDeviceVector<bst_float> const& preds, const MetaInfo& info,
262+
std::int32_t iter, linalg::Matrix<GradientPair>* out_gpair) override {
263+
if (iter == 0) {
264+
ValidateLabel<SquaredLogError>(this->ctx_, info);
265+
}
266+
auto labels = info.labels.View(ctx_->Device());
267+
268+
out_gpair->SetDevice(ctx_->Device());
269+
out_gpair->Reshape(info.num_row_, this->Targets(info));
270+
auto gpair = out_gpair->View(ctx_->Device());
271+
272+
preds.SetDevice(ctx_->Device());
273+
auto predt = linalg::MakeTensorView(ctx_, &preds, info.num_row_, this->Targets(info));
274+
275+
info.weights_.SetDevice(ctx_->Device());
276+
common::OptionalWeights weight{ctx_->IsCPU() ? info.weights_.ConstHostSpan()
277+
: info.weights_.ConstDeviceSpan()};
278+
linalg::ElementWiseKernel(this->ctx_, labels,
279+
[=] XGBOOST_DEVICE(std::size_t i, std::size_t j) mutable {
280+
auto p = predt(i, j);
281+
auto y = labels(i, j);
282+
auto w = weight[i];
283+
auto grad = SquaredLogError::FirstOrderGradient(p, y);
284+
auto hess = SquaredLogError::SecondOrderGradient(p, y);
285+
gpair(i, j) = {grad * w, hess * w};
286+
});
287+
}
288+
[[nodiscard]] const char* DefaultEvalMetric() const override { return "rmsle"; }
289+
290+
void SaveConfig(Json* p_out) const override {
291+
auto& out = *p_out;
292+
out["name"] = String(Name());
293+
}
294+
void LoadConfig(Json const&) override {}
295+
};
296+
297+
XGBOOST_REGISTER_OBJECTIVE(SquaredLogErrorRegression, SquaredLogErrorRegression::Name())
298+
.describe("Root mean squared log error.")
299+
.set_body([]() { return new SquaredLogErrorRegression(); });
300+
256301
class PseudoHuberRegression : public FitIntercept {
257302
PesudoHuberParam param_;
258303

0 commit comments

Comments
 (0)