/**
 * Copyright 2014-2024, XGBoost Contributors
 * \file learner.cc
 * \brief Implementation of learning algorithm.
 * \author Tianqi Chen
 */
#include "xgboost/learner.h"

#include <dmlc/io.h>            // for Stream
#include <dmlc/parameter.h>     // for FieldEntry, DMLC_DECLARE_FIELD, Parameter, DMLC...
#include <dmlc/thread_local.h>  // for ThreadLocalStore

#include <algorithm>      // for equal, max, transform, sort, find_if, all_of
#include <array>          // for array
#include <atomic>         // for atomic
#include <cctype>         // for isalpha, isspace
#include <cmath>          // for isnan, isinf
#include <cstdint>        // for int32_t, uint32_t, int64_t, uint64_t
#include <cstdlib>        // for atoi
#include <cstring>        // for memcpy, size_t, memset
#include <iomanip>        // for operator<<, setiosflags
#include <iterator>       // for back_insert_iterator, distance, back_inserter
#include <limits>         // for numeric_limits
#include <memory>         // for allocator, unique_ptr, shared_ptr, operator==
#include <mutex>          // for mutex, lock_guard
#include <set>            // for set
#include <sstream>        // for operator<<, basic_ostream, basic_ostream::opera...
#include <stack>          // for stack
#include <string>         // for basic_string, char_traits, operator<, string
#include <system_error>   // for errc
#include <tuple>          // for get
#include <unordered_map>  // for operator!=, unordered_map
#include <utility>        // for pair, as_const, move, swap
#include <vector>         // for vector

#include "collective/aggregator.h"        // for ApplyWithLabels
#include "collective/communicator-inl.h"  // for Allreduce, Broadcast, GetRank, IsDistributed
#include "collective/communicator.h"      // for Operation
#include "common/api_entry.h"             // for XGBAPIThreadLocalEntry
#include "common/charconv.h"              // for to_chars, to_chars_result, NumericLimits, from_...
#include "common/common.h"                // for ToString, Split
#include "common/error_msg.h"             // for MaxFeatureSize, WarnOldSerialization, ...
#include "common/io.h"                    // for PeekableInStream, ReadAll, FixedSizeStream, Mem...
#include "common/observer.h"              // for TrainingObserver
#include "common/random.h"                // for GlobalRandom
#include "common/timer.h"                 // for Monitor
#include "common/version.h"               // for Version
#include "dmlc/endian.h"                  // for ByteSwap, DMLC_IO_NO_ENDIAN_SWAP
#include "xgboost/base.h"                 // for Args, bst_float, GradientPair, bst_feature_t, ...
#include "xgboost/context.h"              // for Context
#include "xgboost/data.h"                 // for DMatrix, MetaInfo
#include "xgboost/gbm.h"                  // for GradientBooster
#include "xgboost/global_config.h"        // for GlobalConfiguration, GlobalConfigThreadLocalStore
#include "xgboost/host_device_vector.h"   // for HostDeviceVector
#include "xgboost/json.h"                 // for Json, get, Object, String, IsA, Array, ToJson
#include "xgboost/linalg.h"               // for Tensor, TensorView
#include "xgboost/logging.h"              // for CHECK, LOG, CHECK_EQ
#include "xgboost/metric.h"               // for Metric
#include "xgboost/objective.h"            // for ObjFunction
#include "xgboost/parameter.h"            // for DECLARE_FIELD_ENUM_CLASS, XGBoostParameter
#include "xgboost/predictor.h"            // for PredictionContainer, PredictionCacheEntry
#include "xgboost/string_view.h"          // for operator<<, StringView
#include "xgboost/task.h"                 // for ObjInfo

namespace {
const char* kMaxDeltaStepDefaultValue = "0.7";
}  // anonymous namespace

DECLARE_FIELD_ENUM_CLASS(xgboost::MultiStrategy);

namespace xgboost {
Learner::~Learner() = default;
namespace {
StringView ModelNotFitted() { return "Model is not yet initialized (not fitted)."; }

template <typename T>
T& UsePtr(T& ptr) {  // NOLINT
  CHECK(ptr);
  return ptr;
}
}  // anonymous namespace

/*! \brief training parameter for regression
 *
 * Should be deprecated, but still used for being compatible with binary IO.
 * Once it's gone, `LearnerModelParam` should handle transforming `base_margin`
 * with objective by itself.
 */
struct LearnerModelParamLegacy : public dmlc::Parameter<LearnerModelParamLegacy> {
  /* \brief global bias */
  bst_float base_score;
  /* \brief number of features */
  bst_feature_t num_feature;
  /* \brief number of classes, if it is multi-class classification */
  std::int32_t num_class;
  /*! \brief Model contains additional properties */
  int32_t contain_extra_attrs;
  /*! \brief Model contains eval metrics */
  int32_t contain_eval_metrics;
  /*! \brief the version of XGBoost. */
  std::uint32_t major_version;
  std::uint32_t minor_version;
  /**
   * \brief Number of target variables.
   */
  bst_target_t num_target;
  /**
   * \brief Whether we should calculate the base score from training data.
   *
   * This is a private parameter as we can't expose it as a boolean due to the binary
   * model format. Exposing it as an integer creates inconsistency with other parameters.
   *
   * Automatically disabled when base_score is specified by the user. int32 is used
   * instead of bool for the ease of serialization.
   */
  std::int32_t boost_from_average{true};
  /*! \brief reserved field */
  int reserved[25];
  /*! \brief constructor */
  LearnerModelParamLegacy() {
    std::memset(this, 0, sizeof(LearnerModelParamLegacy));
    base_score = ObjFunction::DefaultBaseScore();
    num_target = 1;
    major_version = std::get<0>(Version::Self());
    minor_version = std::get<1>(Version::Self());
    boost_from_average = true;
    static_assert(sizeof(LearnerModelParamLegacy) == 136,
                  "Do not change the size of this struct, as it will break binary IO.");
  }
  // Skip other legacy fields.
  [[nodiscard]] Json ToJson() const {
    Json obj{Object{}};
    char floats[NumericLimits<float>::kToCharsSize];
    auto ret = to_chars(floats, floats + NumericLimits<float>::kToCharsSize, base_score);
    CHECK(ret.ec == std::errc{});
    obj["base_score"] = std::string{floats, static_cast<size_t>(std::distance(floats, ret.ptr))};

    char integers[NumericLimits<std::int64_t>::kToCharsSize];
    ret = to_chars(integers, integers + NumericLimits<std::int64_t>::kToCharsSize,
                   static_cast<std::int64_t>(num_feature));
    CHECK(ret.ec == std::errc());
    obj["num_feature"] =
        std::string{integers, static_cast<size_t>(std::distance(integers, ret.ptr))};
    ret = to_chars(integers, integers + NumericLimits<std::int64_t>::kToCharsSize,
                   static_cast<std::int64_t>(num_class));
    CHECK(ret.ec == std::errc());
    obj["num_class"] = std::string{integers, static_cast<size_t>(std::distance(integers, ret.ptr))};

    ret = to_chars(integers, integers + NumericLimits<std::int64_t>::kToCharsSize,
                   static_cast<std::int64_t>(num_target));
    obj["num_target"] =
        std::string{integers, static_cast<size_t>(std::distance(integers, ret.ptr))};

    ret = to_chars(integers, integers + NumericLimits<std::int64_t>::kToCharsSize,
                   static_cast<std::int64_t>(boost_from_average));
    obj["boost_from_average"] =
        std::string{integers, static_cast<size_t>(std::distance(integers, ret.ptr))};
    return obj;
  }
  void FromJson(Json const& obj) {
    auto const& j_param = get<Object const>(obj);
    std::map<std::string, std::string> m;
    m["num_feature"] = get<String const>(j_param.at("num_feature"));
    m["num_class"] = get<String const>(j_param.at("num_class"));
    auto n_targets_it = j_param.find("num_target");
    if (n_targets_it != j_param.cend()) {
      m["num_target"] = get<String const>(n_targets_it->second);
    }
    auto bse_it = j_param.find("boost_from_average");
    if (bse_it != j_param.cend()) {
      m["boost_from_average"] = get<String const>(bse_it->second);
    }

    this->Init(m);

    std::string str = get<String const>(j_param.at("base_score"));
    from_chars(str.c_str(), str.c_str() + str.size(), base_score);
  }
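  /**
   * Why the string round trip above: dumping `base_score` as a shortest-exact decimal
   * string and parsing it back avoids precision loss across JSON IO. A minimal sketch of
   * the idea (illustrative only; it reuses the 3-argument `from_chars` overload from
   * common/charconv.h used in `FromJson`):
   * \code
   *   char buf[NumericLimits<float>::kToCharsSize];
   *   auto res = to_chars(buf, buf + sizeof(buf), 0.1f);
   *   CHECK(res.ec == std::errc{});
   *   float restored{0};
   *   from_chars(buf, res.ptr, restored);
   *   CHECK_EQ(restored, 0.1f);  // bit-exact round trip
   * \endcode
   */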
  [[nodiscard]] LearnerModelParamLegacy ByteSwap() const {
    LearnerModelParamLegacy x = *this;
    dmlc::ByteSwap(&x.base_score, sizeof(x.base_score), 1);
    dmlc::ByteSwap(&x.num_feature, sizeof(x.num_feature), 1);
    dmlc::ByteSwap(&x.num_class, sizeof(x.num_class), 1);
    dmlc::ByteSwap(&x.contain_extra_attrs, sizeof(x.contain_extra_attrs), 1);
    dmlc::ByteSwap(&x.contain_eval_metrics, sizeof(x.contain_eval_metrics), 1);
    dmlc::ByteSwap(&x.major_version, sizeof(x.major_version), 1);
    dmlc::ByteSwap(&x.minor_version, sizeof(x.minor_version), 1);
    dmlc::ByteSwap(&x.num_target, sizeof(x.num_target), 1);
    dmlc::ByteSwap(&x.boost_from_average, sizeof(x.boost_from_average), 1);
    dmlc::ByteSwap(x.reserved, sizeof(x.reserved[0]), sizeof(x.reserved) / sizeof(x.reserved[0]));
    return x;
  }

  template <typename Container>
  Args UpdateAllowUnknown(Container const& kwargs) {
    // Detect whether the user has set their own base score.
    auto find_key = [&kwargs](char const* key) {
      return std::find_if(kwargs.cbegin(), kwargs.cend(),
                          [key](auto const& kv) { return kv.first == key; });
    };
    auto it = find_key("base_score");
    if (it != kwargs.cend()) {
      boost_from_average = false;
    }
    return dmlc::Parameter<LearnerModelParamLegacy>::UpdateAllowUnknown(kwargs);
  }

  // sanity check
  void Validate(Context const*) {
    if (!collective::IsDistributed()) {
      return;
    }

    std::array<std::int32_t, 6> data;
    std::size_t pos{0};
    std::memcpy(data.data() + pos, &base_score, sizeof(base_score));
    pos += 1;
    std::memcpy(data.data() + pos, &num_feature, sizeof(num_feature));
    pos += 1;
    std::memcpy(data.data() + pos, &num_class, sizeof(num_class));
    pos += 1;
    std::memcpy(data.data() + pos, &num_target, sizeof(num_target));
    pos += 1;
    std::memcpy(data.data() + pos, &major_version, sizeof(major_version));
    pos += 1;
    std::memcpy(data.data() + pos, &minor_version, sizeof(minor_version));

    std::array<std::int32_t, 6> sync;
    std::copy(data.cbegin(), data.cend(), sync.begin());
    collective::Broadcast(sync.data(), sync.size(), 0);
    CHECK(std::equal(data.cbegin(), data.cend(), sync.cbegin()))
        << "Different model parameter across workers.";
  }

  // declare parameters
  DMLC_DECLARE_PARAMETER(LearnerModelParamLegacy) {
    DMLC_DECLARE_FIELD(base_score)
        .set_default(ObjFunction::DefaultBaseScore())
        .describe("Global bias of the model.");
    DMLC_DECLARE_FIELD(num_feature)
        .set_default(0)
        .describe(
            "Number of features in training data; this parameter will be automatically "
            "detected by the learner.");
    DMLC_DECLARE_FIELD(num_class).set_default(0).set_lower_bound(0).describe(
        "Number of classes for multi-class classification. By default it equals 0 and "
        "corresponds to a binary classifier.");
    DMLC_DECLARE_FIELD(num_target)
        .set_default(1)
        .set_lower_bound(1)
        .describe("Number of output targets. Can be set automatically if not specified.");
    DMLC_DECLARE_FIELD(boost_from_average)
        .set_default(true)
        .describe("Whether we should calculate the base score from training data.");
  }
};
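/**
 * Note on `LearnerModelParamLegacy::UpdateAllowUnknown` above: an explicitly supplied
 * `base_score` flips `boost_from_average` off, so a user-provided intercept is never
 * overwritten by the data-based estimate computed later in `InitBaseScore`. A hedged
 * sketch of the observable behaviour:
 * \code
 *   LearnerModelParamLegacy mparam;
 *   mparam.UpdateAllowUnknown(Args{{"base_score", "0.5"}});
 *   CHECK(!mparam.boost_from_average);  // the user value wins over estimation
 * \endcode
 */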
LearnerModelParam::LearnerModelParam(LearnerModelParamLegacy const& user_param, ObjInfo t,
                                     MultiStrategy multi_strategy)
    : num_feature{user_param.num_feature},
      num_output_group{
          std::max(static_cast<bst_target_t>(user_param.num_class), user_param.num_target)},
      task{t},
      multi_strategy{multi_strategy} {
  if (user_param.num_class > 1 && user_param.num_target > 1) {
    LOG(FATAL) << "multi-target-multi-class is not yet supported. Output classes:"
               << user_param.num_class << ", output targets:" << user_param.num_target;
  }
}

LearnerModelParam::LearnerModelParam(Context const* ctx, LearnerModelParamLegacy const& user_param,
                                     linalg::Tensor<float, 1> base_margin, ObjInfo t,
                                     MultiStrategy multi_strategy)
    : LearnerModelParam{user_param, t, multi_strategy} {
  std::swap(base_score_, base_margin);
  // Make sure read access everywhere for thread-safe prediction.
  std::as_const(base_score_).HostView();
  if (ctx->IsCUDA()) {
    std::as_const(base_score_).View(ctx->Device());
  }
  CHECK(std::as_const(base_score_).Data()->HostCanRead());
}

linalg::TensorView<float const, 1> LearnerModelParam::BaseScore(DeviceOrd device) const {
  // multi-class is not yet supported.
  CHECK_EQ(base_score_.Size(), 1) << ModelNotFitted();
  if (!device.IsCUDA()) {
    // Make sure that we won't run into race condition.
    CHECK(base_score_.Data()->HostCanRead());
    return base_score_.HostView();
  }
  // Make sure that we won't run into race condition.
  CHECK(base_score_.Data()->DeviceCanRead());
  auto v = base_score_.View(device);
  CHECK(base_score_.Data()->HostCanRead());  // make sure read access is not removed.
  return v;
}

linalg::TensorView<float const, 1> LearnerModelParam::BaseScore(Context const* ctx) const {
  return this->BaseScore(ctx->Device());
}

void LearnerModelParam::Copy(LearnerModelParam const& that) {
  base_score_.Reshape(that.base_score_.Shape());
  base_score_.Data()->SetDevice(that.base_score_.Device());
  base_score_.Data()->Copy(*that.base_score_.Data());
  std::as_const(base_score_).HostView();
  if (!that.base_score_.Device().IsCPU()) {
    std::as_const(base_score_).View(that.base_score_.Device());
  }
  CHECK_EQ(base_score_.Data()->DeviceCanRead(), that.base_score_.Data()->DeviceCanRead());
  CHECK(base_score_.Data()->HostCanRead());

  num_feature = that.num_feature;
  num_output_group = that.num_output_group;
  task = that.task;
  multi_strategy = that.multi_strategy;
}

struct LearnerTrainParam : public XGBoostParameter<LearnerTrainParam> {
  // flag to disable default metric
  bool disable_default_eval_metric{false};
  // FIXME(trivialfis): The following parameters belong to the model itself, but can be
  // specified by users. Move them to model parameters once we can get rid of binary IO.
  std::string booster;
  std::string objective;
  // This is a training parameter and is not saved (nor loaded) in the model.
  MultiStrategy multi_strategy{MultiStrategy::kOneOutputPerTree};

  // declare parameters
  DMLC_DECLARE_PARAMETER(LearnerTrainParam) {
    DMLC_DECLARE_FIELD(disable_default_eval_metric)
        .set_default(false)
        .describe("Flag to disable the default metric.");
    DMLC_DECLARE_FIELD(booster).set_default("gbtree").describe(
        "Gradient booster used for training.");
    DMLC_DECLARE_FIELD(objective)
        .set_default("reg:squarederror")
        .describe("Objective function used for obtaining gradient.");
    DMLC_DECLARE_FIELD(multi_strategy)
        .add_enum("one_output_per_tree", MultiStrategy::kOneOutputPerTree)
        .add_enum("multi_output_tree", MultiStrategy::kMultiOutputTree)
        .set_default(MultiStrategy::kOneOutputPerTree)
        .describe(
            "Strategy used for training multi-target models. `multi_output_tree` means "
            "building one single tree for all targets.");
  }
};

DMLC_REGISTER_PARAMETER(LearnerModelParamLegacy);
DMLC_REGISTER_PARAMETER(LearnerTrainParam);

using LearnerAPIThreadLocalStore =
    dmlc::ThreadLocalStore<std::map<Learner const*, XGBAPIThreadLocalEntry>>;
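/**
 * `multi_strategy` above is a pure training parameter: it is consumed by the learner but
 * never stored in the model file. A sketch of how it typically reaches
 * `LearnerTrainParam` through the public interface (illustrative; `p_train` stands for
 * any std::shared_ptr<DMatrix>):
 * \code
 *   std::unique_ptr<Learner> learner{Learner::Create({p_train})};
 *   learner->SetParam("multi_strategy", "multi_output_tree");
 *   learner->Configure();  // the string is parsed into the enum declared above
 * \endcode
 */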
class LearnerConfiguration : public Learner {
 private:
  std::mutex config_lock_;

 protected:
  static std::string const kEvalMetric;  // NOLINT

 protected:
  std::atomic<bool> need_configuration_;
  std::map<std::string, std::string> cfg_;
  // Stores information like best-iteration for early stopping.
  std::map<std::string, std::string> attributes_;
  // Name of each feature, usually set from DMatrix.
  std::vector<std::string> feature_names_;
  // Type of each feature, usually set from DMatrix.
  std::vector<std::string> feature_types_;

  common::Monitor monitor_;
  LearnerModelParamLegacy mparam_;
  LearnerModelParam learner_model_param_;
  LearnerTrainParam tparam_;
  // Initial prediction.
  PredictionContainer prediction_container_;
  std::vector<std::string> metric_names_;

  void ConfigureModelParamWithoutBaseScore() {
    // Convert mparam to learner_model_param
    this->ConfigureTargets();

    auto task = UsePtr(obj_)->Task();
    linalg::Tensor<float, 1> base_score({1}, Ctx()->Device());
    auto h_base_score = base_score.HostView();

    // transform to margin
    h_base_score(0) = obj_->ProbToMargin(mparam_.base_score);
    CHECK(tparam_.GetInitialised());
    // move it to model param, which is shared with all other components.
    learner_model_param_ =
        LearnerModelParam(Ctx(), mparam_, std::move(base_score), task, tparam_.multi_strategy);
    CHECK(learner_model_param_.Initialized());
    CHECK_NE(learner_model_param_.BaseScore(Ctx()).Size(), 0);
  }
  /**
   * \brief Calculate the `base_score` based on input data.
   *
   * \param p_fmat The training DMatrix used to estimate the base score.
   */
  void InitBaseScore(DMatrix const* p_fmat) {
    // Before 1.0.0, we save `base_score` into binary as a transformed value by objective.
    // After 1.0.0 we save the value provided by the user and keep it immutable instead. To
    // keep the stability, we initialize it in binary LoadModel instead of configuration.
    // Under what condition should we omit the transformation:
    //
    // - base_score is loaded from old binary model.
    //
    // What are the other possible conditions:
    //
    // - model loaded from new binary or JSON.
    // - model is created from scratch.
    // - model is configured a second time due to a change of parameter.
    if (!learner_model_param_.Initialized()) {
      this->ConfigureModelParamWithoutBaseScore();
    }
    if (mparam_.boost_from_average && !UsePtr(gbm_)->ModelFitted()) {
      if (p_fmat) {
        auto const& info = p_fmat->Info();
        info.Validate(Ctx()->Device());
        // We estimate it from input data.
        linalg::Tensor<float, 1> base_score;
        InitEstimation(info, &base_score);
        CHECK_EQ(base_score.Size(), 1);
        mparam_.base_score = base_score(0);
        CHECK(!std::isnan(mparam_.base_score));
      }
      // Update the shared model parameter
      this->ConfigureModelParamWithoutBaseScore();
      mparam_.Validate(&ctx_);
    }
    CHECK(!std::isnan(mparam_.base_score));
    CHECK(!std::isinf(mparam_.base_score));
  }

 public:
  explicit LearnerConfiguration(std::vector<std::shared_ptr<DMatrix>> cache)
      : need_configuration_{true} {
    monitor_.Init("Learner");
    for (std::shared_ptr<DMatrix> const& d : cache) {
      if (d) {
        prediction_container_.Cache(d, DeviceOrd::CPU());
      }
    }
  }
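  /**
   * How the two methods above interact: `InitBaseScore` estimates the intercept only when
   * `boost_from_average` is on and no tree has been committed yet, then re-runs
   * `ConfigureModelParamWithoutBaseScore` to publish the result. Observable behaviour in
   * a sketch (illustrative; `p_train` is a placeholder training DMatrix):
   * \code
   *   learner->Configure();
   *   learner->UpdateOneIter(0, p_train);  // first round triggers InitBaseScore(p_train)
   *   // Later rounds keep the estimated intercept: gbm_->ModelFitted() is now true.
   * \endcode
   */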
  // Configuration before data is known.
  void Configure() override {
    // Variant of double-checked locking
    if (!this->need_configuration_) {
      return;
    }
    std::lock_guard<std::mutex> guard(config_lock_);
    if (!this->need_configuration_) {
      return;
    }

    monitor_.Start("Configure");
    auto old_tparam = tparam_;
    Args args = {cfg_.cbegin(), cfg_.cend()};

    tparam_.UpdateAllowUnknown(args);
    mparam_.UpdateAllowUnknown(args);

    auto initialized = ctx_.GetInitialised();
    auto old_seed = ctx_.seed;
    ctx_.UpdateAllowUnknown(args);

    ConsoleLogger::Configure(args);

    // set seed only before the model is initialized
    if (!initialized || ctx_.seed != old_seed) {
      common::GlobalRandom().seed(ctx_.seed);
    }

    // must precede configure gbm since num_features is required for gbm
    this->ConfigureNumFeatures();
    args = {cfg_.cbegin(), cfg_.cend()};  // renew
    this->ConfigureObjective(old_tparam, &args);

    learner_model_param_.task = obj_->Task();  // required by gbm configuration.
    this->ConfigureGBM(old_tparam, args);
    ctx_.ConfigureGpuId(this->gbm_->UseGPU());
    this->ConfigureModelParamWithoutBaseScore();

    this->ConfigureMetrics(args);

    this->need_configuration_ = false;
    if (ctx_.validate_parameters) {
      this->ValidateParameters();
    }

    cfg_.clear();
    monitor_.Stop("Configure");
  }

  void CheckModelInitialized() const {
    CHECK(learner_model_param_.Initialized()) << ModelNotFitted();
    CHECK_NE(learner_model_param_.BaseScore(this->Ctx()).Size(), 0) << ModelNotFitted();
  }
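  /**
   * `Configure` above is a variant of double-checked locking: the atomic
   * `need_configuration_` is tested once without the lock (cheap fast path) and once more
   * under `config_lock_`, so that exactly one thread performs the work. The pattern in
   * isolation (minimal generic sketch, not tied to this class):
   * \code
   *   std::atomic<bool> dirty{true};
   *   std::mutex lock;
   *   auto configure_once = [&](auto&& do_configure) {
   *     if (!dirty) { return; }                // fast path, no lock taken
   *     std::lock_guard<std::mutex> guard{lock};
   *     if (!dirty) { return; }                // re-check after acquiring the lock
   *     do_configure();
   *     dirty = false;                         // publish before releasing the lock
   *   };
   * \endcode
   */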
  void LoadConfig(Json const& in) override {
    // If configuration is loaded, ensure that the model came from the same version.
    CHECK(IsA<Object>(in));
    auto origin_version = Version::Load(in);
    if (std::get<0>(Version::kInvalid) == std::get<0>(origin_version)) {
      LOG(WARNING) << "Invalid version string in config";
    }
    if (!Version::Same(origin_version)) {
      error::WarnOldSerialization();
      return;  // skip configuration if the version does not match
    }

    auto const& learner_parameters = get<Object>(in["learner"]);
    FromJson(learner_parameters.at("learner_train_param"), &tparam_);

    auto const& gradient_booster = learner_parameters.at("gradient_booster");

    auto const& objective_fn = learner_parameters.at("objective");
    if (!obj_) {
      CHECK_EQ(get<String>(objective_fn["name"]), tparam_.objective);
      obj_.reset(ObjFunction::Create(tparam_.objective, &ctx_));
    }
    obj_->LoadConfig(objective_fn);
    learner_model_param_.task = obj_->Task();

    tparam_.booster = get<String>(gradient_booster["name"]);
    if (!gbm_) {
      gbm_.reset(GradientBooster::Create(tparam_.booster, &ctx_, &learner_model_param_));
    }
    gbm_->LoadConfig(gradient_booster);

    auto const& j_metrics = learner_parameters.at("metrics");
    auto n_metrics = get<Array const>(j_metrics).size();
    metric_names_.resize(n_metrics);
    metrics_.resize(n_metrics);
    for (size_t i = 0; i < n_metrics; ++i) {
      auto old_serialization = IsA<String>(j_metrics[i]);
      if (old_serialization) {
        error::WarnOldSerialization();
        metric_names_[i] = get<String>(j_metrics[i]);
      } else {
        metric_names_[i] = get<String>(j_metrics[i]["name"]);
      }
      metrics_[i] = std::unique_ptr<Metric>(Metric::Create(metric_names_[i], &ctx_));
      if (!old_serialization) {
        metrics_[i]->LoadConfig(j_metrics[i]);
      }
    }

    FromJson(learner_parameters.at("generic_param"), &ctx_);
    // make sure the GPU ID is valid in the new environment before starting to configure.
    ctx_.ConfigureGpuId(false);

    this->need_configuration_ = true;
  }

  void SaveConfig(Json* p_out) const override {
    CHECK(!this->need_configuration_) << "Call Configure before saving model.";
    Version::Save(p_out);
    Json& out{*p_out};
    // parameters
    out["learner"] = Object();
    auto& learner_parameters = out["learner"];
    learner_parameters["learner_train_param"] = ToJson(tparam_);
    learner_parameters["learner_model_param"] = mparam_.ToJson();
    learner_parameters["gradient_booster"] = Object();
    auto& gradient_booster = learner_parameters["gradient_booster"];
    gbm_->SaveConfig(&gradient_booster);

    learner_parameters["objective"] = Object();
    auto& objective_fn = learner_parameters["objective"];
    obj_->SaveConfig(&objective_fn);

    std::vector<Json> metrics(metrics_.size());
    for (size_t i = 0; i < metrics_.size(); ++i) {
      metrics[i] = Object{};
      metrics_[i]->SaveConfig(&metrics[i]);
    }
    learner_parameters["metrics"] = Array(std::move(metrics));

    learner_parameters["generic_param"] = ToJson(ctx_);
  }

  void SetParam(const std::string& key, const std::string& value) override {
    this->need_configuration_ = true;
    if (key == kEvalMetric) {
      if (std::find(metric_names_.cbegin(), metric_names_.cend(), value) ==
          metric_names_.cend()) {
        metric_names_.emplace_back(value);
      }
    } else {
      cfg_[key] = value;
    }
  }
  // Shorthand for setting multiple parameters
  void SetParams(std::vector<std::pair<std::string, std::string>> const& args) override {
    for (auto const& kv : args) {
      this->SetParam(kv.first, kv.second);
    }
  }

  uint32_t GetNumFeature() const override { return learner_model_param_.num_feature; }

  void SetAttr(const std::string& key, const std::string& value) override {
    attributes_[key] = value;
    mparam_.contain_extra_attrs = 1;
  }

  bool GetAttr(const std::string& key, std::string* out) const override {
    auto it = attributes_.find(key);
    if (it == attributes_.end()) return false;
    *out = it->second;
    return true;
  }

  bool DelAttr(const std::string& key) override {
    auto it = attributes_.find(key);
    if (it == attributes_.end()) {
      return false;
    }
    attributes_.erase(it);
    return true;
  }

  void SetFeatureNames(std::vector<std::string> const& fn) override { feature_names_ = fn; }

  void GetFeatureNames(std::vector<std::string>* fn) const override { *fn = feature_names_; }

  void SetFeatureTypes(std::vector<std::string> const& ft) override {
    this->feature_types_ = ft;
  }

  void GetFeatureTypes(std::vector<std::string>* p_ft) const override {
    auto& ft = *p_ft;
    ft = this->feature_types_;
  }

  std::vector<std::string> GetAttrNames() const override {
    std::vector<std::string> out;
    for (auto const& kv : attributes_) {
      out.emplace_back(kv.first);
    }
    return out;
  }

  const std::map<std::string, std::string>& GetConfigurationArguments() const override {
    return cfg_;
  }

  Context const* Ctx() const override { return &ctx_; }
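  /**
   * `SaveConfig`/`LoadConfig` above round-trip hyper-parameters independently of the model
   * weights (`SaveModel` below carries the trees). A hedged usage sketch:
   * \code
   *   Json config{Object{}};
   *   learner->SaveConfig(&config);  // requires a configured learner
   *   std::string raw;
   *   Json::Dump(config, &raw);      // persist; reload later with Json::Load
   *   learner->LoadConfig(config);   // marks the learner for re-configuration
   * \endcode
   */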
 private:
  void ValidateParameters() {
    Json config{Object()};
    this->SaveConfig(&config);
    std::stack<Json> stack;
    stack.push(config);
    std::string const postfix{"_param"};

    auto is_parameter = [&postfix](std::string const& key) {
      return key.size() > postfix.size() &&
             std::equal(postfix.rbegin(), postfix.rend(), key.rbegin());
    };

    // Extract all parameters
    std::vector<std::string> keys;
    // First global parameters
    Json const global_config{ToJson(*GlobalConfigThreadLocalStore::Get())};
    for (auto const& items : get<Object const>(global_config)) {
      keys.emplace_back(items.first);
    }
    // Parameters in various xgboost components.
    while (!stack.empty()) {
      auto j_obj = stack.top();
      stack.pop();
      auto const& obj = get<Object const>(j_obj);

      for (auto const& kv : obj) {
        if (is_parameter(kv.first)) {
          auto parameter = get<Object const>(kv.second);
          std::transform(parameter.begin(), parameter.end(), std::back_inserter(keys),
                         [](auto const& kv) { return kv.first; });
        } else if (IsA<Object>(kv.second)) {
          stack.push(kv.second);
        } else if (IsA<Array>(kv.second)) {
          auto const& array = get<Array const>(kv.second);
          for (auto const& v : array) {
            if (IsA<Object>(v) || IsA<Array>(v)) {
              stack.push(v);
            }
          }
        }
      }
    }

    // FIXME(trivialfis): Make eval_metric a training parameter.
    keys.emplace_back(kEvalMetric);
    keys.emplace_back("num_output_group");
    keys.emplace_back("gpu_id");  // deprecated parameter.

    std::sort(keys.begin(), keys.end());

    std::vector<std::string> provided;
    for (auto const& kv : cfg_) {
      if (std::any_of(kv.first.cbegin(), kv.first.cend(),
                      [](char ch) { return std::isspace(ch); })) {
        LOG(FATAL) << "Invalid parameter \"" << kv.first << "\" contains whitespace.";
      }
      provided.push_back(kv.first);
    }
    std::sort(provided.begin(), provided.end());

    std::vector<std::string> diff;
    std::set_difference(provided.begin(), provided.end(), keys.begin(), keys.end(),
                        std::back_inserter(diff));
    if (diff.size() != 0) {
      std::stringstream ss;
      ss << "\nParameters: { ";
      for (size_t i = 0; i < diff.size() - 1; ++i) {
        ss << "\"" << diff[i] << "\", ";
      }
      ss << "\"" << diff.back() << "\"";
      ss << R"W( } are not used.
)W";
      LOG(WARNING) << ss.str();
    }
  }

  void ConfigureNumFeatures() {
    // Compute the number of global features if the parameter is not already set.
    if (mparam_.num_feature == 0) {
      // TODO(hcho3): Change num_feature to 64-bit integer
      unsigned num_feature = 0;
      for (auto const& matrix : prediction_container_.Container()) {
        CHECK(matrix.first.ptr);
        CHECK(!matrix.second.ref.expired());
        const uint64_t num_col = matrix.first.ptr->Info().num_col_;
        error::MaxFeatureSize(num_col);
        num_feature = std::max(num_feature, static_cast<unsigned>(num_col));
      }

      collective::Allreduce<collective::Operation::kMax>(&num_feature, 1);
      if (num_feature > mparam_.num_feature) {
        mparam_.num_feature = num_feature;
      }
    }
    CHECK_NE(mparam_.num_feature, 0)
        << "0 feature is supplied. Are you using the raw Booster interface?";
  }

  void ConfigureGBM(LearnerTrainParam const& old, Args const& args) {
    if (gbm_ == nullptr || old.booster != tparam_.booster) {
      gbm_.reset(GradientBooster::Create(tparam_.booster, &ctx_, &learner_model_param_));
    }
    gbm_->Configure(args);
  }
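  /**
   * `ValidateParameters` above collects every key of every `*_param` object in the saved
   * configuration and warns about user-supplied keys that match none of them. Illustrative
   * trigger (`max_dept` is a deliberate typo):
   * \code
   *   learner->SetParam("validate_parameters", "1");
   *   learner->SetParam("max_dept", "3");
   *   learner->Configure();  // logs: Parameters: { "max_dept" } are not used.
   * \endcode
   */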
  void ConfigureObjective(LearnerTrainParam const& old, Args* p_args) {
    // Once binary IO is gone, NONE of these configs will be useful.
    if (cfg_.find("num_class") != cfg_.cend() && cfg_.at("num_class") != "0" &&
        tparam_.objective != "multi:softprob") {
      cfg_["num_output_group"] = cfg_["num_class"];
      if (atoi(cfg_["num_class"].c_str()) > 1 && cfg_.count("objective") == 0) {
        tparam_.objective = "multi:softmax";
      }
    }

    if (cfg_.find("max_delta_step") == cfg_.cend() && cfg_.find("objective") != cfg_.cend() &&
        tparam_.objective == "count:poisson") {
      // max_delta_step is a duplicated parameter in Poisson regression and tree param.
      // Rename one of them once binary IO is gone.
      cfg_["max_delta_step"] = kMaxDeltaStepDefaultValue;
    }
    if (obj_ == nullptr || tparam_.objective != old.objective) {
      obj_.reset(ObjFunction::Create(tparam_.objective, &ctx_));
    }

    bool has_nc{cfg_.find("num_class") != cfg_.cend()};
    // Inject num_class into configuration.
    // FIXME(jiamingy): Remove the duplicated parameter in softmax
    cfg_["num_class"] = std::to_string(mparam_.num_class);
    auto& args = *p_args;
    args = {cfg_.cbegin(), cfg_.cend()};  // renew
    obj_->Configure(args);
    if (!has_nc) {
      cfg_.erase("num_class");
    }
  }

  void ConfigureMetrics(Args const& args) {
    for (auto const& name : metric_names_) {
      auto DupCheck = [&name](std::unique_ptr<Metric> const& m) { return m->Name() != name; };
      if (std::all_of(metrics_.begin(), metrics_.end(), DupCheck)) {
        metrics_.emplace_back(std::unique_ptr<Metric>(Metric::Create(name, &ctx_)));
        mparam_.contain_eval_metrics = 1;
      }
    }
    for (auto& p_metric : metrics_) {
      p_metric->Configure(args);
    }
  }

  /**
   * Get the number of targets from the objective function.
   */
  void ConfigureTargets() {
    CHECK(this->obj_);
    auto const& cache = prediction_container_.Container();
    bst_target_t n_targets = 1;
    for (auto const& d : cache) {
      if (n_targets == 1) {
        n_targets = this->obj_->Targets(d.first.ptr->Info());
      } else {
        auto t = this->obj_->Targets(d.first.ptr->Info());
        CHECK(n_targets == t || 1 == t) << "Inconsistent labels.";
      }
    }

    if (mparam_.num_target > 1) {
      CHECK(n_targets == 1 || n_targets == mparam_.num_target)
          << "Inconsistent configuration of num_target. Configuration result from input data:"
          << n_targets << ", configuration from parameter:" << mparam_.num_target;
    } else {
      mparam_.num_target = n_targets;
    }
  }

  void InitEstimation(MetaInfo const& info, linalg::Tensor<float, 1>* base_score) {
    base_score->Reshape(1);
    collective::ApplyWithLabels(this->Ctx(), info, base_score->Data(),
                                [&] { UsePtr(obj_)->InitEstimation(info, base_score); });
  }
};

std::string const LearnerConfiguration::kEvalMetric{"eval_metric"};  // NOLINT

class LearnerIO : public LearnerConfiguration {
 private:
  // Used to identify the offset of the JSON string when loading a memory snapshot.
  // Will be removed once JSON takes over. Right now we still load some RDS files from R.
  std::string const serialisation_header_{u8"CONFIG-offset:"};

  void ClearCaches() { this->prediction_container_ = PredictionContainer{}; }

 public:
  explicit LearnerIO(std::vector<std::shared_ptr<DMatrix>> cache) : LearnerConfiguration{cache} {}
  void LoadModel(Json const& in) override {
    CHECK(IsA<Object>(in));
    auto version = Version::Load(in);
    if (std::get<0>(version) == 1 && std::get<1>(version) < 6) {
      LOG(WARNING)
          << "Found JSON model saved before XGBoost 1.6, please save the model using the "
             "current version again. The support for old JSON model will be discontinued "
             "in XGBoost 2.3.";
    }

    auto const& learner = get<Object>(in["learner"]);
    mparam_.FromJson(learner.at("learner_model_param"));

    auto const& objective_fn = learner.at("objective");
    std::string name = get<String>(objective_fn["name"]);
    tparam_.UpdateAllowUnknown(Args{{"objective", name}});
    obj_.reset(ObjFunction::Create(name, &ctx_));
    obj_->LoadConfig(objective_fn);

    auto const& gradient_booster = learner.at("gradient_booster");
    name = get<String>(gradient_booster["name"]);
    tparam_.UpdateAllowUnknown(Args{{"booster", name}});
    gbm_.reset(GradientBooster::Create(tparam_.booster, &ctx_, &learner_model_param_));
    gbm_->LoadModel(gradient_booster);

    auto const& j_attributes = get<Object const>(learner.at("attributes"));
    attributes_.clear();
    for (auto const& kv : j_attributes) {
      attributes_[kv.first] = get<String const>(kv.second);
    }

    // feature names and types are saved in xgboost 1.4
    auto it = learner.find("feature_names");
    if (it != learner.cend()) {
      auto const& feature_names = get<Array const>(it->second);
      feature_names_.resize(feature_names.size());
      std::transform(feature_names.cbegin(), feature_names.cend(), feature_names_.begin(),
                     [](Json const& fn) { return get<String const>(fn); });
    }
    it = learner.find("feature_types");
    if (it != learner.cend()) {
      auto const& feature_types = get<Array const>(it->second);
      feature_types_.resize(feature_types.size());
      std::transform(feature_types.cbegin(), feature_types.cend(), feature_types_.begin(),
                     [](Json const& fn) { return get<String const>(fn); });
    }

    this->need_configuration_ = true;
    this->ClearCaches();
  }

  void SaveModel(Json* p_out) const override {
    CHECK(!this->need_configuration_) << "Call Configure before saving model.";
    this->CheckModelInitialized();

    Version::Save(p_out);
    Json& out{*p_out};

    out["learner"] = Object();
    auto& learner = out["learner"];
    learner["learner_model_param"] = mparam_.ToJson();
    learner["gradient_booster"] = Object();
    auto& gradient_booster = learner["gradient_booster"];
    gbm_->SaveModel(&gradient_booster);

    learner["objective"] = Object();
    auto& objective_fn = learner["objective"];
    obj_->SaveConfig(&objective_fn);

    learner["attributes"] = Object();
    for (auto const& kv : attributes_) {
      learner["attributes"][kv.first] = String(kv.second);
    }

    learner["feature_names"] = Array();
    auto& feature_names = get<Array>(learner["feature_names"]);
    for (auto const& name : feature_names_) {
      feature_names.emplace_back(name);
    }
    learner["feature_types"] = Array();
    auto& feature_types = get<Array>(learner["feature_types"]);
    for (auto const& type : feature_types_) {
      feature_types.emplace_back(type);
    }
  }
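  /**
   * Unlike `SaveConfig`, `SaveModel` above captures everything needed for inference:
   * trees, objective, attributes, and feature names/types. A minimal sketch of producing
   * a UBJSON payload with it (illustrative):
   * \code
   *   Json model{Object{}};
   *   learner->SaveModel(&model);
   *   std::vector<char> raw;
   *   Json::Dump(model, &raw, std::ios::binary);  // omit the flag for text JSON
   * \endcode
   */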
  // About to be deprecated by JSON format
  void LoadModel(dmlc::Stream* fi) override {
    ctx_.UpdateAllowUnknown(Args{});
    tparam_.Init(std::vector<std::pair<std::string, std::string>>{});

    // TODO(tqchen): mark deprecation of old format.
    common::PeekableInStream fp(fi);

    // backward compatible header check.
    std::string header;
    header.resize(4);
    if (fp.PeekRead(&header[0], 4) == 4) {
      CHECK_NE(header, "bs64") << "Base64 format is no longer supported in brick.";
      if (header == "binf") {
        CHECK_EQ(fp.Read(&header[0], 4), 4U);
      }
    }

    // FIXME(jiamingy): Move this out of the learner once the old binary model is removed.
    auto first_non_space = [&](std::string::const_iterator beg, std::string::const_iterator end) {
      for (auto i = beg; i != end; ++i) {
        if (!std::isspace(*i)) {
          return i;
        }
      }
      return end;
    };

    if (header[0] == '{') {
      // Dispatch to JSON
      auto buffer = common::ReadAll(fi, &fp);
      Json model;
      auto it = first_non_space(buffer.cbegin() + 1, buffer.cend());
      if (it != buffer.cend() && *it == '"') {
        model = Json::Load(StringView{buffer});
      } else if (it != buffer.cend() && std::isalpha(*it)) {
        model = Json::Load(StringView{buffer}, std::ios::binary);
      } else {
        LOG(FATAL) << "Invalid model format";
      }
      this->LoadModel(model);
      return;
    }

    // use the peekable reader.
    fi = &fp;
    // read parameter
    CHECK_EQ(fi->Read(&mparam_, sizeof(mparam_)), sizeof(mparam_))
        << "BoostLearner: wrong model format";
    if (!DMLC_IO_NO_ENDIAN_SWAP) {
      mparam_ = mparam_.ByteSwap();
    }
    CHECK(fi->Read(&tparam_.objective)) << "BoostLearner: wrong model format";
    CHECK(fi->Read(&tparam_.booster)) << "BoostLearner: wrong model format";

    obj_.reset(ObjFunction::Create(tparam_.objective, &ctx_));
    gbm_.reset(GradientBooster::Create(tparam_.booster, &ctx_, &learner_model_param_));
    gbm_->Load(fi);
    if (mparam_.contain_extra_attrs != 0) {
      std::vector<std::pair<std::string, std::string>> attr;
      fi->Read(&attr);
      attributes_ = std::map<std::string, std::string>(attr.begin(), attr.end());
    }
    bool warn_old_model{false};
    if (attributes_.find("count_poisson_max_delta_step") != attributes_.cend()) {
      // Loading a model from < 1.0.0; the objective is not saved.
      cfg_["max_delta_step"] = attributes_.at("count_poisson_max_delta_step");
      attributes_.erase("count_poisson_max_delta_step");
      warn_old_model = true;
    } else {
      warn_old_model = false;
    }

    if (mparam_.major_version < 1) {
      // Before 1.0.0, base_score is saved as a transformed value, and there's no version
      // attribute (saved as 0) in the model.
      std::string multi{"multi:"};
      if (!std::equal(multi.cbegin(), multi.cend(), tparam_.objective.cbegin())) {
        HostDeviceVector<float> t;
        t.HostVector().resize(1);
        t.HostVector().at(0) = mparam_.base_score;
        this->obj_->PredTransform(&t);
        auto base_score = t.HostVector().at(0);
        mparam_.base_score = base_score;
      }
      warn_old_model = true;
    }

    learner_model_param_ =
        LearnerModelParam(&ctx_, mparam_,
                          linalg::Tensor<float, 1>{{std::isnan(mparam_.base_score)
                                                        ? std::numeric_limits<float>::quiet_NaN()
                                                        : obj_->ProbToMargin(mparam_.base_score)},
                                                   {1},
                                                   DeviceOrd::CPU()},
                          obj_->Task(), tparam_.multi_strategy);

    if (attributes_.find("objective") != attributes_.cend()) {
      auto obj_str = attributes_.at("objective");
      auto j_obj = Json::Load({obj_str.c_str(), obj_str.size()});
      obj_->LoadConfig(j_obj);
      attributes_.erase("objective");
    } else {
      warn_old_model = true;
    }
    if (attributes_.find("metrics") != attributes_.cend()) {
      auto metrics_str = attributes_.at("metrics");
      std::vector<std::string> names{common::Split(metrics_str, ';')};
      attributes_.erase("metrics");
      for (auto const& n : names) {
        this->SetParam(kEvalMetric, n);
      }
    }

    if (warn_old_model) {
      LOG(WARNING) << "Loading model from XGBoost < 1.0.0, consider saving it "
                      "again for improved compatibility";
    }

    // Renew the version.
    mparam_.major_version = std::get<0>(Version::Self());
    mparam_.minor_version = std::get<1>(Version::Self());

    cfg_["num_feature"] = std::to_string(mparam_.num_feature);

    auto n = tparam_.__DICT__();
    cfg_.insert(n.cbegin(), n.cend());
    this->need_configuration_ = true;
    this->ClearCaches();
  }
  // Save the model into binary format. This code is about to be deprecated by the more
  // robust JSON serialization format.
  void SaveModel(dmlc::Stream* fo) const override {
    this->CheckModelInitialized();
    CHECK(!this->learner_model_param_.IsVectorLeaf())
        << "Please use JSON/UBJ format for model serialization with multi-output models.";

    LearnerModelParamLegacy mparam = mparam_;  // make a copy to potentially modify
    std::vector<std::pair<std::string, std::string>> extra_attr;
    mparam.contain_extra_attrs = 1;

    if (!this->feature_names_.empty() || !this->feature_types_.empty()) {
      LOG(WARNING) << "feature names and feature types are being disregarded, use JSON/UBJSON "
                      "format instead.";
    }

    {
      // Similar to JSON model IO, we save the objective.
      Json j_obj{Object()};
      obj_->SaveConfig(&j_obj);
      std::string obj_doc;
      Json::Dump(j_obj, &obj_doc);
      extra_attr.emplace_back("objective", obj_doc);
    }
    // As of 1.0.0, the JVM Package and the R Package use Save/Load model for serialization.
    // Remove this part once they are ported to use actual serialization methods.
    if (mparam.contain_eval_metrics != 0) {
      std::stringstream os;
      for (auto& ev : metrics_) {
        os << ev->Name() << ";";
      }
      extra_attr.emplace_back("metrics", os.str());
    }

    std::string header{"binf"};
    fo->Write(header.data(), 4);
    if (DMLC_IO_NO_ENDIAN_SWAP) {
      fo->Write(&mparam, sizeof(LearnerModelParamLegacy));
    } else {
      LearnerModelParamLegacy x = mparam.ByteSwap();
      fo->Write(&x, sizeof(LearnerModelParamLegacy));
    }
    fo->Write(tparam_.objective);
    fo->Write(tparam_.booster);
    gbm_->Save(fo);
    if (mparam.contain_extra_attrs != 0) {
      std::map<std::string, std::string> attr(attributes_);
      for (const auto& kv : extra_attr) {
        attr[kv.first] = kv.second;
      }
      fo->Write(std::vector<std::pair<std::string, std::string>>(attr.begin(), attr.end()));
    }
  }

  void Save(dmlc::Stream* fo) const override {
    this->CheckModelInitialized();

    Json memory_snapshot{Object()};
    memory_snapshot["Model"] = Object();
    auto& model = memory_snapshot["Model"];
    this->SaveModel(&model);
    memory_snapshot["Config"] = Object();
    auto& config = memory_snapshot["Config"];
    this->SaveConfig(&config);

    std::vector<char> stream;
    Json::Dump(memory_snapshot, &stream, std::ios::binary);
    fo->Write(stream.data(), stream.size());
  }

  void Load(dmlc::Stream* fi) override {
    common::PeekableInStream fp(fi);
    char header[2];
    fp.PeekRead(header, 2);
    if (header[0] == '{') {
      auto buffer = common::ReadAll(fi, &fp);
      Json memory_snapshot;
      if (header[1] == '"') {
        memory_snapshot = Json::Load(StringView{buffer});
        error::WarnOldSerialization();
      } else if (std::isalpha(header[1])) {
        memory_snapshot = Json::Load(StringView{buffer}, std::ios::binary);
      } else {
        LOG(FATAL) << "Invalid serialization file.";
      }
      if (IsA<Null>(memory_snapshot["Model"])) {
        // R has xgb.load that doesn't distinguish whether the configuration is saved.
        // We should migrate to use `xgb.load.raw` instead.
        this->LoadModel(memory_snapshot);
      } else {
        this->LoadModel(memory_snapshot["Model"]);
        this->LoadConfig(memory_snapshot["Config"]);
      }
    } else {
      std::string header;
      header.resize(serialisation_header_.size());
      CHECK_EQ(fp.Read(&header[0], header.size()), serialisation_header_.size());
      // Avoid printing the content of the loaded header, which might be random binary code.
      CHECK(header == serialisation_header_) << error::OldSerialization();
      int64_t sz{-1};
      CHECK_EQ(fp.Read(&sz, sizeof(sz)), sizeof(sz));
      if (!DMLC_IO_NO_ENDIAN_SWAP) {
        dmlc::ByteSwap(&sz, sizeof(sz), 1);
      }
      CHECK_GT(sz, 0);
      size_t json_offset = static_cast<size_t>(sz);
      std::string buffer;
      common::FixedSizeStream{&fp}.Take(&buffer);

      common::MemoryFixSizeBuffer binary_buf(&buffer[0], json_offset);
      this->LoadModel(&binary_buf);

      auto config = Json::Load({buffer.c_str() + json_offset, buffer.size() - json_offset});
      this->LoadConfig(config);
    }
  }
};
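/**
 * `Save`/`Load` above serialize a full memory snapshot (model + training configuration),
 * whereas `SaveModel`/`LoadModel` carry the model alone. A hedged round-trip sketch,
 * assuming the in-memory stream helper from common/io.h:
 * \code
 *   std::string buffer;
 *   common::MemoryBufferStream stream{&buffer};
 *   learner->Save(&stream);
 *   stream.Seek(0);
 *   learner->Load(&stream);  // restores both the model and the configuration
 * \endcode
 */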
/*!
 * \brief learner that performs gradient boosting for a specific objective
 * function. It does training and prediction.
 */
class LearnerImpl : public LearnerIO {
 public:
  explicit LearnerImpl(std::vector<std::shared_ptr<DMatrix>> cache) : LearnerIO{cache} {}
  ~LearnerImpl() override {
    auto local_map = LearnerAPIThreadLocalStore::Get();
    if (local_map->find(this) != local_map->cend()) {
      local_map->erase(this);
    }
  }

  std::vector<std::string> DumpModel(const FeatureMap& fmap, bool with_stats,
                                     std::string format) override {
    this->Configure();
    this->CheckModelInitialized();
    return gbm_->DumpModel(fmap, with_stats, format);
  }

  Learner* Slice(bst_layer_t begin, bst_layer_t end, bst_layer_t step,
                 bool* out_of_bound) override {
    this->Configure();
    this->CheckModelInitialized();
    CHECK_NE(this->learner_model_param_.num_feature, 0);
    CHECK_GE(begin, 0);
    auto* out_impl = new LearnerImpl({});
    out_impl->learner_model_param_.Copy(this->learner_model_param_);
    out_impl->ctx_ = this->ctx_;
    auto gbm = std::unique_ptr<GradientBooster>(GradientBooster::Create(
        this->tparam_.booster, &out_impl->ctx_, &out_impl->learner_model_param_));
    this->gbm_->Slice(begin, end, step, gbm.get(), out_of_bound);
    out_impl->gbm_ = std::move(gbm);

    Json config{Object()};
    this->SaveConfig(&config);
    out_impl->mparam_ = this->mparam_;
    out_impl->attributes_ = this->attributes_;
    out_impl->SetFeatureNames(this->feature_names_);
    out_impl->SetFeatureTypes(this->feature_types_);
    out_impl->LoadConfig(config);
    out_impl->Configure();
    CHECK_EQ(out_impl->learner_model_param_.num_feature, this->learner_model_param_.num_feature);
    CHECK_NE(out_impl->learner_model_param_.num_feature, 0);

    auto erase_attr = [&](std::string attr) {
      // Erase invalid attributes.
      auto attr_it = out_impl->attributes_.find(attr);
      if (attr_it != out_impl->attributes_.cend()) {
        out_impl->attributes_.erase(attr_it);
      }
    };
    erase_attr("best_iteration");
    erase_attr("best_score");
    return out_impl;
  }

  void UpdateOneIter(int iter, std::shared_ptr<DMatrix> train) override {
    monitor_.Start("UpdateOneIter");
    TrainingObserver::Instance().Update(iter);
    this->Configure();
    this->InitBaseScore(train.get());

    if (ctx_.seed_per_iteration) {
      common::GlobalRandom().seed(ctx_.seed * kRandSeedMagic + iter);
    }

    this->ValidateDMatrix(train.get(), true);

    auto& predt = prediction_container_.Cache(train, ctx_.Device());

    monitor_.Start("PredictRaw");
    this->PredictRaw(train.get(), &predt, true, 0, 0);
    TrainingObserver::Instance().Observe(predt.predictions, "Predictions");
    monitor_.Stop("PredictRaw");

    monitor_.Start("GetGradient");
    GetGradient(predt.predictions, train->Info(), iter, &gpair_);
    monitor_.Stop("GetGradient");
    TrainingObserver::Instance().Observe(*gpair_.Data(), "Gradients");

    gbm_->DoBoost(train.get(), &gpair_, &predt, obj_.get());
    monitor_.Stop("UpdateOneIter");
  }

  void BoostOneIter(int iter, std::shared_ptr<DMatrix> train,
                    linalg::Matrix<GradientPair>* in_gpair) override {
    monitor_.Start("BoostOneIter");
    this->Configure();

    if (ctx_.seed_per_iteration) {
      common::GlobalRandom().seed(ctx_.seed * kRandSeedMagic + iter);
    }

    this->ValidateDMatrix(train.get(), true);
    CHECK_EQ(this->learner_model_param_.OutputLength(), in_gpair->Shape(1))
        << "The number of columns in the gradient should be equal to the number of "
           "targets/classes in the model.";

    auto& predt = prediction_container_.Cache(train, ctx_.Device());
    gbm_->DoBoost(train.get(), in_gpair, &predt, obj_.get());
    monitor_.Stop("BoostOneIter");
  }
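  /**
   * Relationship of the two entry points above: `UpdateOneIter` runs a full boosting
   * round (raw prediction, gradient from the objective, then `DoBoost`), while
   * `BoostOneIter` skips the objective and consumes caller-provided gradients. A typical
   * driver loop (illustrative; `n_rounds` and `p_train` are placeholders):
   * \code
   *   for (std::int32_t iter = 0; iter < n_rounds; ++iter) {
   *     learner->UpdateOneIter(iter, p_train);
   *     LOG(CONSOLE) << learner->EvalOneIter(iter, {p_train}, {"train"});
   *   }
   * \endcode
   */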
  std::string EvalOneIter(int iter, const std::vector<std::shared_ptr<DMatrix>>& data_sets,
                          const std::vector<std::string>& data_names) override {
    monitor_.Start("EvalOneIter");
    this->Configure();
    this->CheckModelInitialized();

    std::ostringstream os;
    os.precision(std::numeric_limits<double>::max_digits10);
    os << '[' << iter << ']' << std::setiosflags(std::ios::fixed);
    if (metrics_.empty() && tparam_.disable_default_eval_metric <= 0) {
      metrics_.emplace_back(Metric::Create(obj_->DefaultEvalMetric(), &ctx_));
      auto config = obj_->DefaultMetricConfig();
      if (!IsA<Null>(config)) {
        metrics_.back()->LoadConfig(config);
      }
      metrics_.back()->Configure({cfg_.begin(), cfg_.end()});
    }

    for (size_t i = 0; i < data_sets.size(); ++i) {
      std::shared_ptr<DMatrix> m = data_sets[i];
      auto& predt = prediction_container_.Cache(m, ctx_.Device());
      this->ValidateDMatrix(m.get(), false);
      this->PredictRaw(m.get(), &predt, false, 0, 0);

      auto& out = output_predictions_.Cache(m, ctx_.Device()).predictions;
      out.Resize(predt.predictions.Size());
      out.Copy(predt.predictions);

      obj_->EvalTransform(&out);
      for (auto& ev : metrics_) {
        os << '\t' << data_names[i] << '-' << ev->Name() << ':' << ev->Evaluate(out, m);
      }
    }

    monitor_.Stop("EvalOneIter");
    return os.str();
  }

  void Predict(std::shared_ptr<DMatrix> data, bool output_margin,
               HostDeviceVector<bst_float>* out_preds, bst_layer_t layer_begin,
               bst_layer_t layer_end, bool training, bool pred_leaf, bool pred_contribs,
               bool approx_contribs, bool pred_interactions) override {
    int multiple_predictions = static_cast<int>(pred_leaf) + static_cast<int>(pred_interactions) +
                               static_cast<int>(pred_contribs);
    this->Configure();
    if (training) {
      this->InitBaseScore(nullptr);
    }
    this->CheckModelInitialized();

    CHECK_LE(multiple_predictions, 1) << "Perform one kind of prediction at a time.";
    if (pred_contribs) {
      gbm_->PredictContribution(data.get(), out_preds, layer_begin, layer_end, approx_contribs);
    } else if (pred_interactions) {
      gbm_->PredictInteractionContributions(data.get(), out_preds, layer_begin, layer_end,
                                            approx_contribs);
    } else if (pred_leaf) {
      gbm_->PredictLeaf(data.get(), out_preds, layer_begin, layer_end);
    } else {
      auto& prediction = prediction_container_.Cache(data, ctx_.Device());
      this->PredictRaw(data.get(), &prediction, training, layer_begin, layer_end);
      // Copy the prediction cache to output prediction. out_preds comes from C API
      out_preds->SetDevice(ctx_.Device());
      out_preds->Resize(prediction.predictions.Size());
      out_preds->Copy(prediction.predictions);
      if (!output_margin) {
        obj_->PredTransform(out_preds);
      }
    }
  }
  int32_t BoostedRounds() const override {
    if (!this->gbm_) {
      return 0;  // haven't called train or LoadModel.
    }
    CHECK(!this->need_configuration_);
    return this->gbm_->BoostedRounds();
  }

  uint32_t Groups() const override {
    CHECK(!this->need_configuration_);
    this->CheckModelInitialized();
    return this->learner_model_param_.num_output_group;
  }

  XGBAPIThreadLocalEntry& GetThreadLocal() const override {
    return (*LearnerAPIThreadLocalStore::Get())[this];
  }

  void InplacePredict(std::shared_ptr<DMatrix> p_m, PredictionType type, float missing,
                      HostDeviceVector<float>** out_preds, bst_layer_t iteration_begin,
                      bst_layer_t iteration_end) override {
    this->Configure();
    this->CheckModelInitialized();

    auto& out_predictions = this->GetThreadLocal().prediction_entry;
    out_predictions.Reset();
    this->gbm_->InplacePredict(p_m, missing, &out_predictions, iteration_begin, iteration_end);
    if (type == PredictionType::kValue) {
      obj_->PredTransform(&out_predictions.predictions);
    } else if (type == PredictionType::kMargin) {
      // do nothing
    } else {
      LOG(FATAL) << "Unsupported prediction type:" << static_cast<int>(type);
    }
    *out_preds = &out_predictions.predictions;
  }

  void CalcFeatureScore(std::string const& importance_type, common::Span<int32_t const> trees,
                        std::vector<bst_feature_t>* features,
                        std::vector<float>* scores) override {
    this->Configure();
    this->CheckModelInitialized();
    gbm_->FeatureScore(importance_type, trees, features, scores);
  }

  const std::map<std::string, std::string>& GetConfigurationArguments() const override {
    return cfg_;
  }

 protected:
  /*!
   * \brief get un-transformed prediction
   * \param data training data matrix
   * \param out_preds output vector that stores the prediction
   * \param training allow dropout when the DART booster is being used
   * \param layer_begin start of the boosted-layer range used for prediction
   * \param layer_end end of the boosted-layer range; 0 means using all the trees
   */
  void PredictRaw(DMatrix* data, PredictionCacheEntry* out_preds, bool training,
                  unsigned layer_begin, unsigned layer_end) const {
    CHECK(gbm_ != nullptr) << "Predict must happen after Load or configuration";
    this->CheckModelInitialized();
    this->ValidateDMatrix(data, false);
    gbm_->PredictBatch(data, out_preds, training, layer_begin, layer_end);
  }

  void ValidateDMatrix(DMatrix* p_fmat, bool is_training) const {
    MetaInfo const& info = p_fmat->Info();
    info.Validate(ctx_.Device());

    if (is_training) {
      CHECK_EQ(learner_model_param_.num_feature, p_fmat->Info().num_col_)
          << "Number of columns does not match number of features in booster.";
    } else {
      CHECK_GE(learner_model_param_.num_feature, p_fmat->Info().num_col_)
          << "Number of columns does not match number of features in booster.";
    }

    if (p_fmat->Info().num_row_ == 0) {
      error::WarnEmptyDataset();
    }
  }

 private:
  void GetGradient(HostDeviceVector<bst_float> const& preds, MetaInfo const& info,
                   std::int32_t iter, linalg::Matrix<GradientPair>* out_gpair) {
    out_gpair->Reshape(info.num_row_, this->learner_model_param_.OutputLength());
    collective::ApplyWithLabels(&ctx_, info, out_gpair->Data(),
                                [&] { obj_->GetGradient(preds, info, iter, out_gpair); });
  }

  /*! \brief random number transformation seed. */
  static int32_t constexpr kRandSeedMagic = 127;
  // gradient pairs
  linalg::Matrix<GradientPair> gpair_;
  /*! \brief Temporary storage for predictions. Useful for storing data transformed by the
   *  objective function */
  PredictionContainer output_predictions_;
};

constexpr int32_t LearnerImpl::kRandSeedMagic;

Learner* Learner::Create(const std::vector<std::shared_ptr<DMatrix>>& cache_data) {
  return new LearnerImpl(cache_data);
}
}  // namespace xgboost
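/**
 * End-to-end usage of the factory above (illustrative sketch; `p_train` is a placeholder
 * std::shared_ptr<DMatrix>, and default arguments are assumed for the trailing Predict
 * flags):
 * \code
 *   std::unique_ptr<Learner> learner{Learner::Create({p_train})};
 *   learner->SetParam("objective", "reg:squarederror");
 *   learner->Configure();
 *   learner->UpdateOneIter(0, p_train);
 *   HostDeviceVector<float> predt;
 *   learner->Predict(p_train, /*output_margin=*/false, &predt, 0, 0);
 * \endcode
 */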