/** * Copyright 2019-2023, XGBoost contributors */ #include #include #include // for HostDeviceVector #include // for Json, Object #include // for Learner #include // for numeric_limits #include // for shared_ptr #include // for optional #include // for string #include "../../../src/data/proxy_dmatrix.h" // for DMatrixProxy #include "../../../src/gbm/gbtree.h" #include "../filesystem.h" // dmlc::TemporaryDirectory #include "../helpers.h" #include "xgboost/base.h" #include "xgboost/predictor.h" namespace xgboost { TEST(GBTree, SelectTreeMethod) { size_t constexpr kCols = 10; Context ctx; LearnerModelParam mparam{MakeMP(kCols, .5, 1)}; std::unique_ptr p_gbm { GradientBooster::Create("gbtree", &ctx, &mparam)}; auto& gbtree = dynamic_cast (*p_gbm); // Test if `tree_method` can be set Args args {{"tree_method", "approx"}}; gbtree.Configure({args.cbegin(), args.cend()}); gbtree.Configure(args); auto const& tparam = gbtree.GetTrainParam(); gbtree.Configure({{"tree_method", "approx"}}); ASSERT_EQ(tparam.updater_seq, "grow_histmaker"); gbtree.Configure({{"tree_method", "exact"}}); ASSERT_EQ(tparam.updater_seq, "grow_colmaker,prune"); gbtree.Configure({{"tree_method", "hist"}}); ASSERT_EQ(tparam.updater_seq, "grow_quantile_histmaker"); gbtree.Configure({{"booster", "dart"}, {"tree_method", "hist"}}); ASSERT_EQ(tparam.updater_seq, "grow_quantile_histmaker"); #ifdef XGBOOST_USE_CUDA ctx.UpdateAllowUnknown(Args{{"gpu_id", "0"}}); gbtree.Configure({{"tree_method", "gpu_hist"}}); ASSERT_EQ(tparam.updater_seq, "grow_gpu_hist"); gbtree.Configure({{"booster", "dart"}, {"tree_method", "gpu_hist"}}); ASSERT_EQ(tparam.updater_seq, "grow_gpu_hist"); #endif // XGBOOST_USE_CUDA } TEST(GBTree, PredictionCache) { size_t constexpr kRows = 100, kCols = 10; Context ctx; LearnerModelParam mparam{MakeMP(kCols, .5, 1)}; std::unique_ptr p_gbm { GradientBooster::Create("gbtree", &ctx, &mparam)}; auto& gbtree = dynamic_cast (*p_gbm); gbtree.Configure({{"tree_method", "hist"}}); auto p_m = RandomDataGenerator{kRows, kCols, 0}.GenerateDMatrix(); linalg::Matrix gpair({kRows}, ctx.Device()); gpair.Data()->Copy(GenerateRandomGradients(kRows)); PredictionCacheEntry out_predictions; gbtree.DoBoost(p_m.get(), &gpair, &out_predictions, nullptr); gbtree.PredictBatch(p_m.get(), &out_predictions, false, 0, 0); ASSERT_EQ(1, out_predictions.version); std::vector first_iter = out_predictions.predictions.HostVector(); // Add 1 more boosted round gbtree.DoBoost(p_m.get(), &gpair, &out_predictions, nullptr); gbtree.PredictBatch(p_m.get(), &out_predictions, false, 0, 0); ASSERT_EQ(2, out_predictions.version); // Update the cache for all rounds out_predictions.version = 0; gbtree.PredictBatch(p_m.get(), &out_predictions, false, 0, 0); ASSERT_EQ(2, out_predictions.version); gbtree.DoBoost(p_m.get(), &gpair, &out_predictions, nullptr); // drop the cache. gbtree.PredictBatch(p_m.get(), &out_predictions, false, 1, 2); ASSERT_EQ(0, out_predictions.version); // half open set [1, 3) gbtree.PredictBatch(p_m.get(), &out_predictions, false, 1, 3); ASSERT_EQ(0, out_predictions.version); // iteration end gbtree.PredictBatch(p_m.get(), &out_predictions, false, 0, 2); ASSERT_EQ(2, out_predictions.version); // restart the cache when end iteration is smaller than cache version gbtree.PredictBatch(p_m.get(), &out_predictions, false, 0, 1); ASSERT_EQ(1, out_predictions.version); ASSERT_EQ(out_predictions.predictions.HostVector(), first_iter); } TEST(GBTree, WrongUpdater) { size_t constexpr kRows = 17; size_t constexpr kCols = 15; auto p_dmat = RandomDataGenerator(kRows, kCols, 0).GenerateDMatrix(); p_dmat->Info().labels.Reshape(kRows); auto learner = std::unique_ptr(Learner::Create({p_dmat})); // Hist can not be used for updating tree. learner->SetParams(Args{{"tree_method", "hist"}, {"process_type", "update"}}); ASSERT_THROW(learner->UpdateOneIter(0, p_dmat), dmlc::Error); // Prune can not be used for learning new tree. learner->SetParams( Args{{"tree_method", "prune"}, {"process_type", "default"}}); ASSERT_THROW(learner->UpdateOneIter(0, p_dmat), dmlc::Error); } #ifdef XGBOOST_USE_CUDA TEST(GBTree, ChoosePredictor) { // The test ensures data don't get pulled into device. std::size_t constexpr kRows = 17, kCols = 15; auto p_dmat = RandomDataGenerator(kRows, kCols, 0).GenerateDMatrix(); auto const& data = (*(p_dmat->GetBatches().begin())).data; p_dmat->Info().labels.Reshape(kRows); auto learner = std::unique_ptr(Learner::Create({p_dmat})); learner->SetParams(Args{{"tree_method", "gpu_hist"}, {"gpu_id", "0"}}); for (size_t i = 0; i < 4; ++i) { learner->UpdateOneIter(i, p_dmat); } ASSERT_TRUE(data.HostCanWrite()); dmlc::TemporaryDirectory tempdir; const std::string fname = tempdir.path + "/model_param.bst"; { std::unique_ptr fo(dmlc::Stream::Create(fname.c_str(), "w")); learner->Save(fo.get()); } // a new learner learner = std::unique_ptr(Learner::Create({p_dmat})); { std::unique_ptr fi(dmlc::Stream::Create(fname.c_str(), "r")); learner->Load(fi.get()); } learner->SetParams(Args{{"tree_method", "gpu_hist"}, {"gpu_id", "0"}}); for (size_t i = 0; i < 4; ++i) { learner->UpdateOneIter(i, p_dmat); } ASSERT_TRUE(data.HostCanWrite()); ASSERT_FALSE(data.DeviceCanWrite()); ASSERT_FALSE(data.DeviceCanRead()); // pull data into device. data.HostVector(); data.SetDevice(DeviceOrd::CUDA(0)); data.DeviceSpan(); ASSERT_FALSE(data.HostCanWrite()); // another new learner learner = std::unique_ptr(Learner::Create({p_dmat})); learner->SetParams(Args{{"tree_method", "gpu_hist"}, {"gpu_id", "0"}}); for (size_t i = 0; i < 4; ++i) { learner->UpdateOneIter(i, p_dmat); } // data is not pulled back into host ASSERT_FALSE(data.HostCanWrite()); } TEST(GBTree, ChooseTreeMethod) { bst_idx_t n_samples{128}; bst_feature_t n_features{64}; auto Xy = RandomDataGenerator{n_samples, n_features, 0.5f}.GenerateDMatrix(true); auto with_update = [&](std::optional device, std::optional tree_method) { auto learner = std::unique_ptr(Learner::Create({Xy})); if (tree_method.has_value()) { learner->SetParam("tree_method", tree_method.value()); } if (device.has_value()) { auto const& d = device.value(); if (std::isdigit(d.front()) || d.front() == '-') { learner->SetParam("gpu_id", d); } else { learner->SetParam("device", d); } } learner->Configure(); for (std::int32_t i = 0; i < 3; ++i) { learner->UpdateOneIter(0, Xy); } Json config{Object{}}; learner->SaveConfig(&config); auto updater = config["learner"]["gradient_booster"]["updater"]; CHECK(!IsA(updater)); return updater; }; auto with_boost = [&](std::optional device, std::optional tree_method) { auto learner = std::unique_ptr(Learner::Create({Xy})); if (tree_method.has_value()) { learner->SetParam("tree_method", tree_method.value()); } if (device.has_value()) { auto const& d = device.value(); if (std::isdigit(d.front()) || d.front() == '-') { learner->SetParam("gpu_id", d); } else { learner->SetParam("device", d); } } learner->Configure(); for (std::int32_t i = 0; i < 3; ++i) { linalg::Matrix gpair{{Xy->Info().num_row_}, DeviceOrd::CPU()}; gpair.Data()->Copy(GenerateRandomGradients(Xy->Info().num_row_)); learner->BoostOneIter(0, Xy, &gpair); } Json config{Object{}}; learner->SaveConfig(&config); auto updater = config["learner"]["gradient_booster"]["updater"]; return updater; }; // | | hist | gpu_hist | exact | NA | // |--------+---------+----------+-------+-----| // | CUDA:0 | GPU | GPU (w) | Err | GPU | // | CPU | CPU | GPU (w) | CPU | CPU | // |--------+---------+----------+-------+-----| // | -1 | CPU | GPU (w) | CPU | CPU | // | 0 | GPU | GPU (w) | Err | GPU | // |--------+---------+----------+-------+-----| // | NA | CPU | GPU (w) | CPU | CPU | // // - (w): warning // - CPU: Run on CPU. // - GPU: Run on CUDA. // - Err: Not feasible. // - NA: Parameter is not specified. // When GPU hist is specified with a CPU context, we should emit an error. However, it's // quite difficult to detect whether the CPU context is being used because it's the // default or because it's specified by the user. std::map, std::optional>, std::string> expectation{ // hist {{"hist", "-1"}, "grow_quantile_histmaker"}, {{"hist", "0"}, "grow_gpu_hist"}, {{"hist", "cpu"}, "grow_quantile_histmaker"}, {{"hist", "cuda"}, "grow_gpu_hist"}, {{"hist", "cuda:0"}, "grow_gpu_hist"}, {{"hist", std::nullopt}, "grow_quantile_histmaker"}, // gpu_hist {{"gpu_hist", "-1"}, "grow_gpu_hist"}, {{"gpu_hist", "0"}, "grow_gpu_hist"}, {{"gpu_hist", "cpu"}, "grow_gpu_hist"}, {{"gpu_hist", "cuda"}, "grow_gpu_hist"}, {{"gpu_hist", "cuda:0"}, "grow_gpu_hist"}, {{"gpu_hist", std::nullopt}, "grow_gpu_hist"}, // exact {{"exact", "-1"}, "grow_colmaker,prune"}, {{"exact", "0"}, "err"}, {{"exact", "cpu"}, "grow_colmaker,prune"}, {{"exact", "cuda"}, "err"}, {{"exact", "cuda:0"}, "err"}, {{"exact", std::nullopt}, "grow_colmaker,prune"}, // NA {{std::nullopt, "-1"}, "grow_quantile_histmaker"}, {{std::nullopt, "0"}, "grow_gpu_hist"}, // default to hist {{std::nullopt, "cpu"}, "grow_quantile_histmaker"}, {{std::nullopt, "cuda"}, "grow_gpu_hist"}, {{std::nullopt, "cuda:0"}, "grow_gpu_hist"}, {{std::nullopt, std::nullopt}, "grow_quantile_histmaker"}, }; auto run_test = [&](auto fn) { for (auto const& kv : expectation) { auto device = kv.first.second; auto tm = kv.first.first; if (kv.second == "err") { ASSERT_THROW({ fn(device, tm); }, dmlc::Error) << " device:" << device.value_or("NA") << " tm:" << tm.value_or("NA"); continue; } auto up = fn(device, tm); auto ups = get(up); auto exp_names = common::Split(kv.second, ','); ASSERT_EQ(exp_names.size(), ups.size()); for (std::size_t i = 0; i < exp_names.size(); ++i) { ASSERT_EQ(get(ups[i]["name"]), exp_names[i]) << " device:" << device.value_or("NA") << " tm:" << tm.value_or("NA"); } } }; run_test(with_update); run_test(with_boost); } #endif // XGBOOST_USE_CUDA // Some other parts of test are in `Tree.JsonIO'. TEST(GBTree, JsonIO) { size_t constexpr kRows = 16, kCols = 16; Context ctx; LearnerModelParam mparam{MakeMP(kCols, .5, 1)}; std::unique_ptr gbm{ CreateTrainedGBM("gbtree", Args{{"tree_method", "exact"}, {"default_direction", "left"}}, kRows, kCols, &mparam, &ctx)}; Json model{Object()}; model["model"] = Object(); auto j_model = model["model"]; model["config"] = Object(); auto j_config = model["config"]; gbm->SaveModel(&j_model); gbm->SaveConfig(&j_config); std::string model_str; Json::Dump(model, &model_str); model = Json::Load({model_str.c_str(), model_str.size()}); j_model = model["model"]; j_config = model["config"]; ASSERT_EQ(get(j_model["name"]), "gbtree"); auto gbtree_model = j_model["model"]; ASSERT_EQ(get(gbtree_model["trees"]).size(), 1ul); ASSERT_EQ(get(get