xgboost/tests/cpp/tree/test_prediction_cache.cc
Jiaming Yuan fdf533f2b9
[POC] Experimental support for l1 error. (#7812)
Support adaptive trees, a feature supported by both sklearn and lightgbm. After a tree is constructed, its leaf values are recomputed from the residuals between labels and predictions.

For l1 error, the optimal leaf value is the median (50th percentile) of the residuals.
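A minimal sketch of that recomputation for a single leaf (illustrative only; MedianResidual is a hypothetical helper, not an XGBoost API):

#include <algorithm>
#include <cassert>
#include <vector>

// Returns a minimizer of sum_i |r_i - v| over the leaf's residuals
// r_i = y_i - p_i.  For an even count this picks the upper median; any
// value between the two middle elements minimizes the l1 error equally.
float MedianResidual(std::vector<float> residuals) {
  assert(!residuals.empty());
  auto mid = residuals.begin() + residuals.size() / 2;
  std::nth_element(residuals.begin(), mid, residuals.end());
  return *mid;
}

int main() {
  // Residuals of a five-row leaf; the recomputed leaf value is the median, 0.3.
  std::vector<float> residuals{0.9f, -0.2f, 0.3f, 0.1f, 0.7f};
  return MedianResidual(residuals) == 0.3f ? 0 : 1;
}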

This is marked as experimental for the following reasons:
- The value is not well defined for distributed training, where a leaf may be empty on some local workers. For now, such workers contribute the original leaf value to the average across workers, which can introduce significant error (see the sketch after this list).
- Follow-ups are required for the exact tree method, the pruner, and an optimized quantile function. The initial estimation also still needs to be computed.
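A single-process sketch of the averaging fallback from the first bullet (hypothetical code, not XGBoost's implementation):

#include <iostream>
#include <optional>
#include <vector>

int main() {
  float const original_leaf = 0.5f;  // leaf value before recomputation
  // Per-worker recomputed medians; nullopt marks a locally empty leaf.
  std::vector<std::optional<float>> worker_values{0.2f, std::nullopt, 0.3f};

  float sum = 0.0f;
  for (auto const &v : worker_values) {
    // An empty leaf falls back to the original value, so the average can
    // drift away from the true global median; this is the error source
    // noted above.
    sum += v.value_or(original_leaf);
  }
  std::cout << "averaged leaf value: " << sum / worker_values.size() << "\n";
}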
2022-04-26 21:41:55 +08:00


/*!
 * Copyright 2021-2022 by XGBoost contributors
 */
#include <gtest/gtest.h>
#include <xgboost/host_device_vector.h>
#include <xgboost/tree_updater.h>

#include <memory>

#include "../helpers.h"
namespace xgboost {

class TestPredictionCache : public ::testing::Test {
  std::shared_ptr<DMatrix> Xy_;
  size_t n_samples_{2048};

 protected:
  void SetUp() override {
    size_t n_features = 13;
    Xy_ = RandomDataGenerator{n_samples_, n_features, 0}.GenerateDMatrix(true);
  }
  void RunLearnerTest(std::string updater_name, float subsample, std::string grow_policy) {
    std::unique_ptr<Learner> learner{Learner::Create({Xy_})};
    if (updater_name == "grow_gpu_hist") {
      // The GPU updater is selected through the tree_method parameter.
      learner->SetParam("tree_method", "gpu_hist");
    } else {
      learner->SetParam("updater", updater_name);
    }
    learner->SetParam("grow_policy", grow_policy);
    learner->SetParam("subsample", std::to_string(subsample));
    learner->SetParam("nthread", "0");
    learner->Configure();

    for (size_t i = 0; i < 8; ++i) {
      learner->UpdateOneIter(i, Xy_);
    }

    // Predictions served from the prediction cache filled in during training.
    HostDeviceVector<float> out_prediction_cached;
    learner->Predict(Xy_, false, &out_prediction_cached, 0, 0);

    Json model{Object()};
    learner->SaveModel(&model);

    // Predictions recomputed from scratch by a freshly loaded copy of the model.
    HostDeviceVector<float> out_prediction;
    {
      std::unique_ptr<Learner> learner{Learner::Create({Xy_})};
      learner->LoadModel(model);
      learner->Predict(Xy_, false, &out_prediction, 0, 0);
    }

    // The cached predictions must match the recomputed ones.
    auto const h_predt_cached = out_prediction_cached.ConstHostSpan();
    auto const h_predt = out_prediction.ConstHostSpan();
    ASSERT_EQ(h_predt.size(), h_predt_cached.size());
    for (size_t i = 0; i < h_predt.size(); ++i) {
      ASSERT_NEAR(h_predt[i], h_predt_cached[i], kRtEps);
    }
  }
  void RunTest(std::string updater_name) {
    {
      // Drive the updater directly, with a context whose thread count
      // differs from the global OpenMP setting.
      omp_set_num_threads(1);
      GenericParameter ctx;
      ctx.InitAllowUnknown(Args{{"nthread", "8"}});
      if (updater_name == "grow_gpu_hist") {
        ctx.gpu_id = 0;
      } else {
        ctx.gpu_id = GenericParameter::kCpuId;
      }

      std::unique_ptr<TreeUpdater> updater{
          TreeUpdater::Create(updater_name, &ctx, ObjInfo{ObjInfo::kRegression})};
      RegTree tree;
      std::vector<RegTree *> trees{&tree};
      auto gpair = GenerateRandomGradients(n_samples_);
      updater->Configure(Args{{"max_bin", "64"}});
      std::vector<HostDeviceVector<bst_node_t>> position(1);
      updater->Update(&gpair, Xy_.get(), position, trees);

      HostDeviceVector<float> out_prediction_cached;
      out_prediction_cached.SetDevice(ctx.gpu_id);
      out_prediction_cached.Resize(n_samples_);
      auto cache =
          linalg::VectorView<float>{ctx.gpu_id == GenericParameter::kCpuId
                                        ? out_prediction_cached.HostSpan()
                                        : out_prediction_cached.DeviceSpan(),
                                    {out_prediction_cached.Size()},
                                    ctx.gpu_id};
      ASSERT_TRUE(updater->UpdatePredictionCache(Xy_.get(), cache));
    }

    for (auto policy : {"depthwise", "lossguide"}) {
      for (auto subsample : {1.0f, 0.4f}) {
        // Run each configuration twice.
        this->RunLearnerTest(updater_name, subsample, policy);
        this->RunLearnerTest(updater_name, subsample, policy);
      }
    }
  }
};

TEST_F(TestPredictionCache, Approx) { this->RunTest("grow_histmaker"); }

TEST_F(TestPredictionCache, Hist) { this->RunTest("grow_quantile_histmaker"); }

#if defined(XGBOOST_USE_CUDA)
TEST_F(TestPredictionCache, GpuHist) { this->RunTest("grow_gpu_hist"); }
#endif  // defined(XGBOOST_USE_CUDA)
}  // namespace xgboost