[sycl] add loss guided hist building (#10251)

Co-authored-by: Dmitry Razdoburdin <>
Author:    Dmitry Razdoburdin
Date:      2024-05-10 16:35:13 +02:00
Committer: GitHub
Parent:    9b465052ce
Commit:    f588252481
7 changed files with 459 additions and 30 deletions


@@ -28,16 +28,40 @@ class TestHistUpdater : public HistUpdater<GradientSumT> {
     HistUpdater<GradientSumT>::InitSampling(gpair, row_indices);
   }
 
-  const auto* TestInitData(Context const * ctx,
+  auto* TestInitData(Context const * ctx,
                      const common::GHistIndexMatrix& gmat,
                      const USMVector<GradientPair, MemoryType::on_device> &gpair,
                      const DMatrix& fmat,
                      const RegTree& tree) {
     HistUpdater<GradientSumT>::InitData(ctx, gmat, gpair, fmat, tree);
-    return &(HistUpdater<GradientSumT>::row_set_collection_.Data());
+    return &(HistUpdater<GradientSumT>::row_set_collection_);
   }
+
+  const auto* TestBuildHistogramsLossGuide(ExpandEntry entry,
+                                           const common::GHistIndexMatrix &gmat,
+                                           RegTree *p_tree,
+                                           const USMVector<GradientPair, MemoryType::on_device> &gpair) {
+    HistUpdater<GradientSumT>::BuildHistogramsLossGuide(entry, gmat, p_tree, gpair);
+    return &(HistUpdater<GradientSumT>::hist_);
+  }
 };
 
+void GenerateRandomGPairs(::sycl::queue* qu, GradientPair* gpair_ptr, size_t num_rows, bool has_neg_hess) {
+  qu->submit([&](::sycl::handler& cgh) {
+    cgh.parallel_for<>(::sycl::range<1>(::sycl::range<1>(num_rows)),
+                       [=](::sycl::item<1> pid) {
+      uint64_t i = pid.get_linear_id();
+      constexpr uint32_t seed = 777;
+      oneapi::dpl::minstd_rand engine(seed, i);
+      GradientPair::ValueT smallest_hess_val = has_neg_hess ? -1. : 0.;
+      oneapi::dpl::uniform_real_distribution<GradientPair::ValueT> distr(smallest_hess_val, 1.);
+      gpair_ptr[i] = {distr(engine), distr(engine)};
+    });
+  });
+  qu->wait();
+}
+
 template <typename GradientSumT>
 void TestHistUpdaterSampling(const xgboost::tree::TrainParam& param) {
   const size_t num_rows = 1u << 12;
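
Note on the refactor above: the per-row RNG kernel previously duplicated in the sampling and init-data tests is consolidated into the new GenerateRandomGPairs helper. Each work-item constructs its own oneapi::dpl::minstd_rand engine from a fixed seed with the row index as skip-ahead offset, so the generated gradient pairs are reproducible regardless of how work-items are scheduled. The has_neg_hess flag switches the sampling range of both components from [0, 1) to [-1, 1); the name reflects that the tests care about negative hessians, which InitData must filter out. A minimal call-site sketch (types as declared in this test file):

    USMVector<GradientPair, MemoryType::on_device> gpair(&qu, num_rows);
    GenerateRandomGPairs(&qu, gpair.Data(), num_rows, /*has_neg_hess=*/true);
    // gpair now holds num_rows (grad, hess) pairs drawn from [-1, 1)
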
@@ -60,18 +84,7 @@ void TestHistUpdaterSampling(const xgboost::tree::TrainParam& param) {
   USMVector<size_t, MemoryType::on_device> row_indices_0(&qu, num_rows);
   USMVector<size_t, MemoryType::on_device> row_indices_1(&qu, num_rows);
   USMVector<GradientPair, MemoryType::on_device> gpair(&qu, num_rows);
-  auto* gpair_ptr = gpair.Data();
-  qu.submit([&](::sycl::handler& cgh) {
-    cgh.parallel_for<>(::sycl::range<1>(::sycl::range<1>(num_rows)),
-                       [=](::sycl::item<1> pid) {
-      uint64_t i = pid.get_linear_id();
-      constexpr uint32_t seed = 777;
-      oneapi::dpl::minstd_rand engine(seed, i);
-      oneapi::dpl::uniform_real_distribution<GradientPair::ValueT> distr(-1., 1.);
-      gpair_ptr[i] = {distr(engine), distr(engine)};
-    });
-  }).wait();
+  GenerateRandomGPairs(&qu, gpair.Data(), num_rows, true);
 
   updater.TestInitSampling(gpair, &row_indices_0);
@@ -125,19 +138,7 @@ void TestHistUpdaterInitData(const xgboost::tree::TrainParam& param, bool has_ne
   TestHistUpdater<GradientSumT> updater(qu, param, std::move(pruner), int_constraints, p_fmat.get());
 
   USMVector<GradientPair, MemoryType::on_device> gpair(&qu, num_rows);
-  auto* gpair_ptr = gpair.Data();
-  qu.submit([&](::sycl::handler& cgh) {
-    cgh.parallel_for<>(::sycl::range<1>(::sycl::range<1>(num_rows)),
-                       [=](::sycl::item<1> pid) {
-      uint64_t i = pid.get_linear_id();
-      constexpr uint32_t seed = 777;
-      oneapi::dpl::minstd_rand engine(seed, i);
-      GradientPair::ValueT smallest_hess_val = has_neg_hess ? -1. : 0.;
-      oneapi::dpl::uniform_real_distribution<GradientPair::ValueT> distr(smallest_hess_val, 1.);
-      gpair_ptr[i] = {distr(engine), distr(engine)};
-    });
-  }).wait();
+  GenerateRandomGPairs(&qu, gpair.Data(), num_rows, has_neg_hess);
 
   DeviceMatrix dmat;
   dmat.Init(qu, p_fmat.get());
@@ -145,10 +146,11 @@ void TestHistUpdaterInitData(const xgboost::tree::TrainParam& param, bool has_ne
   gmat.Init(qu, &ctx, dmat, n_bins);
 
   RegTree tree;
-  const auto* row_indices = updater.TestInitData(&ctx, gmat, gpair, *p_fmat, tree);
+  auto* row_set_collection = updater.TestInitData(&ctx, gmat, gpair, *p_fmat, tree);
+  auto& row_indices = row_set_collection->Data();
 
-  std::vector<size_t> row_indices_host(row_indices->Size());
-  qu.memcpy(row_indices_host.data(), row_indices->DataConst(), row_indices->Size()*sizeof(size_t)).wait();
+  std::vector<size_t> row_indices_host(row_indices.Size());
+  qu.memcpy(row_indices_host.data(), row_indices.DataConst(), row_indices.Size()*sizeof(size_t)).wait();
 
   if (!has_neg_hess) {
     for (size_t i = 0; i < num_rows; ++i) {
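
The hunk above also changes what the test shim exposes: TestInitData now returns a pointer to the whole row_set_collection_ rather than just its flat index buffer, and callers reach the indices through row_set_collection->Data(). This is what lets the new loss-guide test in the next hunk register a split on the collection before building child histograms. A sketch of the new call pattern, with argument labels that are my reading of the AddSplit call below (hypothetical names, not the declared parameters):

    auto* row_set_collection = updater.TestInitData(&ctx, gmat, gpair, *p_fmat, tree);
    row_set_collection->AddSplit(/*node_id=*/0, /*left_id=*/1, /*right_id=*/2,
                                 /*n_left=*/42, /*n_right=*/num_rows - 42);
    const auto& row_indices = row_set_collection->Data();  // flat row-index buffer, as before
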
@@ -171,6 +173,70 @@ void TestHistUpdaterInitData(const xgboost::tree::TrainParam& param, bool has_ne
   }
 }
 
+template <typename GradientSumT>
+void TestHistUpdaterBuildHistogramsLossGuide(const xgboost::tree::TrainParam& param, float sparsity) {
+  const size_t num_rows = 1u << 8;
+  const size_t num_columns = 1;
+  const size_t n_bins = 32;
+
+  Context ctx;
+  ctx.UpdateAllowUnknown(Args{{"device", "sycl"}});
+
+  DeviceManager device_manager;
+  auto qu = device_manager.GetQueue(ctx.Device());
+  ObjInfo task{ObjInfo::kRegression};
+
+  auto p_fmat = RandomDataGenerator{num_rows, num_columns, sparsity}.GenerateDMatrix();
+
+  FeatureInteractionConstraintHost int_constraints;
+  std::unique_ptr<TreeUpdater> pruner{TreeUpdater::Create("prune", &ctx, &task)};
+
+  TestHistUpdater<GradientSumT> updater(qu, param, std::move(pruner), int_constraints, p_fmat.get());
+  updater.SetHistSynchronizer(new BatchHistSynchronizer<GradientSumT>());
+  updater.SetHistRowsAdder(new BatchHistRowsAdder<GradientSumT>());
+
+  USMVector<GradientPair, MemoryType::on_device> gpair(&qu, num_rows);
+  auto* gpair_ptr = gpair.Data();
+  GenerateRandomGPairs(&qu, gpair_ptr, num_rows, false);
+
+  DeviceMatrix dmat;
+  dmat.Init(qu, p_fmat.get());
+  common::GHistIndexMatrix gmat;
+  gmat.Init(qu, &ctx, dmat, n_bins);
+
+  RegTree tree;
+  tree.ExpandNode(0, 0, 0, false, 0, 0, 0, 0, 0, 0, 0);
+  tree.ExpandNode(tree[0].LeftChild(), 0, 0, false, 0, 0, 0, 0, 0, 0, 0);
+  tree.ExpandNode(tree[0].RightChild(), 0, 0, false, 0, 0, 0, 0, 0, 0, 0);
+
+  ExpandEntry node0(0, tree.GetDepth(0));
+  ExpandEntry node1(1, tree.GetDepth(1));
+  ExpandEntry node2(2, tree.GetDepth(2));
+
+  auto* row_set_collection = updater.TestInitData(&ctx, gmat, gpair, *p_fmat, tree);
+  row_set_collection->AddSplit(0, 1, 2, 42, num_rows - 42);
+
+  updater.TestBuildHistogramsLossGuide(node0, gmat, &tree, gpair);
+  const auto* hist = updater.TestBuildHistogramsLossGuide(node1, gmat, &tree, gpair);
+
+  ASSERT_EQ((*hist)[0].Size(), n_bins);
+  ASSERT_EQ((*hist)[1].Size(), n_bins);
+  ASSERT_EQ((*hist)[2].Size(), n_bins);
+
+  std::vector<xgboost::detail::GradientPairInternal<GradientSumT>> hist0_host(n_bins);
+  std::vector<xgboost::detail::GradientPairInternal<GradientSumT>> hist1_host(n_bins);
+  std::vector<xgboost::detail::GradientPairInternal<GradientSumT>> hist2_host(n_bins);
+  qu.memcpy(hist0_host.data(), (*hist)[0].DataConst(), sizeof(xgboost::detail::GradientPairInternal<GradientSumT>) * n_bins);
+  qu.memcpy(hist1_host.data(), (*hist)[1].DataConst(), sizeof(xgboost::detail::GradientPairInternal<GradientSumT>) * n_bins);
+  qu.memcpy(hist2_host.data(), (*hist)[2].DataConst(), sizeof(xgboost::detail::GradientPairInternal<GradientSumT>) * n_bins);
+  qu.wait();
+
+  for (size_t idx_bin = 0; idx_bin < n_bins; ++idx_bin) {
+    EXPECT_NEAR(hist0_host[idx_bin].GetGrad(), hist1_host[idx_bin].GetGrad() + hist2_host[idx_bin].GetGrad(), 1e-6);
+    EXPECT_NEAR(hist0_host[idx_bin].GetHess(), hist1_host[idx_bin].GetHess() + hist2_host[idx_bin].GetHess(), 1e-6);
+  }
+}
+
 TEST(SyclHistUpdater, Sampling) {
   xgboost::tree::TrainParam param;
   param.UpdateAllowUnknown(Args{{"subsample", "0.7"}});
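
The EXPECT_NEAR loop at the end of the new test pins down the invariant that loss-guided histogram building must preserve: for every bin, the parent's accumulated (grad, hess) equals the sum over its two children. That additivity is what makes the usual subtraction trick (build the smaller child directly, derive the sibling as parent minus child) valid, and the test exercises it: node 2's histogram is never built explicitly, yet it is checked. A standalone sketch of the same per-bin check as a hypothetical helper (not part of the patch):

    #include <cmath>
    #include <cstddef>
    #include <vector>

    // parent[b] == left[b] + right[b] within eps, for both grad and hess.
    template <typename GradientPairT>
    bool ChildHistsSumToParent(const std::vector<GradientPairT>& parent,
                               const std::vector<GradientPairT>& left,
                               const std::vector<GradientPairT>& right,
                               double eps = 1e-6) {
      for (std::size_t b = 0; b < parent.size(); ++b) {
        if (std::abs(parent[b].GetGrad() - (left[b].GetGrad() + right[b].GetGrad())) > eps ||
            std::abs(parent[b].GetHess() - (left[b].GetHess() + right[b].GetHess())) > eps) {
          return false;
        }
      }
      return true;
    }

With the test's host copies, this would read ChildHistsSumToParent(hist0_host, hist1_host, hist2_host).
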
@@ -190,4 +256,14 @@ TEST(SyclHistUpdater, InitData) {
   TestHistUpdaterInitData<double>(param, true);
   TestHistUpdaterInitData<double>(param, false);
 }
 
+TEST(SyclHistUpdater, BuildHistogramsLossGuide) {
+  xgboost::tree::TrainParam param;
+  param.UpdateAllowUnknown(Args{{"max_depth", "3"}});
+
+  TestHistUpdaterBuildHistogramsLossGuide<float>(param, 0.0);
+  TestHistUpdaterBuildHistogramsLossGuide<float>(param, 0.5);
+  TestHistUpdaterBuildHistogramsLossGuide<double>(param, 0.0);
+  TestHistUpdaterBuildHistogramsLossGuide<double>(param, 0.5);
+}
+
 }  // namespace xgboost::sycl::tree