Initial support for column-split cpu predictor (#8676)

2023-01-17 14:33:13 -08:00
parent 980233e648
commit 78396f8a6e
4 changed files with 334 additions and 11 deletions
--- a/tests/cpp/collective/test_communicator.cc
+++ b/tests/cpp/collective/test_communicator.cc
@@ -12,14 +12,17 @@ namespace collective {
 TEST(CommunicatorFactory, TypeFromEnv) {
  EXPECT_EQ(CommunicatorType::kUnknown, Communicator::GetTypeFromEnv());

+  dmlc::SetEnv<std::string>("XGBOOST_COMMUNICATOR", "foo");  // unrecognised name: expected to throw
+  EXPECT_THROW(Communicator::GetTypeFromEnv(), dmlc::Error);
+
  dmlc::SetEnv<std::string>("XGBOOST_COMMUNICATOR", "rabit");
  EXPECT_EQ(CommunicatorType::kRabit, Communicator::GetTypeFromEnv());

  dmlc::SetEnv<std::string>("XGBOOST_COMMUNICATOR", "Federated");
  EXPECT_EQ(CommunicatorType::kFederated, Communicator::GetTypeFromEnv());

-  dmlc::SetEnv<std::string>("XGBOOST_COMMUNICATOR", "foo");
-  EXPECT_THROW(Communicator::GetTypeFromEnv(), dmlc::Error);
+  dmlc::SetEnv<std::string>("XGBOOST_COMMUNICATOR", "In-Memory");  // mixed-case spelling of the new type
+  EXPECT_EQ(CommunicatorType::kInMemory, Communicator::GetTypeFromEnv());
 }

 TEST(CommunicatorFactory, TypeFromArgs) {
@@ -32,6 +35,9 @@ TEST(CommunicatorFactory, TypeFromArgs) {
  config["xgboost_communicator"] = String("federated");
  EXPECT_EQ(CommunicatorType::kFederated, Communicator::GetTypeFromConfig(config));

+  config["xgboost_communicator"] = String("in-memory");
+  EXPECT_EQ(CommunicatorType::kInMemory, Communicator::GetTypeFromConfig(config));
+
  config["xgboost_communicator"] = String("foo");
  EXPECT_THROW(Communicator::GetTypeFromConfig(config), dmlc::Error);
 }
@@ -46,6 +52,9 @@ TEST(CommunicatorFactory, TypeFromArgsUpperCase) {
  config["XGBOOST_COMMUNICATOR"] = String("federated");
  EXPECT_EQ(CommunicatorType::kFederated, Communicator::GetTypeFromConfig(config));

+  config["XGBOOST_COMMUNICATOR"] = String("in-memory");
+  EXPECT_EQ(CommunicatorType::kInMemory, Communicator::GetTypeFromConfig(config));
+
  config["XGBOOST_COMMUNICATOR"] = String("foo");
  EXPECT_THROW(Communicator::GetTypeFromConfig(config), dmlc::Error);
 }
--- a/tests/cpp/predictor/test_cpu_predictor.cc
+++ b/tests/cpp/predictor/test_cpu_predictor.cc
@@ -4,6 +4,9 @@
 #include <gtest/gtest.h>
 #include <xgboost/predictor.h>

+#include <thread>
+
+#include "../../../src/collective/communicator-inl.h"
 #include "../../../src/data/adapter.h"
 #include "../../../src/data/proxy_dmatrix.h"
 #include "../../../src/gbm/gbtree.h"
@@ -86,6 +89,49 @@ TEST(CpuPredictor, Basic) {
  }
 }

+TEST(CpuPredictor, ColumnSplit) {  // PredictBatch on per-rank column slices, one thread per rank
+  size_t constexpr kRows = 5;
+  size_t constexpr kCols = 5;
+  auto dmat = RandomDataGenerator(kRows, kCols, 0).GenerateDMatrix();
+
+  std::vector<std::thread> threads;
+  size_t constexpr kWorldSize = 2;
+  size_t constexpr kSliceSize = (kCols + 1) / kWorldSize;  // = 3, i.e. kCols / 2 rounded up
+   for (auto rank = 0; rank < kWorldSize; rank++) {  // NOTE(review): rank is int, kWorldSize is size_t
+    threads.emplace_back([=, &dmat]() {  // rank and constants copied; dmat shared by reference
+      Json config{JsonObject()};
+      config["xgboost_communicator"] = String("in-memory");
+      config["in_memory_world_size"] = kWorldSize;
+      config["in_memory_rank"] = rank;
+      xgboost::collective::Init(config);  // presumably sets up this thread's communicator -- confirm
+
+      auto lparam = CreateEmptyGenericParam(GPUIDX);
+      std::unique_ptr<Predictor> cpu_predictor =
+          std::unique_ptr<Predictor>(Predictor::Create("cpu_predictor", &lparam));
+
+      LearnerModelParam mparam{MakeMP(kCols, .0, 1)};
+
+      Context ctx;
+      ctx.UpdateAllowUnknown(Args{});
+      gbm::GBTreeModel model = CreateTestModel(&mparam, &ctx);
+
+      // Test predict batch
+      PredictionCacheEntry out_predictions;
+      cpu_predictor->InitOutPredictions(dmat->Info(), &out_predictions.predictions, model);  // full, unsliced Info()
+      auto sliced = std::unique_ptr<DMatrix>{dmat->SliceCol(rank * kSliceSize, kSliceSize)};  // NOTE(review): rank 1 passes (3, 3) with kCols = 5
+      cpu_predictor->PredictBatch(sliced.get(), &out_predictions, model, 0);
+
+      std::vector<float>& out_predictions_h = out_predictions.predictions.HostVector();
+      for (size_t i = 0; i < out_predictions.predictions.Size(); i++) {
+        ASSERT_EQ(out_predictions_h[i], 1.5);  // NOTE(review): on failure this returns from the lambda, skipping Finalize()
+      }
+      xgboost::collective::Finalize();
+    });
+   }
+  for (auto& thread : threads) {  // wait for every rank before the test body returns
+    thread.join();
+  }
+}

 TEST(CpuPredictor, IterationRange) {
  TestIterationRange("cpu_predictor");