[BREAKING] prevent multi-gpu usage (#4749)

* prevent multi-gpu usage * fix distributed test * combine gpu predictor tests * set upper bound on n_gpus
2019-08-12 14:11:35 -07:00
parent 198f3a6c4a
commit c5b229632d
14 changed files with 59 additions and 298 deletions
--- a/tests/cpp/predictor/test_gpu_predictor.cu
+++ b/tests/cpp/predictor/test_gpu_predictor.cu
@@ -12,7 +12,6 @@
 #include "gtest/gtest.h"
 #include "../helpers.h"

-#if defined(XGBOOST_USE_NCCL)
 namespace {

 inline void CheckCAPICall(int ret) {
@@ -20,7 +19,6 @@ inline void CheckCAPICall(int ret) {
 }

 }  // namespace anonymous
-#endif

 const std::map<std::string, std::string>&
 QueryBoosterConfigurationArguments(BoosterHandle handle) {
@@ -46,26 +44,28 @@ TEST(gpu_predictor, Test) {
  gpu_predictor->Configure({}, {});
  cpu_predictor->Configure({}, {});

-  int n_row = 5;
-  int n_col = 5;
+  for (size_t i = 1; i < 33; i *= 2) {
+    int n_row = i, n_col = i;
+    auto dmat = CreateDMatrix(n_row, n_col, 0);

-  gbm::GBTreeModel model = CreateTestModel();
-  model.param.num_feature = n_col;
-  auto dmat = CreateDMatrix(n_row, n_col, 0);
+    gbm::GBTreeModel model = CreateTestModel();
+    model.param.num_feature = n_col;

-  // Test predict batch
-  HostDeviceVector<float> gpu_out_predictions;
-  HostDeviceVector<float> cpu_out_predictions;
-  gpu_predictor->PredictBatch((*dmat).get(), &gpu_out_predictions, model, 0);
-  cpu_predictor->PredictBatch((*dmat).get(), &cpu_out_predictions, model, 0);
-  std::vector<float>& gpu_out_predictions_h = gpu_out_predictions.HostVector();
-  std::vector<float>& cpu_out_predictions_h = cpu_out_predictions.HostVector();
-  float abs_tolerance = 0.001;
-  for (int i = 0; i < gpu_out_predictions.Size(); i++) {
-    ASSERT_NEAR(gpu_out_predictions_h[i], cpu_out_predictions_h[i], abs_tolerance);
+    // Test predict batch
+    HostDeviceVector<float> gpu_out_predictions;
+    HostDeviceVector<float> cpu_out_predictions;
+
+    gpu_predictor->PredictBatch((*dmat).get(), &gpu_out_predictions, model, 0);
+    cpu_predictor->PredictBatch((*dmat).get(), &cpu_out_predictions, model, 0);
+
+    std::vector<float>& gpu_out_predictions_h = gpu_out_predictions.HostVector();
+    std::vector<float>& cpu_out_predictions_h = cpu_out_predictions.HostVector();
+    float abs_tolerance = 0.001;
+    for (int j = 0; j < gpu_out_predictions.Size(); j++) {
+      ASSERT_NEAR(gpu_out_predictions_h[j], cpu_out_predictions_h[j], abs_tolerance);
+    }
+    delete dmat;
  }
-
-  delete dmat;
 }

 TEST(gpu_predictor, ExternalMemoryTest) {
@@ -74,25 +74,35 @@ TEST(gpu_predictor, ExternalMemoryTest) {
      std::unique_ptr<Predictor>(Predictor::Create("gpu_predictor", &lparam));
  gpu_predictor->Configure({}, {});
  gbm::GBTreeModel model = CreateTestModel();
-  int n_col = 3;
-  model.param.num_feature = n_col;
+  model.param.num_feature = 3;
+  const int n_classes = 3;
+  model.param.num_output_group = n_classes;
+  std::vector<std::unique_ptr<DMatrix>> dmats;
  dmlc::TemporaryDirectory tmpdir;
-  std::string filename = tmpdir.path + "/big.libsvm";
-  std::unique_ptr<DMatrix> dmat = CreateSparsePageDMatrix(32, 64, filename);
+  std::string file0 = tmpdir.path + "/big_0.libsvm";
+  std::string file1 = tmpdir.path + "/big_1.libsvm";
+  std::string file2 = tmpdir.path + "/big_2.libsvm";
+  dmats.push_back(CreateSparsePageDMatrix(9, 64UL, file0));
+  dmats.push_back(CreateSparsePageDMatrix(128, 128UL, file1));
+  dmats.push_back(CreateSparsePageDMatrix(1024, 1024UL, file2));

-  // Test predict batch
-  HostDeviceVector<float> out_predictions;
-  gpu_predictor->PredictBatch(dmat.get(), &out_predictions, model, 0);
-  EXPECT_EQ(out_predictions.Size(), dmat->Info().num_row_);
-  for (const auto& v : out_predictions.HostVector()) {
-    ASSERT_EQ(v, 1.5);
+  for (const auto& dmat: dmats) {
+    // Test predict batch
+    HostDeviceVector<float> out_predictions;
+    gpu_predictor->PredictBatch(dmat.get(), &out_predictions, model, 0);
+    EXPECT_EQ(out_predictions.Size(), dmat->Info().num_row_ * n_classes);
+    const std::vector<float> &host_vector = out_predictions.ConstHostVector();
+    for (int i = 0; i < host_vector.size() / n_classes; i++) {
+      ASSERT_EQ(host_vector[i * n_classes], 1.5);
+      ASSERT_EQ(host_vector[i * n_classes + 1], 0.);
+      ASSERT_EQ(host_vector[i * n_classes + 2], 0.);
+    }
  }
 }

-#if defined(XGBOOST_USE_NCCL)
 // Test whether pickling preserves predictor parameters
-TEST(gpu_predictor, MGPU_PicklingTest) {
-  int const ngpu = GPUSet::AllVisible().Size();
+TEST(gpu_predictor, PicklingTest) {
+  int const ngpu = 1;

  dmlc::TemporaryDirectory tempdir;
  const std::string tmp_file = tempdir.path + "/simple.libsvm";
@@ -153,12 +163,6 @@ TEST(gpu_predictor, MGPU_PicklingTest) {
    ASSERT_EQ(kwargs.at("n_gpus"), std::to_string(ngpu).c_str());
  }

-  {  // Change n_gpus and query again
-    CheckCAPICall(XGBoosterSetParam(bst2, "n_gpus", "1"));
-    const auto& kwargs = QueryBoosterConfigurationArguments(bst2);
-    ASSERT_EQ(kwargs.at("n_gpus"), "1");
-  }
-
  {  // Change predictor and query again
    CheckCAPICall(XGBoosterSetParam(bst2, "predictor", "cpu_predictor"));
    const auto& kwargs = QueryBoosterConfigurationArguments(bst2);
@@ -167,77 +171,5 @@ TEST(gpu_predictor, MGPU_PicklingTest) {

  CheckCAPICall(XGBoosterFree(bst2));
 }
-
-// multi-GPU predictor test
-TEST(gpu_predictor, MGPU_Test) {
-  auto cpu_lparam = CreateEmptyGenericParam(0, 0);
-  auto gpu_lparam = CreateEmptyGenericParam(0, -1);
-
-  std::unique_ptr<Predictor> gpu_predictor =
-      std::unique_ptr<Predictor>(Predictor::Create("gpu_predictor", &gpu_lparam));
-  std::unique_ptr<Predictor> cpu_predictor =
-      std::unique_ptr<Predictor>(Predictor::Create("cpu_predictor", &cpu_lparam));
-
-  cpu_predictor->Configure({}, {});
-
-  for (size_t i = 1; i < 33; i *= 2) {
-    int n_row = i, n_col = i;
-    auto dmat = CreateDMatrix(n_row, n_col, 0);
-
-    gbm::GBTreeModel model = CreateTestModel();
-    model.param.num_feature = n_col;
-
-    // Test predict batch
-    HostDeviceVector<float> gpu_out_predictions;
-    HostDeviceVector<float> cpu_out_predictions;
-
-    gpu_predictor->PredictBatch((*dmat).get(), &gpu_out_predictions, model, 0);
-    cpu_predictor->PredictBatch((*dmat).get(), &cpu_out_predictions, model, 0);
-
-    std::vector<float>& gpu_out_predictions_h = gpu_out_predictions.HostVector();
-    std::vector<float>& cpu_out_predictions_h = cpu_out_predictions.HostVector();
-    float abs_tolerance = 0.001;
-    for (int j = 0; j < gpu_out_predictions.Size(); j++) {
-      ASSERT_NEAR(gpu_out_predictions_h[j], cpu_out_predictions_h[j], abs_tolerance);
-    }
-    delete dmat;
-  }
-}
-
-// multi-GPU predictor external memory test
-TEST(gpu_predictor, MGPU_ExternalMemoryTest) {
-  auto gpu_lparam = CreateEmptyGenericParam(0, -1);
-
-  std::unique_ptr<Predictor> gpu_predictor =
-      std::unique_ptr<Predictor>(Predictor::Create("gpu_predictor", &gpu_lparam));
-  gpu_predictor->Configure({}, {});
-
-  gbm::GBTreeModel model = CreateTestModel();
-  model.param.num_feature = 3;
-  const int n_classes = 3;
-  model.param.num_output_group = n_classes;
-  std::vector<std::unique_ptr<DMatrix>> dmats;
-  dmlc::TemporaryDirectory tmpdir;
-  std::string file0 = tmpdir.path + "/big_0.libsvm";
-  std::string file1 = tmpdir.path + "/big_1.libsvm";
-  std::string file2 = tmpdir.path + "/big_2.libsvm";
-  dmats.push_back(CreateSparsePageDMatrix(9, 64UL, file0));
-  dmats.push_back(CreateSparsePageDMatrix(128, 128UL, file1));
-  dmats.push_back(CreateSparsePageDMatrix(1024, 1024UL, file2));
-
-  for (const auto& dmat: dmats) {
-    // Test predict batch
-    HostDeviceVector<float> out_predictions;
-    gpu_predictor->PredictBatch(dmat.get(), &out_predictions, model, 0);
-    EXPECT_EQ(out_predictions.Size(), dmat->Info().num_row_ * n_classes);
-    const std::vector<float> &host_vector = out_predictions.ConstHostVector();
-    for (int i = 0; i < host_vector.size() / n_classes; i++) {
-      ASSERT_EQ(host_vector[i * n_classes], 1.5);
-      ASSERT_EQ(host_vector[i * n_classes + 1], 0.);
-      ASSERT_EQ(host_vector[i * n_classes + 2], 0.);
-    }
-  }
-}
-#endif  // defined(XGBOOST_USE_NCCL)
 }  // namespace predictor
 }  // namespace xgboost