Rename IterativeDMatrix. (#8045)

2022-07-04 18:52:31 +08:00
parent f24bfc7684
commit 8746f9cddf
5 changed files with 29 additions and 32 deletions
--- a/src/data/iterative_dmatrix.cu
+++ b/src/data/iterative_dmatrix.cu
@@ -0,0 +1,174 @@
+/*!
+ * Copyright 2020-2022 XGBoost contributors
+ */
+#include <memory>
+#include <type_traits>
+#include <algorithm>
+
+#include "../common/hist_util.cuh"
+#include "simple_batch_iterator.h"
+#include "iterative_dmatrix.h"
+#include "sparse_page_source.h"
+#include "ellpack_page.cuh"
+#include "proxy_dmatrix.h"
+#include "proxy_dmatrix.cuh"
+#include "device_adapter.cuh"
+
+namespace xgboost {
+namespace data {
+void IterativeDMatrix::InitFromCUDA(DataIterHandle iter_handle, float missing) {
+  // A handle passed to external iterator.
+  DMatrixProxy* proxy = MakeProxy(proxy_);
+  CHECK(proxy);
+
+  // The external iterator
+  auto iter = DataIterProxy<DataIterResetCallback, XGDMatrixCallbackNext>{
+    iter_handle, reset_, next_};
+
+  dh::XGBCachingDeviceAllocator<char> alloc;
+
+  auto num_rows = [&]() {
+    return Dispatch(proxy, [](auto const &value) { return value.NumRows(); });
+  };
+  auto num_cols = [&]() {
+    return Dispatch(proxy, [](auto const &value) { return value.NumCols(); });
+  };
+
+  size_t row_stride = 0;
+  size_t nnz = 0;
+  // Sketch for all batches.
+  iter.Reset();
+
+  std::vector<common::SketchContainer> sketch_containers;
+  size_t batches = 0;
+  size_t accumulated_rows = 0;
+  bst_feature_t cols = 0;
+
+  int32_t current_device;
+  dh::safe_cuda(cudaGetDevice(&current_device));
+  auto get_device = [&]() -> int32_t {
+    int32_t d = (ctx_.gpu_id == Context::kCpuId) ? current_device : ctx_.gpu_id;
+    CHECK_NE(d, Context::kCpuId);
+    return d;
+  };
+
+  while (iter.Next()) {
+    ctx_.gpu_id = proxy->DeviceIdx();
+    CHECK_LT(ctx_.gpu_id, common::AllVisibleGPUs());
+    dh::safe_cuda(cudaSetDevice(get_device()));
+    if (cols == 0) {
+      cols = num_cols();
+      rabit::Allreduce<rabit::op::Max>(&cols, 1);
+    } else {
+      CHECK_EQ(cols, num_cols()) << "Inconsistent number of columns.";
+    }
+    sketch_containers.emplace_back(proxy->Info().feature_types,
+                                   batch_param_.max_bin, cols, num_rows(), get_device());
+    auto* p_sketch = &sketch_containers.back();
+    proxy->Info().weights_.SetDevice(get_device());
+    Dispatch(proxy, [&](auto const &value) {
+        common::AdapterDeviceSketch(value, batch_param_.max_bin,
+                                    proxy->Info(), missing, p_sketch);
+      });
+    auto batch_rows = num_rows();
+    accumulated_rows += batch_rows;
+    dh::caching_device_vector<size_t> row_counts(batch_rows + 1, 0);
+    common::Span<size_t> row_counts_span(row_counts.data().get(),
+                                         row_counts.size());
+    row_stride = std::max(row_stride, Dispatch(proxy, [=](auto const &value) {
+          return GetRowCounts(value, row_counts_span,
+                              get_device(), missing);
+        }));
+    nnz += thrust::reduce(thrust::cuda::par(alloc), row_counts.begin(),
+                          row_counts.end());
+    batches++;
+  }
+  iter.Reset();
+  dh::safe_cuda(cudaSetDevice(get_device()));
+  HostDeviceVector<FeatureType> ft;
+  common::SketchContainer final_sketch(
+      sketch_containers.empty() ? ft : sketch_containers.front().FeatureTypes(),
+      batch_param_.max_bin, cols, accumulated_rows, get_device());
+  for (auto const& sketch : sketch_containers) {
+    final_sketch.Merge(sketch.ColumnsPtr(), sketch.Data());
+    final_sketch.FixError();
+  }
+  sketch_containers.clear();
+  sketch_containers.shrink_to_fit();
+
+  common::HistogramCuts cuts;
+  final_sketch.MakeCuts(&cuts);
+
+  this->info_.num_col_ = cols;
+  this->info_.num_row_ = accumulated_rows;
+  this->info_.num_nonzero_ = nnz;
+
+  auto init_page = [this, &proxy, &cuts, row_stride, accumulated_rows,
+                    get_device]() {
+    if (!page_) {
+      // Should be put inside the while loop to protect against empty batch.  In
+      // that case device id is invalid.
+      page_.reset(new EllpackPage);
+      *(page_->Impl()) = EllpackPageImpl(get_device(), cuts, this->IsDense(),
+                                         row_stride, accumulated_rows);
+    }
+  };
+
+  // Construct the final ellpack page.
+  size_t offset = 0;
+  iter.Reset();
+  size_t n_batches_for_verification = 0;
+  while (iter.Next()) {
+    init_page();
+    dh::safe_cuda(cudaSetDevice(get_device()));
+    auto rows = num_rows();
+    dh::caching_device_vector<size_t> row_counts(rows + 1, 0);
+    common::Span<size_t> row_counts_span(row_counts.data().get(),
+                                         row_counts.size());
+    Dispatch(proxy, [=](auto const& value) {
+        return GetRowCounts(value, row_counts_span, get_device(), missing);
+      });
+    auto is_dense = this->IsDense();
+
+    proxy->Info().feature_types.SetDevice(get_device());
+    auto d_feature_types = proxy->Info().feature_types.ConstDeviceSpan();
+    auto new_impl = Dispatch(proxy, [&](auto const& value) {
+      return EllpackPageImpl(value, missing, get_device(), is_dense, row_counts_span,
+                             d_feature_types, row_stride, rows, cuts);
+    });
+    size_t num_elements = page_->Impl()->Copy(get_device(), &new_impl, offset);
+    offset += num_elements;
+
+    proxy->Info().num_row_ = num_rows();
+    proxy->Info().num_col_ = cols;
+    if (batches != 1) {
+      this->info_.Extend(std::move(proxy->Info()), false, true);
+    }
+    n_batches_for_verification++;
+  }
+  CHECK_EQ(batches, n_batches_for_verification)
+      << "Different number of batches returned between 2 iterations";
+
+  if (batches == 1) {
+    this->info_ = std::move(proxy->Info());
+    this->info_.num_nonzero_ = nnz;
+    CHECK_EQ(proxy->Info().labels.Size(), 0);
+  }
+
+  iter.Reset();
+  // Synchronise worker columns
+  rabit::Allreduce<rabit::op::Max>(&info_.num_col_, 1);
+}
+
+BatchSet<EllpackPage> IterativeDMatrix::GetEllpackBatches(const BatchParam& param) {
+  CHECK(page_);
+  // FIXME(Jiamingy): https://github.com/dmlc/xgboost/issues/7976
+  if (param.max_bin != batch_param_.max_bin) {
+    LOG(WARNING) << "Inconsistent max_bin between Quantile DMatrix and Booster:" << param.max_bin
+                 << " vs. " << batch_param_.max_bin;
+  }
+  auto begin_iter = BatchIterator<EllpackPage>(new SimpleBatchIteratorImpl<EllpackPage>(page_));
+  return BatchSet<EllpackPage>(begin_iter);
+}
+}  // namespace data
+}  // namespace xgboost