Fix calling GPU predictor (#4836)

* Fix calling GPU predictor
2019-09-05 19:09:38 -04:00
parent 52d44e07fe
commit a5f232feb8
5 changed files with 85 additions and 5 deletions
--- a/src/gbm/gbtree.h
+++ b/src/gbm/gbtree.h
@@ -191,7 +191,7 @@ class GBTree : public GradientBooster {
                    HostDeviceVector<bst_float>* out_preds,
                    unsigned ntree_limit) override {
    CHECK(configured_);
-    GetPredictor()->PredictBatch(p_fmat, out_preds, model_, 0, ntree_limit);
+    GetPredictor(out_preds, p_fmat)->PredictBatch(p_fmat, out_preds, model_, 0, ntree_limit);
  }

  void PredictInstance(const SparsePage::Inst& inst,
@@ -242,8 +242,22 @@ class GBTree : public GradientBooster {
                     int bst_group,
                     std::vector<std::unique_ptr<RegTree> >* ret);

-  std::unique_ptr<Predictor> const& GetPredictor() const {
+  std::unique_ptr<Predictor> const& GetPredictor(HostDeviceVector<float> const* out_pred = nullptr,
+                                                 DMatrix* f_dmat = nullptr) const {
    CHECK(configured_);
+    // GPU_Hist by default has a prediction cache calculated from quantile values, so the
+    // GPU Predictor is not used for the training dataset.  But when XGBoost continues
+    // training with an existing model, the prediction cache is not available and the
+    // number of trees is not zero, so the whole training dataset gets copied onto the GPU
+    // for precise prediction.  This condition tries to avoid such a copy by calling the
+    // CPU Predictor.
+    if ((out_pred && out_pred->Size() == 0) &&
+        (model_.param.num_trees != 0) &&
+        // FIXME(trivialfis): Implement a better method for testing whether data is on
+        // device after DMatrix refactoring is done.
+        (f_dmat && !((*(f_dmat->GetBatches<SparsePage>().begin())).data.DeviceCanRead()))) {
+      return cpu_predictor_;
+    }
    if (tparam_.predictor == "cpu_predictor") {
      CHECK(cpu_predictor_);
      return cpu_predictor_;