Add GPU accelerated tree construction plugin (#1679)

Author: RAMitchell
Date: 2016-10-21 16:14:47 +13:00
Committed by: Tianqi Chen
Parent: 9b2e41340b
Commit: ac41845d4b
16 changed files with 3040 additions and 275 deletions

src/tree/param.h

@@ -7,10 +7,16 @@
#ifndef XGBOOST_TREE_PARAM_H_
#define XGBOOST_TREE_PARAM_H_
#include <vector>
#include <cmath>
#include <cstring>
#include <limits>
#include <cmath>
#include <vector>
#ifdef __NVCC__
#define XGB_DEVICE __host__ __device__
#else
#define XGB_DEVICE
#endif
namespace xgboost {
namespace tree {
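
Note for reviewers: the new XGB_DEVICE macro is what lets the refactored scalar math later in this file compile both as ordinary host code and inside CUDA kernels for the GPU plugin. A minimal sketch of the mechanism, assuming nvcc is available (the names here are illustrative, not part of this commit):

// --- editor's sketch, not part of the diff: exercising XGB_DEVICE ---
// Compiles as plain C++ (the macro expands to nothing) or under nvcc
// (the macro expands to __host__ __device__, so the same function body
// is emitted for both CPU and GPU).
#include <cstdio>

#ifdef __NVCC__
#define XGB_DEVICE __host__ __device__
#else
#define XGB_DEVICE
#endif

XGB_DEVICE inline double ThresholdL1Demo(double w, double lambda) {
  if (w > +lambda) return w - lambda;
  if (w < -lambda) return w + lambda;
  return 0.0;
}

#ifdef __NVCC__
__global__ void DemoKernel(double *out) {
  out[0] = ThresholdL1Demo(1.5, 1.0);  // same body, running on the device
}
#endif

int main() {
  std::printf("%f\n", ThresholdL1Demo(1.5, 1.0));  // host call: prints 0.500000
  return 0;
}
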
@@ -60,47 +66,80 @@ struct TrainParam : public dmlc::Parameter<TrainParam> {
std::vector<int> monotone_constraints;
// declare the parameters
DMLC_DECLARE_PARAMETER(TrainParam) {
DMLC_DECLARE_FIELD(learning_rate).set_lower_bound(0.0f).set_default(0.3f)
DMLC_DECLARE_FIELD(learning_rate)
.set_lower_bound(0.0f)
.set_default(0.3f)
.describe("Learning rate(step size) of update.");
DMLC_DECLARE_FIELD(min_split_loss).set_lower_bound(0.0f).set_default(0.0f)
.describe("Minimum loss reduction required to make a further partition.");
DMLC_DECLARE_FIELD(max_depth).set_lower_bound(0).set_default(6)
.describe("Maximum depth of the tree.");
DMLC_DECLARE_FIELD(min_child_weight).set_lower_bound(0.0f).set_default(1.0f)
DMLC_DECLARE_FIELD(min_split_loss)
.set_lower_bound(0.0f)
.set_default(0.0f)
.describe(
"Minimum loss reduction required to make a further partition.");
DMLC_DECLARE_FIELD(max_depth).set_lower_bound(0).set_default(6).describe(
"Maximum depth of the tree.");
DMLC_DECLARE_FIELD(min_child_weight)
.set_lower_bound(0.0f)
.set_default(1.0f)
.describe("Minimum sum of instance weight(hessian) needed in a child.");
DMLC_DECLARE_FIELD(reg_lambda).set_lower_bound(0.0f).set_default(1.0f)
DMLC_DECLARE_FIELD(reg_lambda)
.set_lower_bound(0.0f)
.set_default(1.0f)
.describe("L2 regularization on leaf weight");
DMLC_DECLARE_FIELD(reg_alpha).set_lower_bound(0.0f).set_default(0.0f)
DMLC_DECLARE_FIELD(reg_alpha)
.set_lower_bound(0.0f)
.set_default(0.0f)
.describe("L1 regularization on leaf weight");
DMLC_DECLARE_FIELD(default_direction).set_default(0)
DMLC_DECLARE_FIELD(default_direction)
.set_default(0)
.add_enum("learn", 0)
.add_enum("left", 1)
.add_enum("right", 2)
.describe("Default direction choice when encountering a missing value");
DMLC_DECLARE_FIELD(max_delta_step).set_lower_bound(0.0f).set_default(0.0f)
.describe("Maximum delta step we allow each tree's weight estimate to be. "\
"If the value is set to 0, it means there is no constraint");
DMLC_DECLARE_FIELD(subsample).set_range(0.0f, 1.0f).set_default(1.0f)
DMLC_DECLARE_FIELD(max_delta_step)
.set_lower_bound(0.0f)
.set_default(0.0f)
.describe(
"Maximum delta step we allow each tree's weight estimate to be. "
"If the value is set to 0, it means there is no constraint");
DMLC_DECLARE_FIELD(subsample)
.set_range(0.0f, 1.0f)
.set_default(1.0f)
.describe("Row subsample ratio of training instance.");
DMLC_DECLARE_FIELD(colsample_bylevel).set_range(0.0f, 1.0f).set_default(1.0f)
DMLC_DECLARE_FIELD(colsample_bylevel)
.set_range(0.0f, 1.0f)
.set_default(1.0f)
.describe("Subsample ratio of columns, resample on each level.");
DMLC_DECLARE_FIELD(colsample_bytree).set_range(0.0f, 1.0f).set_default(1.0f)
.describe("Subsample ratio of columns, resample on each tree construction.");
DMLC_DECLARE_FIELD(opt_dense_col).set_range(0.0f, 1.0f).set_default(1.0f)
DMLC_DECLARE_FIELD(colsample_bytree)
.set_range(0.0f, 1.0f)
.set_default(1.0f)
.describe(
"Subsample ratio of columns, resample on each tree construction.");
DMLC_DECLARE_FIELD(opt_dense_col)
.set_range(0.0f, 1.0f)
.set_default(1.0f)
.describe("EXP Param: speed optimization for dense column.");
DMLC_DECLARE_FIELD(sketch_eps).set_range(0.0f, 1.0f).set_default(0.03f)
DMLC_DECLARE_FIELD(sketch_eps)
.set_range(0.0f, 1.0f)
.set_default(0.03f)
.describe("EXP Param: Sketch accuracy of approximate algorithm.");
DMLC_DECLARE_FIELD(sketch_ratio).set_lower_bound(0.0f).set_default(2.0f)
.describe("EXP Param: Sketch accuracy related parameter of approximate algorithm.");
DMLC_DECLARE_FIELD(size_leaf_vector).set_lower_bound(0).set_default(0)
DMLC_DECLARE_FIELD(sketch_ratio)
.set_lower_bound(0.0f)
.set_default(2.0f)
.describe("EXP Param: Sketch accuracy related parameter of approximate "
"algorithm.");
DMLC_DECLARE_FIELD(size_leaf_vector)
.set_lower_bound(0)
.set_default(0)
.describe("Size of leaf vectors, reserved for vector trees");
DMLC_DECLARE_FIELD(parallel_option).set_default(0)
DMLC_DECLARE_FIELD(parallel_option)
.set_default(0)
.describe("Different types of parallelization algorithm.");
DMLC_DECLARE_FIELD(cache_opt).set_default(true)
.describe("EXP Param: Cache aware optimization.");
DMLC_DECLARE_FIELD(silent).set_default(false)
.describe("Do not print information during trainig.");
DMLC_DECLARE_FIELD(monotone_constraints).set_default(std::vector<int>())
DMLC_DECLARE_FIELD(cache_opt).set_default(true).describe(
"EXP Param: Cache aware optimization.");
DMLC_DECLARE_FIELD(silent).set_default(false).describe(
"Do not print information during trainig.");
DMLC_DECLARE_FIELD(monotone_constraints)
.set_default(std::vector<int>())
.describe("Constraint of variable monotinicity");
// add alias of parameters
DMLC_DECLARE_ALIAS(reg_lambda, lambda);
@@ -108,61 +147,11 @@ struct TrainParam : public dmlc::Parameter<TrainParam> {
DMLC_DECLARE_ALIAS(min_split_loss, gamma);
DMLC_DECLARE_ALIAS(learning_rate, eta);
}
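
Note for reviewers: for anyone unfamiliar with dmlc::Parameter, the declarations above are consumed at runtime roughly as below; the alias declarations mean the usual XGBoost spellings ("eta", "lambda", "gamma") land in the renamed fields. A sketch, assuming dmlc-core and this header are on the include path:

// --- editor's sketch, not part of the diff ---
#include <string>
#include <utility>
#include <vector>
#include "param.h"  // the header modified above

int main() {
  xgboost::tree::TrainParam param;
  std::vector<std::pair<std::string, std::string>> kwargs = {
      {"eta", "0.1"},     // alias -> learning_rate
      {"lambda", "2.0"},  // alias -> reg_lambda
      {"max_depth", "8"}};
  param.Init(kwargs);  // unknown keys raise; declared bounds are enforced
  // param.learning_rate == 0.1f, param.reg_lambda == 2.0f,
  // param.max_depth == 8; all other fields keep their defaults.
  return 0;
}
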
// calculate the cost of loss function
inline double CalcGainGivenWeight(double sum_grad,
double sum_hess,
double w) const {
return -(2.0 * sum_grad * w + (sum_hess + reg_lambda) * Sqr(w));
}
// calculate the cost of loss function
inline double CalcGain(double sum_grad, double sum_hess) const {
if (sum_hess < min_child_weight) return 0.0;
if (max_delta_step == 0.0f) {
if (reg_alpha == 0.0f) {
return Sqr(sum_grad) / (sum_hess + reg_lambda);
} else {
return Sqr(ThresholdL1(sum_grad, reg_alpha)) / (sum_hess + reg_lambda);
}
} else {
double w = CalcWeight(sum_grad, sum_hess);
double ret = sum_grad * w + 0.5 * (sum_hess + reg_lambda) * Sqr(w);
if (reg_alpha == 0.0f) {
return - 2.0 * ret;
} else {
return - 2.0 * (ret + reg_alpha * std::abs(w));
}
}
}
// calculate cost of loss function with four statistics
inline double CalcGain(double sum_grad, double sum_hess,
double test_grad, double test_hess) const {
double w = CalcWeight(sum_grad, sum_hess);
double ret = test_grad * w + 0.5 * (test_hess + reg_lambda) * Sqr(w);
if (reg_alpha == 0.0f) {
return - 2.0 * ret;
} else {
return - 2.0 * (ret + reg_alpha * std::abs(w));
}
}
// calculate weight given the statistics
inline double CalcWeight(double sum_grad, double sum_hess) const {
if (sum_hess < min_child_weight) return 0.0;
double dw;
if (reg_alpha == 0.0f) {
dw = -sum_grad / (sum_hess + reg_lambda);
} else {
dw = -ThresholdL1(sum_grad, reg_alpha) / (sum_hess + reg_lambda);
}
if (max_delta_step != 0.0f) {
if (dw > max_delta_step) dw = max_delta_step;
if (dw < -max_delta_step) dw = -max_delta_step;
}
return dw;
}
/*! \brief whether need forward small to big search: default right */
inline bool need_forward_search(float col_density, bool indicator) const {
return this->default_direction == 2 ||
(default_direction == 0 && (col_density < opt_dense_col) && !indicator);
(default_direction == 0 && (col_density < opt_dense_col) &&
!indicator);
}
/*! \brief whether need backward big to small search: default left */
inline bool need_backward_search(float col_density, bool indicator) const {
@@ -182,19 +171,85 @@ struct TrainParam : public dmlc::Parameter<TrainParam> {
CHECK_GT(ret, 0);
return ret;
}
protected:
// functions for L1 cost
inline static double ThresholdL1(double w, double lambda) {
if (w > +lambda) return w - lambda;
if (w < -lambda) return w + lambda;
return 0.0;
}
inline static double Sqr(double a) {
return a * a;
}
};
/*! \brief Loss functions */
// functions for L1 cost
template <typename T1, typename T2>
XGB_DEVICE inline static T1 ThresholdL1(T1 w, T2 lambda) {
if (w > +lambda)
return w - lambda;
if (w < -lambda)
return w + lambda;
return 0.0;
}
template <typename T>
XGB_DEVICE inline static T Sqr(T a) { return a * a; }
// calculate the cost of loss function
template <typename TrainingParams, typename T>
XGB_DEVICE inline T CalcGainGivenWeight(const TrainingParams &p, T sum_grad,
T sum_hess, T w) {
return -(2.0 * sum_grad * w + (sum_hess + p.reg_lambda) * Sqr(w));
}
// calculate the cost of loss function
template <typename TrainingParams, typename T>
XGB_DEVICE inline T CalcGain(const TrainingParams &p, T sum_grad, T sum_hess) {
if (sum_hess < p.min_child_weight)
return 0.0;
if (p.max_delta_step == 0.0f) {
if (p.reg_alpha == 0.0f) {
return Sqr(sum_grad) / (sum_hess + p.reg_lambda);
} else {
return Sqr(ThresholdL1(sum_grad, p.reg_alpha)) /
(sum_hess + p.reg_lambda);
}
} else {
T w = CalcWeight(p, sum_grad, sum_hess);
T ret = sum_grad * w + 0.5 * (sum_hess + p.reg_lambda) * Sqr(w);
if (p.reg_alpha == 0.0f) {
return -2.0 * ret;
} else {
return -2.0 * (ret + p.reg_alpha * std::abs(w));
}
}
}
// calculate cost of loss function with four statistics
template <typename TrainingParams, typename T>
XGB_DEVICE inline T CalcGain(const TrainingParams &p, T sum_grad, T sum_hess,
T test_grad, T test_hess) {
T w = CalcWeight(p, sum_grad, sum_hess);
T ret = test_grad * w + 0.5 * (test_hess + p.reg_lambda) * Sqr(w);
if (p.reg_alpha == 0.0f) {
return -2.0 * ret;
} else {
return -2.0 * (ret + p.reg_alpha * std::abs(w));
}
}
// calculate weight given the statistics
template <typename TrainingParams, typename T>
XGB_DEVICE inline T CalcWeight(const TrainingParams &p, T sum_grad,
T sum_hess) {
if (sum_hess < p.min_child_weight)
return 0.0;
T dw;
if (p.reg_alpha == 0.0f) {
dw = -sum_grad / (sum_hess + p.reg_lambda);
} else {
dw = -ThresholdL1(sum_grad, p.reg_alpha) / (sum_hess + p.reg_lambda);
}
if (p.max_delta_step != 0.0f) {
if (dw > p.max_delta_step)
dw = p.max_delta_step;
if (dw < -p.max_delta_step)
dw = -p.max_delta_step;
}
return dw;
}
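
Note for reviewers: TrainingParams is deliberately duck-typed; the free functions only read reg_lambda, reg_alpha, min_child_weight and max_delta_step, so the GPU plugin can hand them a lightweight device-side copy instead of the full TrainParam. A quick host-side sanity check with a stand-in struct (illustrative; ToyParams is not from this commit):

// --- editor's sketch, not part of the diff ---
#include <cassert>
#include <cmath>
#include "param.h"

// Stand-in with only the fields the templates read.
struct ToyParams {
  float reg_lambda = 1.0f;
  float reg_alpha = 0.0f;
  float min_child_weight = 1.0f;
  float max_delta_step = 0.0f;
};

int main() {
  ToyParams p;
  double G = -4.0, H = 3.0;
  // Optimal leaf weight: w* = -G / (H + lambda) = 4 / 4 = 1.0
  double w = xgboost::tree::CalcWeight(p, G, H);
  // Gain at w*: G^2 / (H + lambda) = 16 / 4 = 4.0
  double gain = xgboost::tree::CalcGain(p, G, H);
  assert(std::fabs(w - 1.0) < 1e-9);
  assert(std::fabs(gain - 4.0) < 1e-9);
  return 0;
}
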
/*! \brief core statistics used for tree construction */
struct GradStats {
/*! \brief sum gradient statistics */
@@ -207,109 +262,87 @@ struct GradStats {
*/
static const int kSimpleStats = 1;
/*! \brief constructor, the object must be cleared during construction */
explicit GradStats(const TrainParam& param) {
this->Clear();
}
explicit GradStats(const TrainParam &param) { this->Clear(); }
/*! \brief clear the statistics */
inline void Clear() {
sum_grad = sum_hess = 0.0f;
}
inline void Clear() { sum_grad = sum_hess = 0.0f; }
/*! \brief check if necessary information is ready */
inline static void CheckInfo(const MetaInfo& info) {
}
inline static void CheckInfo(const MetaInfo &info) {}
/*!
* \brief accumulate statistics
* \param p the gradient pair
*/
inline void Add(bst_gpair p) {
this->Add(p.grad, p.hess);
}
inline void Add(bst_gpair p) { this->Add(p.grad, p.hess); }
/*!
* \brief accumulate statistics, more complicated version
* \param gpair the vector storing the gradient statistics
* \param info the additional information
* \param ridx instance index of this instance
*/
inline void Add(const std::vector<bst_gpair>& gpair,
const MetaInfo& info,
inline void Add(const std::vector<bst_gpair> &gpair, const MetaInfo &info,
bst_uint ridx) {
const bst_gpair& b = gpair[ridx];
const bst_gpair &b = gpair[ridx];
this->Add(b.grad, b.hess);
}
/*! \brief calculate leaf weight */
inline double CalcWeight(const TrainParam& param) const {
return param.CalcWeight(sum_grad, sum_hess);
inline double CalcWeight(const TrainParam &param) const {
return xgboost::tree::CalcWeight(param, sum_grad, sum_hess);
}
/*! \brief calculate gain of the solution */
inline double CalcGain(const TrainParam& param) const {
return param.CalcGain(sum_grad, sum_hess);
inline double CalcGain(const TrainParam &param) const {
return xgboost::tree::CalcGain(param, sum_grad, sum_hess);
}
/*! \brief add statistics to the data */
inline void Add(const GradStats& b) {
this->Add(b.sum_grad, b.sum_hess);
}
inline void Add(const GradStats &b) { this->Add(b.sum_grad, b.sum_hess); }
/*! \brief same as add, reduce is used in All Reduce */
inline static void Reduce(GradStats& a, const GradStats& b) { // NOLINT(*)
inline static void Reduce(GradStats &a, const GradStats &b) { // NOLINT(*)
a.Add(b);
}
/*! \brief set current value to a - b */
inline void SetSubstract(const GradStats& a, const GradStats& b) {
inline void SetSubstract(const GradStats &a, const GradStats &b) {
sum_grad = a.sum_grad - b.sum_grad;
sum_hess = a.sum_hess - b.sum_hess;
}
/*! \return whether the statistics is not used yet */
inline bool Empty() const {
return sum_hess == 0.0;
}
inline bool Empty() const { return sum_hess == 0.0; }
/*! \brief set leaf vector value based on statistics */
inline void SetLeafVec(const TrainParam& param, bst_float *vec) const {
}
inline void SetLeafVec(const TrainParam &param, bst_float *vec) const {}
// constructor to allow inheritance
GradStats() {}
/*! \brief add statistics to the data */
inline void Add(double grad, double hess) {
sum_grad += grad; sum_hess += hess;
sum_grad += grad;
sum_hess += hess;
}
};
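
Note for reviewers: the GradStats changes above are formatting-only except for CalcWeight/CalcGain, which now forward to the free functions so the same math backs both the CPU and GPU paths. Typical accumulate-then-solve usage, as a sketch with toy numbers:

// --- editor's sketch, not part of the diff ---
#include <string>
#include <utility>
#include <vector>
#include "param.h"

int main() {
  xgboost::tree::TrainParam param;
  param.Init(std::vector<std::pair<std::string, std::string>>{});  // defaults
  xgboost::tree::GradStats stats(param);
  stats.Add(-4.0, 3.0);  // (grad, hess) of one instance
  stats.Add(-2.0, 1.0);  // and another
  // With the default reg_lambda = 1: w = -(-6) / (4 + 1) = 1.2
  double leaf_weight = stats.CalcWeight(param);
  (void)leaf_weight;
  return 0;
}
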
struct NoConstraint {
inline static void Init(TrainParam* param, unsigned num_feature) {
}
inline double CalcSplitGain(
const TrainParam& param, bst_uint split_index,
GradStats left, GradStats right) const {
inline static void Init(TrainParam *param, unsigned num_feature) {}
inline double CalcSplitGain(const TrainParam &param, bst_uint split_index,
GradStats left, GradStats right) const {
return left.CalcGain(param) + right.CalcGain(param);
}
inline double CalcWeight(
const TrainParam& param,
GradStats stats) const {
inline double CalcWeight(const TrainParam &param, GradStats stats) const {
return stats.CalcWeight(param);
}
inline double CalcGain(const TrainParam& param,
GradStats stats) const {
inline double CalcGain(const TrainParam &param, GradStats stats) const {
return stats.CalcGain(param);
}
inline void SetChild(
const TrainParam& param, bst_uint split_index,
GradStats left, GradStats right,
NoConstraint* cleft, NoConstraint* cright) {
}
inline void SetChild(const TrainParam &param, bst_uint split_index,
GradStats left, GradStats right, NoConstraint *cleft,
NoConstraint *cright) {}
};
struct ValueConstraint {
double lower_bound;
double upper_bound;
ValueConstraint() :
lower_bound(-std::numeric_limits<double>::max()),
upper_bound(std::numeric_limits<double>::max()) {
}
inline static void Init(TrainParam* param, unsigned num_feature) {
ValueConstraint()
: lower_bound(-std::numeric_limits<double>::max()),
upper_bound(std::numeric_limits<double>::max()) {}
inline static void Init(TrainParam *param, unsigned num_feature) {
param->monotone_constraints.resize(num_feature, 1);
}
inline double CalcWeight(
const TrainParam& param,
GradStats stats) const {
double w = stats.CalcWeight(param);
inline double CalcWeight(const TrainParam &param, GradStats stats) const {
double w = stats.CalcWeight(param);
if (w < lower_bound) {
return lower_bound;
}
@@ -319,41 +352,36 @@ struct ValueConstraint {
return w;
}
inline double CalcGain(const TrainParam& param,
GradStats stats) const {
return param.CalcGainGivenWeight(
stats.sum_grad, stats.sum_hess,
CalcWeight(param, stats));
inline double CalcGain(const TrainParam &param, GradStats stats) const {
return CalcGainGivenWeight(param, stats.sum_grad, stats.sum_hess,
CalcWeight(param, stats));
}
inline double CalcSplitGain(
const TrainParam& param,
bst_uint split_index,
GradStats left, GradStats right) const {
inline double CalcSplitGain(const TrainParam &param, bst_uint split_index,
GradStats left, GradStats right) const {
double wleft = CalcWeight(param, left);
double wright = CalcWeight(param, right);
int c = param.monotone_constraints[split_index];
double gain =
param.CalcGainGivenWeight(left.sum_grad, left.sum_hess, wleft) +
param.CalcGainGivenWeight(right.sum_grad, right.sum_hess, wright);
CalcGainGivenWeight(param, left.sum_grad, left.sum_hess, wleft) +
CalcGainGivenWeight(param, right.sum_grad, right.sum_hess, wright);
if (c == 0) {
return gain;
} else if (c > 0) {
} else if (c > 0) {
return wleft < wright ? gain : 0.0;
} else {
return wleft > wright ? gain : 0.0;
}
}
inline void SetChild(
const TrainParam& param,
bst_uint split_index,
GradStats left, GradStats right,
ValueConstraint* cleft, ValueConstraint *cright) {
inline void SetChild(const TrainParam &param, bst_uint split_index,
GradStats left, GradStats right, ValueConstraint *cleft,
ValueConstraint *cright) {
int c = param.monotone_constraints.at(split_index);
*cleft = *this;
*cright = *this;
if (c == 0) return;
if (c == 0)
return;
double wleft = CalcWeight(param, left);
double wright = CalcWeight(param, right);
double mid = (wleft + wright) / 2;
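
Note for reviewers: the monotone logic survives the reformat unchanged and is worth restating. A constraint c > 0 on the split feature only credits the split when the left child's weight is below the right's (weights must increase with the feature); c < 0 mirrors that. SetChild then pinches the children's [lower_bound, upper_bound] at the midpoint of the two weights (the assignments sit just past this hunk's context), so the clamp in CalcWeight keeps deeper leaves from violating the ordering. The gate in isolation:

// --- editor's sketch, not part of the diff: the gain gate restated ---
double MonotoneGatedGain(int c, double gain, double wleft, double wright) {
  if (c == 0) return gain;                         // unconstrained feature
  if (c > 0) return wleft < wright ? gain : 0.0;   // must be increasing
  return wleft > wright ? gain : 0.0;              // must be decreasing
}
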
@@ -382,9 +410,12 @@ struct SplitEntry {
/*! \brief constructor */
SplitEntry() : loss_chg(0.0f), sindex(0), split_value(0.0f) {}
/*!
* \brief decides whether we can replace current entry with the given statistics
* This function gives better priority to lower index when loss_chg == new_loss_chg.
* Not the best way, but helps to give consistent result during multi-thread execution.
* \brief decides whether we can replace current entry with the given
* statistics
* This function gives better priority to lower index when loss_chg ==
* new_loss_chg.
* Not the best way, but helps to give consistent result during multi-thread
* execution.
* \param new_loss_chg the loss reduction get through the split
* \param split_index the feature index where the split is on
*/
@@ -400,7 +431,7 @@ struct SplitEntry {
* \param e candidate split solution
* \return whether the proposed split is better and can replace current split
*/
inline bool Update(const SplitEntry& e) {
inline bool Update(const SplitEntry &e) {
if (this->NeedReplace(e.loss_chg, e.split_index())) {
this->loss_chg = e.loss_chg;
this->sindex = e.sindex;
@@ -422,7 +453,8 @@ struct SplitEntry {
float new_split_value, bool default_left) {
if (this->NeedReplace(new_loss_chg, split_index)) {
this->loss_chg = new_loss_chg;
if (default_left) split_index |= (1U << 31);
if (default_left)
split_index |= (1U << 31);
this->sindex = split_index;
this->split_value = new_split_value;
return true;
@@ -431,17 +463,14 @@ struct SplitEntry {
}
}
/*! \brief same as update, used by AllReduce*/
inline static void Reduce(SplitEntry& dst, const SplitEntry& src) { // NOLINT(*)
inline static void Reduce(SplitEntry &dst, // NOLINT(*)
const SplitEntry &src) { // NOLINT(*)
dst.Update(src);
}
/*!\return feature index to split on */
inline unsigned split_index() const {
return sindex & ((1U << 31) - 1U);
}
inline unsigned split_index() const { return sindex & ((1U << 31) - 1U); }
/*!\return whether missing value goes to left branch */
inline bool default_left() const {
return (sindex >> 31) != 0;
}
inline bool default_left() const { return (sindex >> 31) != 0; }
};
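
Note for reviewers: split_index() and default_left() above decode the packing that Update() performs: bit 31 of sindex carries the missing-value direction and bits 0-30 carry the feature index. A round-trip check (illustrative):

// --- editor's sketch, not part of the diff ---
#include <cassert>

int main() {
  unsigned split_index = 42;
  unsigned sindex = split_index | (1U << 31);   // default_left = true
  assert((sindex & ((1U << 31) - 1U)) == 42U);  // split_index()
  assert((sindex >> 31) != 0);                  // default_left()
  return 0;
}
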
} // namespace tree
@@ -451,13 +480,14 @@ struct SplitEntry {
namespace std {
inline std::ostream &operator<<(std::ostream &os, const std::vector<int> &t) {
os << '(';
for (std::vector<int>::const_iterator
it = t.begin(); it != t.end(); ++it) {
if (it != t.begin()) os << ',';
for (std::vector<int>::const_iterator it = t.begin(); it != t.end(); ++it) {
if (it != t.begin())
os << ',';
os << *it;
}
// python style tuple
if (t.size() == 1) os << ',';
if (t.size() == 1)
os << ',';
os << ')';
return os;
}
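
Note for reviewers: the trailing comma for size-1 vectors makes the output a Python-style tuple, which keeps it unambiguous for the operator>> below to parse back. For example (a sketch, assuming this header is included):

// --- editor's sketch, not part of the diff ---
#include <iostream>
#include <vector>
#include "param.h"

int main() {
  std::vector<int> one{7}, three{1, -1, 0};
  std::cout << one << " " << three << std::endl;  // prints: (7,) (1,-1,0)
  return 0;
}
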
@@ -474,7 +504,8 @@ inline std::istream &operator>>(std::istream &is, std::vector<int> &t) {
return is;
}
is.get();
if (ch == '(') break;
if (ch == '(')
break;
if (!isspace(ch)) {
is.setstate(std::ios::failbit);
return is;
@@ -495,14 +526,17 @@ inline std::istream &operator>>(std::istream &is, std::vector<int> &t) {
while (true) {
ch = is.peek();
if (isspace(ch)) {
is.get(); continue;
is.get();
continue;
}
if (ch == ')') {
is.get(); break;
is.get();
break;
}
break;
}
if (ch == ')') break;
if (ch == ')')
break;
} else if (ch == ')') {
break;
} else {

src/tree/updater_skmaker.cc

@@ -107,7 +107,7 @@ class SketchMaker: public BaseMaker {
}
/*! \brief calculate gain of the solution */
inline double CalcGain(const TrainParam &param) const {
return param.CalcGain(pos_grad - neg_grad, sum_hess);
return xgboost::tree::CalcGain(param, pos_grad - neg_grad, sum_hess);
}
/*! \brief set current value to a - b */
inline void SetSubstract(const SKStats &a, const SKStats &b) {
@@ -117,7 +117,7 @@ class SketchMaker: public BaseMaker {
}
// calculate leaf weight
inline double CalcWeight(const TrainParam &param) const {
return param.CalcWeight(pos_grad - neg_grad, sum_hess);
return xgboost::tree::CalcWeight(param, pos_grad - neg_grad, sum_hess);
}
/*! \brief add statistics to the data */
inline void Add(const SKStats &b) {