[REFACTOR] cleanup structure

tqchen
2015-11-24 14:25:56 -08:00
parent 5ed4dc4f60
commit d530e0c14f
60 changed files with 42 additions and 51 deletions

old_src/learner/dmatrix.h Normal file

@@ -0,0 +1,176 @@
/*!
* Copyright 2014 by Contributors
* \file dmatrix.h
* \brief meta data and template data structure
* used for regression/classification/ranking
* \author Tianqi Chen
*/
#ifndef XGBOOST_LEARNER_DMATRIX_H_
#define XGBOOST_LEARNER_DMATRIX_H_
#include <vector>
#include <cstring>
#include "../data.h"
#include "../utils/io.h"
namespace xgboost {
namespace learner {
/*!
* \brief meta information needed in training, including label, weight
*/
struct MetaInfo {
/*!
* \brief information needed by booster
* BoosterInfo does not implement save and load,
* all serialization is done in MetaInfo
*/
BoosterInfo info;
/*! \brief label of each instance */
std::vector<float> labels;
/*!
* \brief the index of begin and end of a group
* needed when the learning task is ranking
*/
std::vector<bst_uint> group_ptr;
/*! \brief weights of each instance, optional */
std::vector<float> weights;
/*!
* \brief initialized margins,
* if specified, xgboost will start from this initial margin
* can be used to specify initial prediction to boost from
*/
std::vector<float> base_margin;
/*! \brief version flag, used to check version of this info */
static const int kVersion = 0;
// constructor
MetaInfo(void) {}
/*! \return number of rows in dataset */
inline size_t num_row(void) const {
return info.num_row;
}
/*! \return number of columns in dataset */
inline size_t num_col(void) const {
return info.num_col;
}
/*! \brief clear all the information */
inline void Clear(void) {
labels.clear();
group_ptr.clear();
weights.clear();
info.root_index.clear();
base_margin.clear();
info.num_row = info.num_col = 0;
}
/*! \brief get weight of each instance */
inline float GetWeight(size_t i) const {
if (weights.size() != 0) {
return weights[i];
} else {
return 1.0f;
}
}
inline void SaveBinary(utils::IStream &fo) const { // NOLINT(*)
int version = kVersion;
fo.Write(&version, sizeof(version));
fo.Write(&info.num_row, sizeof(info.num_row));
fo.Write(&info.num_col, sizeof(info.num_col));
fo.Write(labels);
fo.Write(group_ptr);
fo.Write(weights);
fo.Write(info.root_index);
fo.Write(base_margin);
}
inline void LoadBinary(utils::IStream &fi) { // NOLINT(*)
int version;
utils::Check(fi.Read(&version, sizeof(version)) != 0, "MetaInfo: invalid format");
utils::Check(fi.Read(&info.num_row, sizeof(info.num_row)) != 0, "MetaInfo: invalid format");
utils::Check(fi.Read(&info.num_col, sizeof(info.num_col)) != 0, "MetaInfo: invalid format");
utils::Check(fi.Read(&labels), "MetaInfo: invalid format");
utils::Check(fi.Read(&group_ptr), "MetaInfo: invalid format");
utils::Check(fi.Read(&weights), "MetaInfo: invalid format");
utils::Check(fi.Read(&info.root_index), "MetaInfo: invalid format");
utils::Check(fi.Read(&base_margin), "MetaInfo: invalid format");
}
// try to load group information from file, if exists
inline bool TryLoadGroup(const char* fname, bool silent = false) {
using namespace std;
FILE *fi = fopen64(fname, "r");
if (fi == NULL) return false;
group_ptr.push_back(0);
unsigned nline;
while (fscanf(fi, "%u", &nline) == 1) {
group_ptr.push_back(group_ptr.back()+nline);
}
if (!silent) {
utils::Printf("%u groups are loaded from %s\n",
static_cast<unsigned>(group_ptr.size()-1), fname);
}
fclose(fi);
return true;
}
inline std::vector<float>& GetFloatInfo(const char *field) {
using namespace std;
if (!strcmp(field, "label")) return labels;
if (!strcmp(field, "weight")) return weights;
if (!strcmp(field, "base_margin")) return base_margin;
utils::Error("unknown field %s", field);
return labels;
}
inline const std::vector<float>& GetFloatInfo(const char *field) const {
return const_cast<MetaInfo*>(this)->GetFloatInfo(field); // NOLINT(*)
}
inline std::vector<unsigned> &GetUIntInfo(const char *field) {
using namespace std;
if (!strcmp(field, "root_index")) return info.root_index;
if (!strcmp(field, "fold_index")) return info.fold_index;
utils::Error("unknown field %s", field);
return info.root_index;
}
inline const std::vector<unsigned> &GetUIntInfo(const char *field) const {
return const_cast<MetaInfo*>(this)->GetUIntInfo(field); // NOLINT(*)
}
// try to load weight information from file, if exists
inline bool TryLoadFloatInfo(const char *field, const char* fname, bool silent = false) {
using namespace std;
std::vector<float> &data = this->GetFloatInfo(field);
FILE *fi = fopen64(fname, "r");
if (fi == NULL) return false;
float wt;
while (fscanf(fi, "%f", &wt) == 1) {
data.push_back(wt);
}
if (!silent) {
utils::Printf("loading %s from %s\n", field, fname);
}
fclose(fi);
return true;
}
};
/*!
* \brief data object used for learning,
* \tparam FMatrix type of feature data source
*/
struct DMatrix {
/*!
* \brief magic number associated with this object
* used to check if it is specific instance
*/
const int magic;
/*! \brief meta information about the dataset */
MetaInfo info;
/*!
* \brief cache pointer to verify if the data structure is cached in some learner
* used to verify if DMatrix is cached
*/
void *cache_learner_ptr_;
/*! \brief default constructor */
explicit DMatrix(int magic) : magic(magic), cache_learner_ptr_(NULL) {}
/*! \brief get feature matrix about data content */
virtual IFMatrix *fmat(void) const = 0;
// virtual destructor
virtual ~DMatrix(void){}
};
} // namespace learner
} // namespace xgboost
#endif // XGBOOST_LEARNER_DMATRIX_H_

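For orientation, a minimal sketch (not part of this commit) of how the group file read by TryLoadGroup maps onto group_ptr: the file holds one row count per group, and group_ptr stores their prefix sums, so a file containing "3 2 4" yields group_ptr = {0, 3, 5, 9}.

// Hedged illustration of TryLoadGroup's prefix-sum construction of group_ptr.
#include <cstdio>
#include <vector>

int main(void) {
  // one entry per line of the group file, e.g. a file containing "3 2 4"
  const unsigned counts[] = {3, 2, 4};
  std::vector<unsigned> group_ptr;
  group_ptr.push_back(0);
  for (size_t i = 0; i < sizeof(counts) / sizeof(counts[0]); ++i) {
    group_ptr.push_back(group_ptr.back() + counts[i]);
  }
  // group k spans rows [group_ptr[k], group_ptr[k+1]); here {0, 3, 5, 9}
  for (size_t k = 0; k + 1 < group_ptr.size(); ++k) {
    std::printf("group %u: rows [%u, %u)\n",
                static_cast<unsigned>(k), group_ptr[k], group_ptr[k + 1]);
  }
  return 0;
}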
old_src/learner/evaluation-inl.hpp Normal file

@@ -0,0 +1,589 @@
/*!
* Copyright 2014 by Contributors
* \file evaluation-inl.hpp
* \brief evaluation metrics for regression and classification and rank
* \author Kailong Chen, Tianqi Chen
*/
#ifndef XGBOOST_LEARNER_EVALUATION_INL_HPP_
#define XGBOOST_LEARNER_EVALUATION_INL_HPP_
#include <vector>
#include <utility>
#include <string>
#include <cmath>
#include <climits>
#include <algorithm>
#include "../sync/sync.h"
#include "../utils/math.h"
#include "./evaluation.h"
#include "./helper_utils.h"
namespace xgboost {
namespace learner {
/*!
* \brief base class of element-wise evaluation
* \tparam Derived the name of subclass
*/
template<typename Derived>
struct EvalEWiseBase : public IEvaluator {
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed) const {
utils::Check(info.labels.size() != 0, "label set cannot be empty");
utils::Check(preds.size() == info.labels.size(),
"label and prediction size not match"\
"hint: use merror or mlogloss for multi-class classification");
const bst_omp_uint ndata = static_cast<bst_omp_uint>(info.labels.size());
float sum = 0.0, wsum = 0.0;
#pragma omp parallel for reduction(+: sum, wsum) schedule(static)
for (bst_omp_uint i = 0; i < ndata; ++i) {
const float wt = info.GetWeight(i);
sum += Derived::EvalRow(info.labels[i], preds[i]) * wt;
wsum += wt;
}
float dat[2]; dat[0] = sum, dat[1] = wsum;
if (distributed) {
rabit::Allreduce<rabit::op::Sum>(dat, 2);
}
return Derived::GetFinal(dat[0], dat[1]);
}
/*!
* \brief to be implemented by subclass,
* get evaluation result from one row
* \param label label of current instance
* \param pred prediction value of current instance
*/
inline static float EvalRow(float label, float pred);
/*!
* \brief to be overridden by subclass, final transformation
* \param esum the sum statistics returned by EvalRow
* \param wsum sum of weight
*/
inline static float GetFinal(float esum, float wsum) {
return esum / wsum;
}
};
/*! \brief RMSE */
struct EvalRMSE : public EvalEWiseBase<EvalRMSE> {
virtual const char *Name(void) const {
return "rmse";
}
inline static float EvalRow(float label, float pred) {
float diff = label - pred;
return diff * diff;
}
inline static float GetFinal(float esum, float wsum) {
return std::sqrt(esum / wsum);
}
};
/*! \brief logloss */
struct EvalLogLoss : public EvalEWiseBase<EvalLogLoss> {
virtual const char *Name(void) const {
return "logloss";
}
inline static float EvalRow(float y, float py) {
const float eps = 1e-16f;
const float pneg = 1.0f - py;
if (py < eps) {
return -y * std::log(eps) - (1.0f - y) * std::log(1.0f - eps);
} else if (pneg < eps) {
return -y * std::log(1.0f - eps) - (1.0f - y) * std::log(eps);
} else {
return -y * std::log(py) - (1.0f - y) * std::log(pneg);
}
}
};
/*! \brief error */
struct EvalError : public EvalEWiseBase<EvalError> {
virtual const char *Name(void) const {
return "error";
}
inline static float EvalRow(float label, float pred) {
// assume label is in [0,1]
return pred > 0.5f ? 1.0f - label : label;
}
};
/*! \brief negative log-likelihood of the Poisson distribution */
struct EvalPoissionNegLogLik : public EvalEWiseBase<EvalPoissionNegLogLik> {
virtual const char *Name(void) const {
return "poisson-nloglik";
}
inline static float EvalRow(float y, float py) {
const float eps = 1e-16f;
if (py < eps) py = eps;
return utils::LogGamma(y + 1.0f) + py - std::log(py) * y;
}
};
/*!
* \brief base class of multi-class evaluation
* \tparam Derived the name of subclass
*/
template<typename Derived>
struct EvalMClassBase : public IEvaluator {
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed) const {
utils::Check(info.labels.size() != 0, "label set cannot be empty");
utils::Check(preds.size() % info.labels.size() == 0,
"label and prediction size not match");
const size_t nclass = preds.size() / info.labels.size();
utils::Check(nclass > 1,
"mlogloss and merror are only used for multi-class classification,"\
" use logloss for binary classification");
const bst_omp_uint ndata = static_cast<bst_omp_uint>(info.labels.size());
float sum = 0.0, wsum = 0.0;
int label_error = 0;
#pragma omp parallel for reduction(+: sum, wsum) schedule(static)
for (bst_omp_uint i = 0; i < ndata; ++i) {
const float wt = info.GetWeight(i);
int label = static_cast<int>(info.labels[i]);
if (label >= 0 && label < static_cast<int>(nclass)) {
sum += Derived::EvalRow(label,
BeginPtr(preds) + i * nclass,
nclass) * wt;
wsum += wt;
} else {
label_error = label;
}
}
utils::Check(label_error >= 0 && label_error < static_cast<int>(nclass),
"MultiClassEvaluation: label must be in [0, num_class)," \
" num_class=%d but found %d in label",
static_cast<int>(nclass), label_error);
float dat[2]; dat[0] = sum, dat[1] = wsum;
if (distributed) {
rabit::Allreduce<rabit::op::Sum>(dat, 2);
}
return Derived::GetFinal(dat[0], dat[1]);
}
/*!
* \brief to be implemented by subclass,
* get evaluation result from one row
* \param label label of current instance
* \param pred prediction value of current instance
* \param nclass number of class in the prediction
*/
inline static float EvalRow(int label,
const float *pred,
size_t nclass);
/*!
* \brief to be overridden by subclass, final transformation
* \param esum the sum statistics returned by EvalRow
* \param wsum sum of weight
*/
inline static float GetFinal(float esum, float wsum) {
return esum / wsum;
}
// used to store error message
const char *error_msg_;
};
/*! \brief match error */
struct EvalMatchError : public EvalMClassBase<EvalMatchError> {
virtual const char *Name(void) const {
return "merror";
}
inline static float EvalRow(int label,
const float *pred,
size_t nclass) {
return FindMaxIndex(pred, nclass) != static_cast<int>(label);
}
};
/*! \brief match error */
struct EvalMultiLogLoss : public EvalMClassBase<EvalMultiLogLoss> {
virtual const char *Name(void) const {
return "mlogloss";
}
inline static float EvalRow(int label,
const float *pred,
size_t nclass) {
const float eps = 1e-16f;
size_t k = static_cast<size_t>(label);
if (pred[k] > eps) {
return -std::log(pred[k]);
} else {
return -std::log(eps);
}
}
};
/*! \brief cross-test: averages a base metric over folds given by fold_index, using per-fold prediction blocks */
struct EvalCTest: public IEvaluator {
EvalCTest(IEvaluator *base, const char *name)
: base_(base), name_(name) {}
virtual ~EvalCTest(void) {
delete base_;
}
virtual const char *Name(void) const {
return name_.c_str();
}
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed) const {
utils::Check(!distributed, "metric %s do not support distributed evaluation", name_.c_str());
utils::Check(preds.size() % info.labels.size() == 0,
"label and prediction size not match");
size_t ngroup = preds.size() / info.labels.size() - 1;
const unsigned ndata = static_cast<unsigned>(info.labels.size());
utils::Check(ngroup > 1, "pred size does not meet requirement");
utils::Check(ndata == info.info.fold_index.size(), "need fold index");
double wsum = 0.0;
for (size_t k = 0; k < ngroup; ++k) {
std::vector<float> tpred;
MetaInfo tinfo;
for (unsigned i = 0; i < ndata; ++i) {
if (info.info.fold_index[i] == k) {
tpred.push_back(preds[i + (k + 1) * ndata]);
tinfo.labels.push_back(info.labels[i]);
tinfo.weights.push_back(info.GetWeight(i));
}
}
wsum += base_->Eval(tpred, tinfo);
}
return static_cast<float>(wsum / ngroup);
}
private:
IEvaluator *base_;
std::string name_;
};
/*! \brief AMS: also records best threshold */
struct EvalAMS : public IEvaluator {
public:
explicit EvalAMS(const char *name) {
name_ = name;
// note: ams@0 scans all thresholds and reports the best one
utils::Check(std::sscanf(name, "ams@%f", &ratio_) == 1, "invalid ams format");
}
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed) const {
utils::Check(!distributed, "metric AMS do not support distributed evaluation");
using namespace std;
const bst_omp_uint ndata = static_cast<bst_omp_uint>(info.labels.size());
utils::Check(info.weights.size() == ndata, "we need weight to evaluate ams");
std::vector< std::pair<float, unsigned> > rec(ndata);
#pragma omp parallel for schedule(static)
for (bst_omp_uint i = 0; i < ndata; ++i) {
rec[i] = std::make_pair(preds[i], i);
}
std::sort(rec.begin(), rec.end(), CmpFirst);
unsigned ntop = static_cast<unsigned>(ratio_ * ndata);
if (ntop == 0) ntop = ndata;
const double br = 10.0;
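// AMS at a threshold = sqrt(2 * ((s_tp + b_fp + br) * log(1 + s_tp / (b_fp + br)) - s_tp)),
// where s_tp / b_fp are the weighted signal / background counts above the
// threshold and br regularizes the denominator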
unsigned thresindex = 0;
double s_tp = 0.0, b_fp = 0.0, tams = 0.0;
for (unsigned i = 0; i < static_cast<unsigned>(ndata-1) && i < ntop; ++i) {
const unsigned ridx = rec[i].second;
const float wt = info.weights[ridx];
if (info.labels[ridx] > 0.5f) {
s_tp += wt;
} else {
b_fp += wt;
}
if (rec[i].first != rec[i+1].first) {
double ams = sqrt(2*((s_tp+b_fp+br) * log(1.0 + s_tp/(b_fp+br)) - s_tp));
if (tams < ams) {
thresindex = i;
tams = ams;
}
}
}
if (ntop == ndata) {
utils::Printf("\tams-ratio=%g", static_cast<float>(thresindex) / ndata);
return static_cast<float>(tams);
} else {
return static_cast<float>(sqrt(2*((s_tp+b_fp+br) * log(1.0 + s_tp/(b_fp+br)) - s_tp)));
}
}
virtual const char *Name(void) const {
return name_.c_str();
}
private:
std::string name_;
float ratio_;
};
/*! \brief precision with cut off at top percentile */
struct EvalPrecisionRatio : public IEvaluator{
public:
explicit EvalPrecisionRatio(const char *name) : name_(name) {
using namespace std;
if (sscanf(name, "apratio@%f", &ratio_) == 1) {
use_ap = 1;
} else {
utils::Assert(sscanf(name, "pratio@%f", &ratio_) == 1, "BUG");
use_ap = 0;
}
}
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed) const {
utils::Check(!distributed, "metric %s do not support distributed evaluation", Name());
utils::Check(info.labels.size() != 0, "label set cannot be empty");
utils::Assert(preds.size() % info.labels.size() == 0,
"label and prediction size not match");
std::vector< std::pair<float, unsigned> > rec;
for (size_t j = 0; j < info.labels.size(); ++j) {
rec.push_back(std::make_pair(preds[j], static_cast<unsigned>(j)));
}
std::sort(rec.begin(), rec.end(), CmpFirst);
double pratio = CalcPRatio(rec, info);
return static_cast<float>(pratio);
}
virtual const char *Name(void) const {
return name_.c_str();
}
protected:
inline double CalcPRatio(const std::vector< std::pair<float, unsigned> >& rec,
const MetaInfo &info) const {
size_t cutoff = static_cast<size_t>(ratio_ * rec.size());
double wt_hit = 0.0, wsum = 0.0, wt_sum = 0.0;
for (size_t j = 0; j < cutoff; ++j) {
const float wt = info.GetWeight(j);
wt_hit += info.labels[rec[j].second] * wt;
wt_sum += wt;
wsum += wt_hit / wt_sum;
}
if (use_ap != 0) {
return wsum / cutoff;
} else {
return wt_hit / wt_sum;
}
}
int use_ap;
float ratio_;
std::string name_;
};
/*! \brief Area Under Curve, for both classification and rank */
struct EvalAuc : public IEvaluator {
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed) const {
utils::Check(info.labels.size() != 0, "label set cannot be empty");
utils::Check(preds.size() % info.labels.size() == 0,
"label and prediction size not match");
std::vector<unsigned> tgptr(2, 0);
tgptr[1] = static_cast<unsigned>(info.labels.size());
const std::vector<unsigned> &gptr = info.group_ptr.size() == 0 ? tgptr : info.group_ptr;
utils::Check(gptr.back() == info.labels.size(),
"EvalAuc: group structure must match number of prediction");
const bst_omp_uint ngroup = static_cast<bst_omp_uint>(gptr.size() - 1);
// sum statistics
double sum_auc = 0.0f;
#pragma omp parallel reduction(+:sum_auc)
{
// each thread takes a local rec
std::vector< std::pair<float, unsigned> > rec;
#pragma omp for schedule(static)
for (bst_omp_uint k = 0; k < ngroup; ++k) {
rec.clear();
for (unsigned j = gptr[k]; j < gptr[k + 1]; ++j) {
rec.push_back(std::make_pair(preds[j], j));
}
std::sort(rec.begin(), rec.end(), CmpFirst);
// calculate AUC
double sum_pospair = 0.0;
double sum_npos = 0.0, sum_nneg = 0.0, buf_pos = 0.0, buf_neg = 0.0;
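// AUC for the group = sum_pospair / (sum_npos * sum_nneg): the weighted
// fraction of (positive, negative) pairs ranked correctly; tied predictions
// are accumulated in buf_pos/buf_neg and count half via the 0.5 factor below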
for (size_t j = 0; j < rec.size(); ++j) {
const float wt = info.GetWeight(rec[j].second);
const float ctr = info.labels[rec[j].second];
// group tied predictions into the same bucket
if (j != 0 && rec[j].first != rec[j - 1].first) {
sum_pospair += buf_neg * (sum_npos + buf_pos *0.5);
sum_npos += buf_pos;
sum_nneg += buf_neg;
buf_neg = buf_pos = 0.0f;
}
buf_pos += ctr * wt;
buf_neg += (1.0f - ctr) * wt;
}
sum_pospair += buf_neg * (sum_npos + buf_pos *0.5);
sum_npos += buf_pos;
sum_nneg += buf_neg;
// check weird conditions
utils::Check(sum_npos > 0.0 && sum_nneg > 0.0,
"AUC: the dataset only contains pos or neg samples");
// this is the AUC
sum_auc += sum_pospair / (sum_npos*sum_nneg);
}
}
if (distributed) {
float dat[2];
dat[0] = static_cast<float>(sum_auc);
dat[1] = static_cast<float>(ngroup);
// approximately estimate auc using mean
rabit::Allreduce<rabit::op::Sum>(dat, 2);
return dat[0] / dat[1];
} else {
return static_cast<float>(sum_auc) / ngroup;
}
}
virtual const char *Name(void) const {
return "auc";
}
};
/*! \brief Evaluate rank list */
struct EvalRankList : public IEvaluator {
public:
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed) const {
utils::Check(preds.size() == info.labels.size(),
"label and prediction size not match");
// fall back to a single group when group information is not available
std::vector<unsigned> tgptr(2, 0);
tgptr[1] = static_cast<unsigned>(preds.size());
const std::vector<unsigned> &gptr = info.group_ptr.size() == 0 ? tgptr : info.group_ptr;
utils::Assert(gptr.size() != 0, "must specify group when constructing rank file");
utils::Assert(gptr.back() == preds.size(),
"EvalRanklist: group structure must match number of prediction");
const bst_omp_uint ngroup = static_cast<bst_omp_uint>(gptr.size() - 1);
// sum statistics
double sum_metric = 0.0f;
#pragma omp parallel reduction(+:sum_metric)
{
// each thread takes a local rec
std::vector< std::pair<float, unsigned> > rec;
#pragma omp for schedule(static)
for (bst_omp_uint k = 0; k < ngroup; ++k) {
rec.clear();
for (unsigned j = gptr[k]; j < gptr[k + 1]; ++j) {
rec.push_back(std::make_pair(preds[j], static_cast<int>(info.labels[j])));
}
sum_metric += this->EvalMetric(rec);
}
}
if (distributed) {
float dat[2];
dat[0] = static_cast<float>(sum_metric);
dat[1] = static_cast<float>(ngroup);
// approximately estimate the metric using mean
rabit::Allreduce<rabit::op::Sum>(dat, 2);
return dat[0] / dat[1];
} else {
return static_cast<float>(sum_metric) / ngroup;
}
}
virtual const char *Name(void) const {
return name_.c_str();
}
protected:
explicit EvalRankList(const char *name) {
using namespace std;
name_ = name;
minus_ = false;
if (sscanf(name, "%*[^@]@%u[-]?", &topn_) != 1) {
topn_ = UINT_MAX;
}
if (name[strlen(name) - 1] == '-') {
minus_ = true;
}
}
/*! \return evaluation metric, given the pair_sort record, (pred,label) */
virtual float EvalMetric(std::vector< std::pair<float, unsigned> > &pair_sort) const = 0; // NOLINT(*)
protected:
unsigned topn_;
std::string name_;
bool minus_;
};
/*! \brief Precision at N, for both classification and rank */
struct EvalPrecision : public EvalRankList{
public:
explicit EvalPrecision(const char *name) : EvalRankList(name) {}
protected:
virtual float EvalMetric(std::vector< std::pair<float, unsigned> > &rec) const {
// calculate Precision
std::sort(rec.begin(), rec.end(), CmpFirst);
unsigned nhit = 0;
for (size_t j = 0; j < rec.size() && j < this->topn_; ++j) {
nhit += (rec[j].second != 0);
}
return static_cast<float>(nhit) / topn_;
}
};
/*! \brief NDCG: Normalized Discounted Cumulative Gain at N */
struct EvalNDCG : public EvalRankList{
public:
explicit EvalNDCG(const char *name) : EvalRankList(name) {}
protected:
inline float CalcDCG(const std::vector< std::pair<float, unsigned> > &rec) const {
double sumdcg = 0.0;
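// DCG truncated at topn_: sum over 0-based positions i of
// (2^rel - 1) / log(i + 2). Using the natural log instead of log2 only
// rescales DCG and IDCG by the same constant, so the NDCG ratio is unchanged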
for (size_t i = 0; i < rec.size() && i < this->topn_; ++i) {
const unsigned rel = rec[i].second;
if (rel != 0) {
sumdcg += ((1 << rel) - 1) / std::log(i + 2.0);
}
}
return static_cast<float>(sumdcg);
}
virtual float EvalMetric(std::vector< std::pair<float, unsigned> > &rec) const { // NOLINT(*)
std::stable_sort(rec.begin(), rec.end(), CmpFirst);
float dcg = this->CalcDCG(rec);
std::stable_sort(rec.begin(), rec.end(), CmpSecond);
float idcg = this->CalcDCG(rec);
if (idcg == 0.0f) {
if (minus_) {
return 0.0f;
} else {
return 1.0f;
}
}
return dcg/idcg;
}
};
/*! \brief Mean Average Precision at N, for both classification and rank */
struct EvalMAP : public EvalRankList {
public:
explicit EvalMAP(const char *name) : EvalRankList(name) {}
protected:
virtual float EvalMetric(std::vector< std::pair<float, unsigned> > &rec) const {
std::sort(rec.begin(), rec.end(), CmpFirst);
unsigned nhits = 0;
double sumap = 0.0;
for (size_t i = 0; i < rec.size(); ++i) {
if (rec[i].second != 0) {
nhits += 1;
if (i < this->topn_) {
sumap += static_cast<float>(nhits) / (i+1);
}
}
}
if (nhits != 0) {
sumap /= nhits;
return static_cast<float>(sumap);
} else {
if (minus_) {
return 0.0f;
} else {
return 1.0f;
}
}
}
};
} // namespace learner
} // namespace xgboost
#endif // XGBOOST_LEARNER_EVALUATION_INL_HPP_

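The element-wise metrics above all derive from EvalEWiseBase via CRTP: a subclass only supplies EvalRow (and optionally GetFinal), while the base class handles weighting, the OpenMP reduction, and the distributed Allreduce. As a hedged sketch, a mean-absolute-error metric (not part of this commit, and "mae" is not registered in CreateEvaluator) would look like:

// Hypothetical metric built on the CRTP base, assuming it sits in
// evaluation-inl.hpp alongside the others (so <cmath> is available).
struct EvalMAE : public EvalEWiseBase<EvalMAE> {
  virtual const char *Name(void) const {
    return "mae";
  }
  inline static float EvalRow(float label, float pred) {
    return std::fabs(label - pred);  // per-row statistic, weighted by the base
  }
  // the default GetFinal (esum / wsum) already yields the weighted mean
};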
old_src/learner/evaluation.h Normal file

@@ -0,0 +1,101 @@
/*!
* Copyright 2014 by Contributors
* \file evaluation.h
* \brief interface of evaluation function supported in xgboost
* \author Tianqi Chen, Kailong Chen
*/
#ifndef XGBOOST_LEARNER_EVALUATION_H_
#define XGBOOST_LEARNER_EVALUATION_H_
#include <string>
#include <vector>
#include <cstdio>
#include "../utils/utils.h"
#include "./dmatrix.h"
namespace xgboost {
namespace learner {
/*! \brief evaluator that evaluates the loss metrics */
struct IEvaluator{
/*!
* \brief evaluate a specific metric
* \param preds prediction
* \param info information, including label etc.
* \param distributed whether a call to Allreduce is needed to gather
* the average statistics across all the node,
* this is only supported by some metrics
*/
virtual float Eval(const std::vector<float> &preds,
const MetaInfo &info,
bool distributed = false) const = 0;
/*! \return name of metric */
virtual const char *Name(void) const = 0;
/*! \brief virtual destructor */
virtual ~IEvaluator(void) {}
};
} // namespace learner
} // namespace xgboost
// include implementations of evaluation functions
#include "evaluation-inl.hpp"
// factory function
namespace xgboost {
namespace learner {
inline IEvaluator* CreateEvaluator(const char *name) {
using namespace std;
if (!strcmp(name, "rmse")) return new EvalRMSE();
if (!strcmp(name, "error")) return new EvalError();
if (!strcmp(name, "merror")) return new EvalMatchError();
if (!strcmp(name, "logloss")) return new EvalLogLoss();
if (!strcmp(name, "mlogloss")) return new EvalMultiLogLoss();
if (!strcmp(name, "poisson-nloglik")) return new EvalPoissionNegLogLik();
if (!strcmp(name, "auc")) return new EvalAuc();
if (!strncmp(name, "ams@", 4)) return new EvalAMS(name);
if (!strncmp(name, "pre@", 4)) return new EvalPrecision(name);
if (!strncmp(name, "pratio@", 7)) return new EvalPrecisionRatio(name);
if (!strncmp(name, "map", 3)) return new EvalMAP(name);
if (!strncmp(name, "ndcg", 4)) return new EvalNDCG(name);
if (!strncmp(name, "ct-", 3)) return new EvalCTest(CreateEvaluator(name+3), name);
utils::Error("unknown evaluation metric type: %s", name);
return NULL;
}
/*! \brief a set of evaluators */
class EvalSet{
public:
inline void AddEval(const char *name) {
using namespace std;
for (size_t i = 0; i < evals_.size(); ++i) {
if (!strcmp(name, evals_[i]->Name())) return;
}
evals_.push_back(CreateEvaluator(name));
}
~EvalSet(void) {
for (size_t i = 0; i < evals_.size(); ++i) {
delete evals_[i];
}
}
inline std::string Eval(const char *evname,
const std::vector<float> &preds,
const MetaInfo &info,
bool distributed = false) {
std::string result = "";
for (size_t i = 0; i < evals_.size(); ++i) {
float res = evals_[i]->Eval(preds, info, distributed);
char tmp[1024];
utils::SPrintf(tmp, sizeof(tmp), "\t%s-%s:%f", evname, evals_[i]->Name(), res);
result += tmp;
}
return result;
}
inline size_t Size(void) const {
return evals_.size();
}
private:
std::vector<const IEvaluator*> evals_;
};
} // namespace learner
} // namespace xgboost
#endif // XGBOOST_LEARNER_EVALUATION_H_

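A hedged usage sketch of the factory and EvalSet above (the type and method names come from this header; the surrounding setup and the include path are illustrative only):

// Not part of the commit; include path assumed relative to old_src.
#include <cstdio>
#include <string>
#include <vector>
#include "learner/evaluation.h"

void ReportMetrics(const std::vector<float> &preds,
                   const xgboost::learner::MetaInfo &info) {
  xgboost::learner::EvalSet evals;
  evals.AddEval("rmse");  // AddEval ignores duplicates by name
  evals.AddEval("auc");
  // produces e.g. "\ttrain-rmse:0.483262\ttrain-auc:0.912044"
  std::string line = evals.Eval("train", preds, info);
  std::printf("%s\n", line.c_str());
}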
old_src/learner/helper_utils.h Normal file

@@ -0,0 +1,80 @@
/*!
* Copyright 2014 by Contributors
* \file helper_utils.h
* \brief useful helper functions
* \author Tianqi Chen, Kailong Chen
*/
#ifndef XGBOOST_LEARNER_HELPER_UTILS_H_
#define XGBOOST_LEARNER_HELPER_UTILS_H_
#include <utility>
#include <vector>
#include <cmath>
#include <algorithm>
namespace xgboost {
namespace learner {
// simple helper function to do softmax
inline static void Softmax(std::vector<float>* p_rec) {
std::vector<float> &rec = *p_rec;
float wmax = rec[0];
for (size_t i = 1; i < rec.size(); ++i) {
wmax = std::max(rec[i], wmax);
}
double wsum = 0.0f;
for (size_t i = 0; i < rec.size(); ++i) {
rec[i] = std::exp(rec[i]-wmax);
wsum += rec[i];
}
for (size_t i = 0; i < rec.size(); ++i) {
rec[i] /= static_cast<float>(wsum);
}
}
inline static int FindMaxIndex(const float *rec, size_t size) {
size_t mxid = 0;
for (size_t i = 1; i < size; ++i) {
if (rec[i] > rec[mxid]) {
mxid = i;
}
}
return static_cast<int>(mxid);
}
// simple helper function to do softmax
inline static int FindMaxIndex(const std::vector<float>& rec) {
return FindMaxIndex(BeginPtr(rec), rec.size());
}
// perform numerically safe logsum
inline float LogSum(float x, float y) {
if (x < y) {
return y + std::log(std::exp(x - y) + 1.0f);
} else {
return x + std::log(std::exp(y - x) + 1.0f);
}
}
// numerically safe logsum
inline float LogSum(const float *rec, size_t size) {
float mx = rec[0];
for (size_t i = 1; i < size; ++i) {
mx = std::max(mx, rec[i]);
}
float sum = 0.0f;
for (size_t i = 0; i < size; ++i) {
sum += std::exp(rec[i] - mx);
}
return mx + std::log(sum);
}
// comparator functions for sorting pairs in descending order
inline static bool CmpFirst(const std::pair<float, unsigned> &a,
const std::pair<float, unsigned> &b) {
return a.first > b.first;
}
inline static bool CmpSecond(const std::pair<float, unsigned> &a,
const std::pair<float, unsigned> &b) {
return a.second > b.second;
}
} // namespace learner
} // namespace xgboost
#endif // XGBOOST_LEARNER_HELPER_UTILS_H_

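For reference, the Softmax and LogSum helpers above implement the usual max-shift identities; with m = \max_i x_i, in LaTeX:

\mathrm{softmax}(x)_i = \frac{e^{x_i - m}}{\sum_j e^{x_j - m}},
\qquad
\log\sum_i e^{x_i} = m + \log\sum_i e^{x_i - m}

Both identities hold exactly, and subtracting m keeps every exponent non-positive, so neither expression can overflow.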
old_src/learner/learner-inl.hpp Normal file

@@ -0,0 +1,547 @@
/*!
* Copyright 2014 by Contributors
* \file learner-inl.hpp
* \brief learning algorithm
* \author Tianqi Chen
*/
#ifndef XGBOOST_LEARNER_LEARNER_INL_HPP_
#define XGBOOST_LEARNER_LEARNER_INL_HPP_
#include <algorithm>
#include <vector>
#include <utility>
#include <string>
#include <limits>
#include "../sync/sync.h"
#include "../utils/io.h"
#include "./objective.h"
#include "./evaluation.h"
#include "../gbm/gbm.h"
namespace xgboost {
/*! \brief namespace for learning algorithm */
namespace learner {
/*!
* \brief learner that performs gradient boosting for a specific objective function.
* It does training and prediction.
*/
class BoostLearner : public rabit::Serializable {
public:
BoostLearner(void) {
obj_ = NULL;
gbm_ = NULL;
name_obj_ = "reg:linear";
name_gbm_ = "gbtree";
silent = 0;
prob_buffer_row = 1.0f;
distributed_mode = 0;
updater_mode = 0;
pred_buffer_size = 0;
seed_per_iteration = 0;
seed = 0;
save_base64 = 0;
}
virtual ~BoostLearner(void) {
if (obj_ != NULL) delete obj_;
if (gbm_ != NULL) delete gbm_;
}
/*!
* \brief add internal cache space for the given matrices; this speeds up prediction,
* so cache the prediction for training and eval data
* warning: if the model is loaded from a file produced by previous training,
* SetCacheData must be called with exactly the SAME
* data matrices to continue training, otherwise it will cause an error
* \param mats array of pointers to matrices whose prediction results need to be cached
*/
inline void SetCacheData(const std::vector<DMatrix*>& mats) {
utils::Assert(cache_.size() == 0, "can only call cache data once");
// assign buffer index
size_t buffer_size = 0;
for (size_t i = 0; i < mats.size(); ++i) {
bool duplicate = false;
for (size_t j = 0; j < i; ++j) {
if (mats[i] == mats[j]) duplicate = true;
}
if (duplicate) continue;
// set mats[i]'s cache learner pointer to this
mats[i]->cache_learner_ptr_ = this;
cache_.push_back(CacheEntry(mats[i], buffer_size, mats[i]->info.num_row()));
buffer_size += mats[i]->info.num_row();
}
char str_temp[25];
utils::SPrintf(str_temp, sizeof(str_temp), "%lu",
static_cast<unsigned long>(buffer_size)); // NOLINT(*)
this->SetParam("num_pbuffer", str_temp);
this->pred_buffer_size = buffer_size;
}
/*!
* \brief set parameters from outside
* \param name name of the parameter
* \param val value of the parameter
*/
inline void SetParam(const char *name, const char *val) {
using namespace std;
// in this version, bst: prefix is no longer required
if (strncmp(name, "bst:", 4) != 0) {
std::string n = "bst:"; n += name;
this->SetParam(n.c_str(), val);
}
if (!strcmp(name, "silent")) silent = atoi(val);
if (!strcmp(name, "dsplit")) {
if (!strcmp(val, "col")) {
this->SetParam("updater", "distcol");
distributed_mode = 1;
} else if (!strcmp(val, "row")) {
this->SetParam("updater", "grow_histmaker,prune");
distributed_mode = 2;
} else {
utils::Error("%s is invalid value for dsplit, should be row or col", val);
}
}
if (!strcmp(name, "updater_mode")) updater_mode = atoi(val);
if (!strcmp(name, "prob_buffer_row")) {
prob_buffer_row = static_cast<float>(atof(val));
utils::Check(distributed_mode == 0,
"prob_buffer_row can only be used in single node mode so far");
this->SetParam("updater", "grow_colmaker,refresh,prune");
}
if (!strcmp(name, "eval_metric")) evaluator_.AddEval(val);
if (!strcmp("seed", name)) {
seed = atoi(val); random::Seed(seed);
}
if (!strcmp("seed_per_iter", name)) seed_per_iteration = atoi(val);
if (!strcmp("save_base64", name)) save_base64 = atoi(val);
if (!strcmp(name, "num_class")) {
this->SetParam("num_output_group", val);
}
if (!strcmp(name, "nthread")) {
omp_set_num_threads(atoi(val));
}
if (gbm_ == NULL) {
if (!strcmp(name, "objective")) name_obj_ = val;
if (!strcmp(name, "booster")) name_gbm_ = val;
mparam.SetParam(name, val);
}
if (gbm_ != NULL) gbm_->SetParam(name, val);
if (obj_ != NULL) obj_->SetParam(name, val);
if (gbm_ == NULL || obj_ == NULL) {
cfg_.push_back(std::make_pair(std::string(name), std::string(val)));
}
}
// this is an internal function
// initialize the trainer, called at InitModel and LoadModel
inline void InitTrainer(bool calc_num_feature = true) {
if (calc_num_feature) {
// estimate feature bound
unsigned num_feature = 0;
for (size_t i = 0; i < cache_.size(); ++i) {
num_feature = std::max(num_feature,
static_cast<unsigned>(cache_[i].mat_->info.num_col()));
}
// run allreduce on num_feature to find the maximum value
rabit::Allreduce<rabit::op::Max>(&num_feature, 1);
if (num_feature > mparam.num_feature) mparam.num_feature = num_feature;
}
char str_temp[25];
utils::SPrintf(str_temp, sizeof(str_temp), "%d", mparam.num_feature);
this->SetParam("bst:num_feature", str_temp);
}
/*!
* \brief initialize the model
*/
inline void InitModel(void) {
this->InitTrainer();
// initialize model
this->InitObjGBM();
// reset the base score
mparam.base_score = obj_->ProbToMargin(mparam.base_score);
// initialize GBM model
gbm_->InitModel();
}
/*!
* \brief load model from stream
* \param fi input stream
* \param calc_num_feature whether call InitTrainer with calc_num_feature
*/
inline void LoadModel(utils::IStream &fi, // NOLINT(*)
bool calc_num_feature = true) {
utils::Check(fi.Read(&mparam, sizeof(ModelParam)) != 0,
"BoostLearner: wrong model format");
{
// backward compatibility code for loading old model types;
// for new models, Read(&name_obj_) would suffice
uint64_t len;
utils::Check(fi.Read(&len, sizeof(len)) != 0, "BoostLearner: wrong model format");
if (len >= std::numeric_limits<unsigned>::max()) {
int gap;
utils::Check(fi.Read(&gap, sizeof(gap)) != 0, "BoostLearner: wrong model format");
len = len >> static_cast<uint64_t>(32UL);
}
if (len != 0) {
name_obj_.resize(len);
utils::Check(fi.Read(&name_obj_[0], len) != 0, "BoostLearner: wrong model format");
}
}
utils::Check(fi.Read(&name_gbm_), "BoostLearner: wrong model format");
// delete existing gbm if any
if (obj_ != NULL) delete obj_;
if (gbm_ != NULL) delete gbm_;
this->InitTrainer(calc_num_feature);
this->InitObjGBM();
char tmp[32];
utils::SPrintf(tmp, sizeof(tmp), "%u", mparam.num_class);
obj_->SetParam("num_class", tmp);
gbm_->LoadModel(fi, mparam.saved_with_pbuffer != 0);
if (mparam.saved_with_pbuffer == 0) {
gbm_->ResetPredBuffer(pred_buffer_size);
}
}
// rabit load model from rabit checkpoint
virtual void Load(rabit::Stream *fi) {
// for row split, we should not keep pbuffer
this->LoadModel(*fi, false);
}
// rabit save model to rabit checkpoint
virtual void Save(rabit::Stream *fo) const {
// for row split, we should not keep pbuffer
this->SaveModel(*fo, distributed_mode != 2);
}
/*!
* \brief load model from file
* \param fname file name
*/
inline void LoadModel(const char *fname) {
utils::IStream *fi = utils::IStream::Create(fname, "r");
std::string header; header.resize(4);
// check header for different binary encode
// can be base64 or binary
utils::Check(fi->Read(&header[0], 4) != 0, "invalid model");
// base64 format
if (header == "bs64") {
utils::Base64InStream bsin(fi);
bsin.InitPosition();
this->LoadModel(bsin, true);
} else if (header == "binf") {
this->LoadModel(*fi, true);
} else {
delete fi;
fi = utils::IStream::Create(fname, "r");
this->LoadModel(*fi, true);
}
delete fi;
}
inline void SaveModel(utils::IStream &fo, bool with_pbuffer) const { // NOLINT(*)
ModelParam p = mparam;
p.saved_with_pbuffer = static_cast<int>(with_pbuffer);
fo.Write(&p, sizeof(ModelParam));
fo.Write(name_obj_);
fo.Write(name_gbm_);
gbm_->SaveModel(fo, with_pbuffer);
}
/*!
* \brief save model into file
* \param fname file name
* \param with_pbuffer whether save pbuffer together
*/
inline void SaveModel(const char *fname, bool with_pbuffer) const {
utils::IStream *fo = utils::IStream::Create(fname, "w");
if (save_base64 != 0 || !strcmp(fname, "stdout")) {
fo->Write("bs64\t", 5);
utils::Base64OutStream bout(fo);
this->SaveModel(bout, with_pbuffer);
bout.Finish('\n');
} else {
fo->Write("binf", 4);
this->SaveModel(*fo, with_pbuffer);
}
delete fo;
}
/*!
* \brief check if data matrix is ready to be used by training,
* if not initialize it
* \param p_train pointer to the matrix used by training
*/
inline void CheckInit(DMatrix *p_train) {
int ncol = static_cast<int>(p_train->info.info.num_col);
std::vector<bool> enabled(ncol, true);
// set max row per batch to limited value
// in distributed mode, use safe choice otherwise
size_t max_row_perbatch = std::numeric_limits<size_t>::max();
if (updater_mode != 0 || distributed_mode == 2) {
max_row_perbatch = 32UL << 10UL;
}
// initialize column access
p_train->fmat()->InitColAccess(enabled,
prob_buffer_row,
max_row_perbatch);
const int kMagicPage = 0xffffab02;
// check, if it is DMatrixPage, then use hist maker
if (p_train->magic == kMagicPage) {
this->SetParam("updater", "grow_histmaker,prune");
}
}
/*!
* \brief update the model for one iteration
* \param iter current iteration number
* \param train reference to the data matrix
*/
inline void UpdateOneIter(int iter, const DMatrix &train) {
if (seed_per_iteration != 0 || rabit::IsDistributed()) {
random::Seed(this->seed * kRandSeedMagic + iter);
}
this->PredictRaw(train, &preds_);
obj_->GetGradient(preds_, train.info, iter, &gpair_);
gbm_->DoBoost(train.fmat(), this->FindBufferOffset(train), train.info.info, &gpair_);
}
/*!
* \brief whether model allow lazy checkpoint
*/
inline bool AllowLazyCheckPoint(void) const {
return gbm_->AllowLazyCheckPoint();
}
/*!
* \brief evaluate the model for specific iteration
* \param iter iteration number
* \param evals datasets to evaluate
* \param evname name of each dataset
* \return a string corresponding to the evaluation result
*/
inline std::string EvalOneIter(int iter,
const std::vector<const DMatrix*> &evals,
const std::vector<std::string> &evname) {
std::string res;
char tmp[256];
utils::SPrintf(tmp, sizeof(tmp), "[%d]", iter);
res = tmp;
for (size_t i = 0; i < evals.size(); ++i) {
this->PredictRaw(*evals[i], &preds_);
obj_->EvalTransform(&preds_);
res += evaluator_.Eval(evname[i].c_str(), preds_, evals[i]->info, distributed_mode == 2);
}
return res;
}
/*!
* \brief simple evaluation function, with a specified metric
* \param data input data
* \param metric name of metric
* \return a pair of <evaluation name, result>
*/
std::pair<std::string, float> Evaluate(const DMatrix &data, std::string metric) {
if (metric == "auto") metric = obj_->DefaultEvalMetric();
IEvaluator *ev = CreateEvaluator(metric.c_str());
this->PredictRaw(data, &preds_);
obj_->EvalTransform(&preds_);
float res = ev->Eval(preds_, data.info);
delete ev;
return std::make_pair(metric, res);
}
/*!
* \brief get prediction
* \param data input data
* \param output_margin whether to only predict margin value instead of transformed prediction
* \param out_preds output vector that stores the prediction
* \param ntree_limit limit number of trees used for boosted tree
* predictor, when it equals 0, this means we are using all the trees
* \param pred_leaf whether to only predict the leaf index of each tree in a boosted tree predictor
*/
inline void Predict(const DMatrix &data,
bool output_margin,
std::vector<float> *out_preds,
unsigned ntree_limit = 0,
bool pred_leaf = false) const {
if (pred_leaf) {
gbm_->PredictLeaf(data.fmat(), data.info.info, out_preds, ntree_limit);
} else {
this->PredictRaw(data, out_preds, ntree_limit);
if (!output_margin) {
obj_->PredTransform(out_preds);
}
}
}
/*!
* \brief online prediction function, predict score for one instance at a time
* NOTE: use the batch prediction interface if possible, batch prediction is usually
* more efficient than online prediction
* This function is NOT threadsafe, make sure you only call from one thread
*
* \param inst the instance you want to predict
* \param output_margin whether to only predict margin value instead of transformed prediction
* \param out_preds output vector to hold the predictions
* \param ntree_limit limit the number of trees used in prediction
* \sa Predict
*/
inline void Predict(const SparseBatch::Inst &inst,
bool output_margin,
std::vector<float> *out_preds,
unsigned ntree_limit = 0) const {
gbm_->Predict(inst, out_preds, ntree_limit);
if (out_preds->size() == 1) {
(*out_preds)[0] += mparam.base_score;
}
if (!output_margin) {
obj_->PredTransform(out_preds);
}
}
/*! \brief dump model out */
inline std::vector<std::string> DumpModel(const utils::FeatMap& fmap, int option) {
return gbm_->DumpModel(fmap, option);
}
protected:
/*!
* \brief initialize the objective function and GBM,
* if not yet done
*/
inline void InitObjGBM(void) {
if (obj_ != NULL) return;
utils::Assert(gbm_ == NULL, "GBM and obj should be NULL");
obj_ = CreateObjFunction(name_obj_.c_str());
gbm_ = gbm::CreateGradBooster(name_gbm_.c_str());
this->InitAdditionDefaultParam();
// set parameters
for (size_t i = 0; i < cfg_.size(); ++i) {
obj_->SetParam(cfg_[i].first.c_str(), cfg_[i].second.c_str());
gbm_->SetParam(cfg_[i].first.c_str(), cfg_[i].second.c_str());
}
if (evaluator_.Size() == 0) {
evaluator_.AddEval(obj_->DefaultEvalMetric());
}
}
/*!
* \brief additional default value for specific objs
*/
inline void InitAdditionDefaultParam(void) {
if (name_obj_ == "count:poisson") {
obj_->SetParam("max_delta_step", "0.7");
gbm_->SetParam("max_delta_step", "0.7");
}
}
/*!
* \brief get un-transformed prediction
* \param data training data matrix
* \param out_preds output vector that stores the prediction
* \param ntree_limit limit number of trees used for boosted tree
* predictor, when it equals 0, this means we are using all the trees
*/
inline void PredictRaw(const DMatrix &data,
std::vector<float> *out_preds,
unsigned ntree_limit = 0) const {
gbm_->Predict(data.fmat(), this->FindBufferOffset(data),
data.info.info, out_preds, ntree_limit);
// add base margin
std::vector<float> &preds = *out_preds;
const bst_omp_uint ndata = static_cast<bst_omp_uint>(preds.size());
if (data.info.base_margin.size() != 0) {
utils::Check(preds.size() == data.info.base_margin.size(),
"base_margin.size does not match with prediction size");
#pragma omp parallel for schedule(static)
for (bst_omp_uint j = 0; j < ndata; ++j) {
preds[j] += data.info.base_margin[j];
}
} else {
#pragma omp parallel for schedule(static)
for (bst_omp_uint j = 0; j < ndata; ++j) {
preds[j] += mparam.base_score;
}
}
}
/*! \brief training parameter for regression */
struct ModelParam{
/* \brief global bias */
float base_score;
/* \brief number of features */
unsigned num_feature;
/* \brief number of classes, if it is multi-class classification */
int num_class;
/*! \brief whether the model itself is saved with pbuffer */
int saved_with_pbuffer;
/*! \brief reserved field */
int reserved[30];
/*! \brief constructor */
ModelParam(void) {
std::memset(this, 0, sizeof(ModelParam));
base_score = 0.5f;
num_feature = 0;
num_class = 0;
saved_with_pbuffer = 0;
}
/*!
* \brief set parameters from outside
* \param name name of the parameter
* \param val value of the parameter
*/
inline void SetParam(const char *name, const char *val) {
using namespace std;
if (!strcmp("base_score", name)) base_score = static_cast<float>(atof(val));
if (!strcmp("num_class", name)) num_class = atoi(val);
if (!strcmp("bst:num_feature", name)) num_feature = atoi(val);
}
};
// data fields
// stored random seed
int seed;
// whether seed the PRNG each iteration
// this is important for restart from existing iterations
// default set to no, but will auto switch on in distributed mode
int seed_per_iteration;
// save model in base64 encoding
int save_base64;
// silent during training
int silent;
// distributed learning mode, if any, 0:none, 1:col, 2:row
int distributed_mode;
// updater mode, 0:normal, reserved for internal test
int updater_mode;
// cached size of predict buffer
size_t pred_buffer_size;
// maximum buffered row value
float prob_buffer_row;
// evaluation set
EvalSet evaluator_;
// model parameter
ModelParam mparam;
// gbm model that back everything
gbm::IGradBooster *gbm_;
// name of gbm model used for training
std::string name_gbm_;
// objective function
IObjFunction *obj_;
// name of objective function
std::string name_obj_;
// configurations
std::vector< std::pair<std::string, std::string> > cfg_;
// temporal storages for prediction
std::vector<float> preds_;
// gradient pairs
std::vector<bst_gpair> gpair_;
protected:
// magic number to transform random seed
static const int kRandSeedMagic = 127;
// cache entry object that helps handle feature caching
struct CacheEntry {
const DMatrix *mat_;
size_t buffer_offset_;
size_t num_row_;
CacheEntry(const DMatrix *mat, size_t buffer_offset, size_t num_row)
:mat_(mat), buffer_offset_(buffer_offset), num_row_(num_row) {}
};
// find internal buffer offset for certain matrix, if not exist, return -1
inline int64_t FindBufferOffset(const DMatrix &mat) const {
for (size_t i = 0; i < cache_.size(); ++i) {
if (cache_[i].mat_ == &mat && mat.cache_learner_ptr_ == this) {
if (cache_[i].num_row_ == mat.info.num_row()) {
return static_cast<int64_t>(cache_[i].buffer_offset_);
}
}
}
return -1;
}
// data structure field
/*! \brief the entries indicates that we have internal prediction cache */
std::vector<CacheEntry> cache_;
};
} // namespace learner
} // namespace xgboost
#endif // XGBOOST_LEARNER_LEARNER_INL_HPP_

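Pulling the pieces together, a hedged sketch (not part of this commit) of the call sequence BoostLearner supports; constructing the DMatrix objects is elided, and the include path is assumed:

#include <cstdio>
#include <string>
#include <vector>
#include "learner/learner-inl.hpp"

void TrainSketch(xgboost::learner::DMatrix *dtrain,
                 xgboost::learner::DMatrix *deval,
                 int num_round) {
  xgboost::learner::BoostLearner learner;
  std::vector<xgboost::learner::DMatrix*> cache;
  cache.push_back(dtrain);
  cache.push_back(deval);
  learner.SetCacheData(cache);  // assign prediction buffer offsets once
  learner.SetParam("objective", "binary:logistic");
  learner.SetParam("eval_metric", "auc");
  learner.CheckInit(dtrain);    // initialize column access on the data
  learner.InitModel();
  std::vector<const xgboost::learner::DMatrix*> evals(1, deval);
  std::vector<std::string> names(1, "eval");
  for (int i = 0; i < num_round; ++i) {
    learner.UpdateOneIter(i, *dtrain);
    std::printf("%s\n", learner.EvalOneIter(i, evals, names).c_str());
  }
  learner.SaveModel("model.bin", false);  // without the prediction buffer
}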
old_src/learner/objective-inl.hpp Normal file

@@ -0,0 +1,642 @@
/*!
* Copyright 2014 by Contributors
* \file objective-inl.hpp
* \brief objective function implementations
* \author Tianqi Chen, Kailong Chen
*/
#ifndef XGBOOST_LEARNER_OBJECTIVE_INL_HPP_
#define XGBOOST_LEARNER_OBJECTIVE_INL_HPP_
#include <vector>
#include <algorithm>
#include <utility>
#include <cmath>
#include <functional>
#include "../data.h"
#include "./objective.h"
#include "./helper_utils.h"
#include "../utils/random.h"
#include "../utils/omp.h"
namespace xgboost {
namespace learner {
/*! \brief defines functions to calculate some commonly used functions */
struct LossType {
/*! \brief indicate which type we are using */
int loss_type;
// list of constants
static const int kLinearSquare = 0;
static const int kLogisticNeglik = 1;
static const int kLogisticClassify = 2;
static const int kLogisticRaw = 3;
/*!
* \brief transform the linear sum to prediction
* \param x linear sum of boosting ensemble
* \return transformed prediction
*/
inline float PredTransform(float x) const {
switch (loss_type) {
case kLogisticRaw:
case kLinearSquare: return x;
case kLogisticClassify:
case kLogisticNeglik: return 1.0f / (1.0f + std::exp(-x));
default: utils::Error("unknown loss_type"); return 0.0f;
}
}
/*!
* \brief check if label range is valid
*/
inline bool CheckLabel(float x) const {
if (loss_type != kLinearSquare) {
return x >= 0.0f && x <= 1.0f;
}
return true;
}
/*!
* \brief error message displayed when check label fail
*/
inline const char * CheckLabelErrorMsg(void) const {
if (loss_type != kLinearSquare) {
return "label must be in [0,1] for logistic regression";
} else {
return "";
}
}
/*!
* \brief calculate first order gradient of loss, given transformed prediction
* \param predt transformed prediction
* \param label true label
* \return first order gradient
*/
inline float FirstOrderGradient(float predt, float label) const {
switch (loss_type) {
case kLinearSquare: return predt - label;
case kLogisticRaw: predt = 1.0f / (1.0f + std::exp(-predt));
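// intentional fall-through: after the sigmoid, the logistic gradient
// predt - label below also covers the raw-margin case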
case kLogisticClassify:
case kLogisticNeglik: return predt - label;
default: utils::Error("unknown loss_type"); return 0.0f;
}
}
/*!
* \brief calculate second order gradient of loss, given transformed prediction
* \param predt transformed prediction
* \param label true label
* \return second order gradient
*/
inline float SecondOrderGradient(float predt, float label) const {
// cap second order gradient to positive value
const float eps = 1e-16f;
switch (loss_type) {
case kLinearSquare: return 1.0f;
case kLogisticRaw: predt = 1.0f / (1.0f + std::exp(-predt));
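// intentional fall-through, as in FirstOrderGradient above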
case kLogisticClassify:
case kLogisticNeglik: return std::max(predt * (1.0f - predt), eps);
default: utils::Error("unknown loss_type"); return 0.0f;
}
}
/*!
* \brief transform probability value back to margin
*/
inline float ProbToMargin(float base_score) const {
if (loss_type == kLogisticRaw ||
loss_type == kLogisticClassify ||
loss_type == kLogisticNeglik ) {
utils::Check(base_score > 0.0f && base_score < 1.0f,
"base_score must be in (0,1) for logistic loss");
base_score = -std::log(1.0f / base_score - 1.0f);
}
return base_score;
}
/*! \brief get default evaluation metric for the objective */
inline const char *DefaultEvalMetric(void) const {
if (loss_type == kLogisticClassify) return "error";
if (loss_type == kLogisticRaw) return "auc";
return "rmse";
}
};
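// For reference (not in the original source): with p = 1 / (1 + exp(-m)) and
// label y, the logistic loss L = -y*log(p) - (1-y)*log(1-p) has
// dL/dm = p - y and d2L/dm2 = p*(1-p), matching FirstOrderGradient /
// SecondOrderGradient above (the hessian floored at eps)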
/*! \brief regression objective: defined by an element-wise loss (LossType) */
class RegLossObj : public IObjFunction {
public:
explicit RegLossObj(int loss_type) {
loss.loss_type = loss_type;
scale_pos_weight = 1.0f;
}
virtual ~RegLossObj(void) {}
virtual void SetParam(const char *name, const char *val) {
using namespace std;
if (!strcmp("scale_pos_weight", name)) {
scale_pos_weight = static_cast<float>(atof(val));
}
}
virtual void GetGradient(const std::vector<float> &preds,
const MetaInfo &info,
int iter,
std::vector<bst_gpair> *out_gpair) {
utils::Check(info.labels.size() != 0, "label set cannot be empty");
utils::Check(preds.size() % info.labels.size() == 0,
"labels are not correctly provided");
std::vector<bst_gpair> &gpair = *out_gpair;
gpair.resize(preds.size());
// check if label in range
bool label_correct = true;
// start calculating gradient
const unsigned nstep = static_cast<unsigned>(info.labels.size());
const bst_omp_uint ndata = static_cast<bst_omp_uint>(preds.size());
#pragma omp parallel for schedule(static)
for (bst_omp_uint i = 0; i < ndata; ++i) {
const unsigned j = i % nstep;
float p = loss.PredTransform(preds[i]);
float w = info.GetWeight(j);
if (info.labels[j] == 1.0f) w *= scale_pos_weight;
if (!loss.CheckLabel(info.labels[j])) label_correct = false;
gpair[i] = bst_gpair(loss.FirstOrderGradient(p, info.labels[j]) * w,
loss.SecondOrderGradient(p, info.labels[j]) * w);
}
utils::Check(label_correct, loss.CheckLabelErrorMsg());
}
virtual const char* DefaultEvalMetric(void) const {
return loss.DefaultEvalMetric();
}
virtual void PredTransform(std::vector<float> *io_preds) {
std::vector<float> &preds = *io_preds;
const bst_omp_uint ndata = static_cast<bst_omp_uint>(preds.size());
#pragma omp parallel for schedule(static)
for (bst_omp_uint j = 0; j < ndata; ++j) {
preds[j] = loss.PredTransform(preds[j]);
}
}
virtual float ProbToMargin(float base_score) const {
return loss.ProbToMargin(base_score);
}
protected:
float scale_pos_weight;
LossType loss;
};
// poisson regression for count
class PoissonRegression : public IObjFunction {
public:
PoissonRegression(void) {
max_delta_step = 0.0f;
}
virtual ~PoissonRegression(void) {}
virtual void SetParam(const char *name, const char *val) {
using namespace std;
if (!strcmp("max_delta_step", name)) {
max_delta_step = static_cast<float>(atof(val));
}
}
virtual void GetGradient(const std::vector<float> &preds,
const MetaInfo &info,
int iter,
std::vector<bst_gpair> *out_gpair) {
utils::Check(max_delta_step != 0.0f,
"PoissonRegression: need to set max_delta_step");
utils::Check(info.labels.size() != 0, "label set cannot be empty");
utils::Check(preds.size() == info.labels.size(),
"labels are not correctly provided");
std::vector<bst_gpair> &gpair = *out_gpair;
gpair.resize(preds.size());
// check if label in range
bool label_correct = true;
// start calculating gradient
const long ndata = static_cast<long>(preds.size()); // NOLINT(*)
#pragma omp parallel for schedule(static)
for (long i = 0; i < ndata; ++i) { // NOLINT(*)
float p = preds[i];
float w = info.GetWeight(i);
float y = info.labels[i];
if (y >= 0.0f) {
gpair[i] = bst_gpair((std::exp(p) - y) * w,
std::exp(p + max_delta_step) * w);
} else {
label_correct = false;
}
}
utils::Check(label_correct,
"PoissonRegression: label must be nonnegative");
}
virtual void PredTransform(std::vector<float> *io_preds) {
std::vector<float> &preds = *io_preds;
const long ndata = static_cast<long>(preds.size()); // NOLINT(*)
#pragma omp parallel for schedule(static)
for (long j = 0; j < ndata; ++j) { // NOLINT(*)
preds[j] = std::exp(preds[j]);
}
}
virtual void EvalTransform(std::vector<float> *io_preds) {
PredTransform(io_preds);
}
virtual float ProbToMargin(float base_score) const {
return std::log(base_score);
}
virtual const char* DefaultEvalMetric(void) const {
return "poisson-nloglik";
}
private:
float max_delta_step;
};
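// For reference (not in the original source): with margin m, the predicted
// mean is exp(m), so the Poisson negative log-likelihood per row is
// exp(m) - y*m + log(y!), giving grad = exp(m) - y and hess = exp(m);
// the code inflates the hessian to exp(m + max_delta_step), which bounds
// the Newton step grad / hess and keeps the update stable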
// softmax multi-class classification
class SoftmaxMultiClassObj : public IObjFunction {
public:
explicit SoftmaxMultiClassObj(int output_prob)
: output_prob(output_prob) {
nclass = 0;
}
virtual ~SoftmaxMultiClassObj(void) {}
virtual void SetParam(const char *name, const char *val) {
using namespace std;
if (!strcmp( "num_class", name )) nclass = atoi(val);
}
virtual void GetGradient(const std::vector<float> &preds,
const MetaInfo &info,
int iter,
std::vector<bst_gpair> *out_gpair) {
utils::Check(nclass != 0, "must set num_class to use softmax");
utils::Check(info.labels.size() != 0, "label set cannot be empty");
utils::Check(preds.size() % (static_cast<size_t>(nclass) * info.labels.size()) == 0,
"SoftmaxMultiClassObj: label size and pred size does not match");
std::vector<bst_gpair> &gpair = *out_gpair;
gpair.resize(preds.size());
const unsigned nstep = static_cast<unsigned>(info.labels.size() * nclass);
const bst_omp_uint ndata = static_cast<bst_omp_uint>(preds.size() / nclass);
int label_error = 0;
#pragma omp parallel
{
std::vector<float> rec(nclass);
#pragma omp for schedule(static)
for (bst_omp_uint i = 0; i < ndata; ++i) {
for (int k = 0; k < nclass; ++k) {
rec[k] = preds[i * nclass + k];
}
Softmax(&rec);
const unsigned j = i % nstep;
int label = static_cast<int>(info.labels[j]);
if (label < 0 || label >= nclass) {
label_error = label; label = 0;
}
const float wt = info.GetWeight(j);
for (int k = 0; k < nclass; ++k) {
float p = rec[k];
const float h = 2.0f * p * (1.0f - p) * wt;
if (label == k) {
gpair[i * nclass + k] = bst_gpair((p - 1.0f) * wt, h);
} else {
gpair[i * nclass + k] = bst_gpair(p* wt, h);
}
}
}
}
utils::Check(label_error >= 0 && label_error < nclass,
"SoftmaxMultiClassObj: label must be in [0, num_class),"\
" num_class=%d but found %d in label", nclass, label_error);
}
virtual void PredTransform(std::vector<float> *io_preds) {
this->Transform(io_preds, output_prob);
}
virtual void EvalTransform(std::vector<float> *io_preds) {
this->Transform(io_preds, 1);
}
virtual const char* DefaultEvalMetric(void) const {
return "merror";
}
private:
inline void Transform(std::vector<float> *io_preds, int prob) {
utils::Check(nclass != 0, "must set num_class to use softmax");
std::vector<float> &preds = *io_preds;
std::vector<float> tmp;
const bst_omp_uint ndata = static_cast<bst_omp_uint>(preds.size()/nclass);
if (prob == 0) tmp.resize(ndata);
#pragma omp parallel
{
std::vector<float> rec(nclass);
#pragma omp for schedule(static)
for (bst_omp_uint j = 0; j < ndata; ++j) {
for (int k = 0; k < nclass; ++k) {
rec[k] = preds[j * nclass + k];
}
if (prob == 0) {
tmp[j] = static_cast<float>(FindMaxIndex(rec));
} else {
Softmax(&rec);
for (int k = 0; k < nclass; ++k) {
preds[j * nclass + k] = rec[k];
}
}
}
}
if (prob == 0) preds = tmp;
}
// data field
int nclass;
int output_prob;
};
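// For reference (not in the original source): with p = softmax(margins),
// the multi-class cross-entropy gradient for class k is p_k - 1{label == k};
// the exact diagonal hessian is p_k*(1 - p_k), and the code uses the
// conservative bound 2*p_k*(1 - p_k)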
/*! \brief objective for lambda rank */
class LambdaRankObj : public IObjFunction {
public:
LambdaRankObj(void) {
loss.loss_type = LossType::kLogisticRaw;
fix_list_weight = 0.0f;
num_pairsample = 1;
}
virtual ~LambdaRankObj(void) {}
virtual void SetParam(const char *name, const char *val) {
using namespace std;
if (!strcmp( "loss_type", name )) loss.loss_type = atoi(val);
if (!strcmp( "fix_list_weight", name)) fix_list_weight = static_cast<float>(atof(val));
if (!strcmp( "num_pairsample", name)) num_pairsample = atoi(val);
}
virtual void GetGradient(const std::vector<float> &preds,
const MetaInfo &info,
int iter,
std::vector<bst_gpair> *out_gpair) {
utils::Check(preds.size() == info.labels.size(), "label size predict size not match");
std::vector<bst_gpair> &gpair = *out_gpair;
gpair.resize(preds.size());
// fall back to a single group when group information is not available
std::vector<unsigned> tgptr(2, 0); tgptr[1] = static_cast<unsigned>(info.labels.size());
const std::vector<unsigned> &gptr = info.group_ptr.size() == 0 ? tgptr : info.group_ptr;
utils::Check(gptr.size() != 0 && gptr.back() == info.labels.size(),
"group structure not consistent with #rows");
const bst_omp_uint ngroup = static_cast<bst_omp_uint>(gptr.size() - 1);
#pragma omp parallel
{
// parallel block: declare the random number generator here so that each
// thread uses its own, seeded by thread id and current iteration
random::Random rnd; rnd.Seed(iter* 1111 + omp_get_thread_num());
std::vector<LambdaPair> pairs;
std::vector<ListEntry> lst;
std::vector< std::pair<float, unsigned> > rec;
#pragma omp for schedule(static)
for (bst_omp_uint k = 0; k < ngroup; ++k) {
lst.clear(); pairs.clear();
for (unsigned j = gptr[k]; j < gptr[k+1]; ++j) {
lst.push_back(ListEntry(preds[j], info.labels[j], j));
gpair[j] = bst_gpair(0.0f, 0.0f);
}
std::sort(lst.begin(), lst.end(), ListEntry::CmpPred);
rec.resize(lst.size());
for (unsigned i = 0; i < lst.size(); ++i) {
rec[i] = std::make_pair(lst[i].label, i);
}
std::sort(rec.begin(), rec.end(), CmpFirst);
// enumerate buckets with the same label; for each item in the list, grab another sample randomly
for (unsigned i = 0; i < rec.size(); ) {
unsigned j = i + 1;
while (j < rec.size() && rec[j].first == rec[i].first) ++j;
// bucket in [i,j), get a sample outside bucket
unsigned nleft = i, nright = static_cast<unsigned>(rec.size() - j);
if (nleft + nright != 0) {
int nsample = num_pairsample;
            while (nsample--) {
for (unsigned pid = i; pid < j; ++pid) {
unsigned ridx = static_cast<unsigned>(rnd.RandDouble() * (nleft+nright));
if (ridx < nleft) {
pairs.push_back(LambdaPair(rec[ridx].second, rec[pid].second));
} else {
pairs.push_back(LambdaPair(rec[pid].second, rec[ridx+j-i].second));
}
}
}
}
i = j;
}
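        // Example of the sampling above (an illustrative sketch): for labels
        // sorted as {2, 1, 1, 0}, the bucket [1,3) of label 1 has nleft = 1
        // and nright = 1; each of its two items draws one partner uniformly
        // from the two items outside the bucket, pairing as the negative of
        // label 2 or as the positive over label 0.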
// get lambda weight for the pairs
this->GetLambdaWeight(lst, &pairs);
        // rescale each gradient and hessian so that the list has a constant weight
float scale = 1.0f / num_pairsample;
if (fix_list_weight != 0.0f) {
scale *= fix_list_weight / (gptr[k+1] - gptr[k]);
}
for (size_t i = 0; i < pairs.size(); ++i) {
const ListEntry &pos = lst[pairs[i].pos_index];
const ListEntry &neg = lst[pairs[i].neg_index];
const float w = pairs[i].weight * scale;
float p = loss.PredTransform(pos.pred - neg.pred);
float g = loss.FirstOrderGradient(p, 1.0f);
float h = loss.SecondOrderGradient(p, 1.0f);
          // accumulate gradient and hessian for both the positive and the negative instance
gpair[pos.rindex].grad += g * w;
gpair[pos.rindex].hess += 2.0f * w * h;
gpair[neg.rindex].grad -= g * w;
gpair[neg.rindex].hess += 2.0f * w * h;
}
}
}
}
virtual const char* DefaultEvalMetric(void) const {
return "map";
}
protected:
/*! \brief helper information in a list */
struct ListEntry {
    /*! \brief the prediction score of the entry */
float pred;
/*! \brief the actual label of the entry */
float label;
/*! \brief row index in the data matrix */
unsigned rindex;
// constructor
ListEntry(float pred, float label, unsigned rindex)
: pred(pred), label(label), rindex(rindex) {}
// comparator by prediction
inline static bool CmpPred(const ListEntry &a, const ListEntry &b) {
return a.pred > b.pred;
}
// comparator by label
inline static bool CmpLabel(const ListEntry &a, const ListEntry &b) {
return a.label > b.label;
}
};
/*! \brief a pair in the lambda rank */
struct LambdaPair {
/*! \brief positive index: this is a position in the list */
unsigned pos_index;
/*! \brief negative index: this is a position in the list */
unsigned neg_index;
/*! \brief weight to be filled in */
float weight;
// constructor
LambdaPair(unsigned pos_index, unsigned neg_index)
: pos_index(pos_index), neg_index(neg_index), weight(1.0f) {}
};
/*!
* \brief get lambda weight for existing pairs
   * \param sorted_list a list that is sorted by prediction score
* \param io_pairs record of pairs, containing the pairs to fill in weights
*/
virtual void GetLambdaWeight(const std::vector<ListEntry> &sorted_list,
std::vector<LambdaPair> *io_pairs) = 0;
private:
// loss function
LossType loss;
  // number of pair samples performed for each instance
int num_pairsample;
  // fixed weight of each element in the list
float fix_list_weight;
};
class PairwiseRankObj : public LambdaRankObj {
public:
virtual ~PairwiseRankObj(void) {}
protected:
virtual void GetLambdaWeight(const std::vector<ListEntry> &sorted_list,
std::vector<LambdaPair> *io_pairs) {}
};
// beta version: NDCG lambda rank
class LambdaRankObjNDCG : public LambdaRankObj {
public:
virtual ~LambdaRankObjNDCG(void) {}
protected:
virtual void GetLambdaWeight(const std::vector<ListEntry> &sorted_list,
std::vector<LambdaPair> *io_pairs) {
std::vector<LambdaPair> &pairs = *io_pairs;
float IDCG;
{
std::vector<float> labels(sorted_list.size());
for (size_t i = 0; i < sorted_list.size(); ++i) {
labels[i] = sorted_list[i].label;
}
std::sort(labels.begin(), labels.end(), std::greater<float>());
IDCG = CalcDCG(labels);
}
if (IDCG == 0.0) {
for (size_t i = 0; i < pairs.size(); ++i) {
pairs[i].weight = 0.0f;
}
} else {
IDCG = 1.0f / IDCG;
for (size_t i = 0; i < pairs.size(); ++i) {
unsigned pos_idx = pairs[i].pos_index;
unsigned neg_idx = pairs[i].neg_index;
float pos_loginv = 1.0f / std::log(pos_idx + 2.0f);
float neg_loginv = 1.0f / std::log(neg_idx + 2.0f);
int pos_label = static_cast<int>(sorted_list[pos_idx].label);
int neg_label = static_cast<int>(sorted_list[neg_idx].label);
float original =
((1 << pos_label) - 1) * pos_loginv + ((1 << neg_label) - 1) * neg_loginv;
float changed =
((1 << neg_label) - 1) * pos_loginv + ((1 << pos_label) - 1) * neg_loginv;
float delta = (original - changed) * IDCG;
        if (delta < 0.0f) delta = -delta;
pairs[i].weight = delta;
}
}
}
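  // The weight computed above is the standard LambdaRank NDCG swap cost
  // (a sketch of the algebra, not in the original):
  //   delta = |2^{pos_label} - 2^{neg_label}|
  //           * |1/log(pos_idx + 2) - 1/log(neg_idx + 2)| / IDCG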
inline static float CalcDCG(const std::vector<float> &labels) {
double sumdcg = 0.0;
for (size_t i = 0; i < labels.size(); ++i) {
const unsigned rel = static_cast<unsigned>(labels[i]);
if (rel != 0) {
sumdcg += ((1 << rel) - 1) / std::log(static_cast<float>(i + 2));
}
}
return static_cast<float>(sumdcg);
}
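  // CalcDCG above computes DCG = sum_i (2^{label_i} - 1) / ln(i + 2) over
  // positions i = 0, 1, ...; note that std::log is the natural logarithm.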
};
class LambdaRankObjMAP : public LambdaRankObj {
public:
virtual ~LambdaRankObjMAP(void) {}
protected:
struct MAPStats {
/*! \brief the accumulated precision */
float ap_acc;
/*!
* \brief the accumulated precision,
* assuming a positive instance is missing
*/
float ap_acc_miss;
/*!
* \brief the accumulated precision,
* assuming that one more positive instance is inserted ahead
*/
float ap_acc_add;
    /*! \brief the accumulated positive instance count */
float hits;
MAPStats(void) {}
MAPStats(float ap_acc, float ap_acc_miss, float ap_acc_add, float hits)
: ap_acc(ap_acc), ap_acc_miss(ap_acc_miss), ap_acc_add(ap_acc_add), hits(hits) {}
};
/*!
   * \brief obtain the delta MAP when switching the positions of the instances
   *        at index1 and index2 in the sorted list
* \param sorted_list the list containing entry information
* \param index1,index2 the instances switched
* \param map_stats a vector containing the accumulated precisions for each position in a list
*/
inline float GetLambdaMAP(const std::vector<ListEntry> &sorted_list,
int index1, int index2,
std::vector<MAPStats> *p_map_stats) {
std::vector<MAPStats> &map_stats = *p_map_stats;
if (index1 == index2 || map_stats[map_stats.size() - 1].hits == 0) {
return 0.0f;
}
if (index1 > index2) std::swap(index1, index2);
float original = map_stats[index2].ap_acc;
if (index1 != 0) original -= map_stats[index1 - 1].ap_acc;
float changed = 0;
float label1 = sorted_list[index1].label > 0.0f ? 1.0f : 0.0f;
float label2 = sorted_list[index2].label > 0.0f ? 1.0f : 0.0f;
if (label1 == label2) {
return 0.0;
} else if (label1 < label2) {
changed += map_stats[index2 - 1].ap_acc_add - map_stats[index1].ap_acc_add;
changed += (map_stats[index1].hits + 1.0f) / (index1 + 1);
} else {
changed += map_stats[index2 - 1].ap_acc_miss - map_stats[index1].ap_acc_miss;
changed += map_stats[index2].hits / (index2 + 1);
}
float ans = (changed - original) / (map_stats[map_stats.size() - 1].hits);
if (ans < 0) ans = -ans;
return ans;
}
  /*!
* \brief obtain preprocessing results for calculating delta MAP
* \param sorted_list the list containing entry information
* \param map_stats a vector containing the accumulated precisions for each position in a list
*/
inline void GetMAPStats(const std::vector<ListEntry> &sorted_list,
std::vector<MAPStats> *p_map_acc) {
std::vector<MAPStats> &map_acc = *p_map_acc;
map_acc.resize(sorted_list.size());
float hit = 0, acc1 = 0, acc2 = 0, acc3 = 0;
for (size_t i = 1; i <= sorted_list.size(); ++i) {
if (sorted_list[i - 1].label > 0.0f) {
hit++;
acc1 += hit / i;
acc2 += (hit - 1) / i;
acc3 += (hit + 1) / i;
}
map_acc[i - 1] = MAPStats(acc1, acc2, acc3, hit);
}
}
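  // Worked example for GetMAPStats (an illustrative sketch): for sorted
  // labels {1, 0, 1}, hits after each position are {1, 1, 2} and ap_acc
  // accumulates 1/1, then +0, then +2/3, giving {1.0f, 1.0f, 5.0f/3.0f}.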
virtual void GetLambdaWeight(const std::vector<ListEntry> &sorted_list,
std::vector<LambdaPair> *io_pairs) {
std::vector<LambdaPair> &pairs = *io_pairs;
std::vector<MAPStats> map_stats;
GetMAPStats(sorted_list, &map_stats);
for (size_t i = 0; i < pairs.size(); ++i) {
pairs[i].weight =
GetLambdaMAP(sorted_list, pairs[i].pos_index,
pairs[i].neg_index, &map_stats);
}
}
};
} // namespace learner
} // namespace xgboost
#endif // XGBOOST_LEARNER_OBJECTIVE_INL_HPP_

89
old_src/learner/objective.h Normal file
View File

@@ -0,0 +1,89 @@
/*!
* Copyright 2014 by Contributors
* \file objective.h
* \brief interface of objective function used for gradient boosting
* \author Tianqi Chen, Kailong Chen
*/
#ifndef XGBOOST_LEARNER_OBJECTIVE_H_
#define XGBOOST_LEARNER_OBJECTIVE_H_
#include <vector>
#include "./dmatrix.h"
namespace xgboost {
namespace learner {
/*! \brief interface of objective function */
class IObjFunction{
public:
/*! \brief virtual destructor */
virtual ~IObjFunction(void) {}
/*!
* \brief set parameters from outside
* \param name name of the parameter
* \param val value of the parameter
*/
virtual void SetParam(const char *name, const char *val) = 0;
/*!
* \brief get gradient over each of predictions, given existing information
* \param preds prediction of current round
* \param info information about labels, weights, groups in rank
* \param iter current iteration number
   * \param out_gpair output vector that stores the gradient and second order gradient
*/
virtual void GetGradient(const std::vector<float> &preds,
const MetaInfo &info,
int iter,
std::vector<bst_gpair> *out_gpair) = 0;
/*! \return the default evaluation metric for the objective */
virtual const char* DefaultEvalMetric(void) const = 0;
  // the following functions are optional; most of the time the default implementation is good enough
/*!
   * \brief transform prediction values; this is only called when prediction is performed
* \param io_preds prediction values, saves to this vector as well
*/
virtual void PredTransform(std::vector<float> *io_preds) {}
/*!
   * \brief transform prediction values; this is only called when Eval is called,
   *        and usually it redirects to PredTransform
* \param io_preds prediction values, saves to this vector as well
*/
virtual void EvalTransform(std::vector<float> *io_preds) {
this->PredTransform(io_preds);
}
/*!
* \brief transform probability value back to margin
* this is used to transform user-set base_score back to margin
* used by gradient boosting
* \return transformed value
*/
virtual float ProbToMargin(float base_score) const {
return base_score;
}
};
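// A minimal sketch of implementing this interface (illustrative only;
// MySquaredErrorObj is hypothetical and not part of the codebase):
//
//   class MySquaredErrorObj : public IObjFunction {
//    public:
//     virtual void SetParam(const char *name, const char *val) {}
//     virtual void GetGradient(const std::vector<float> &preds,
//                              const MetaInfo &info, int iter,
//                              std::vector<bst_gpair> *out_gpair) {
//       out_gpair->resize(preds.size());
//       for (size_t i = 0; i < preds.size(); ++i) {
//         const float w = info.GetWeight(i);
//         // grad = (pred - label) * w, hess = w for squared error
//         (*out_gpair)[i] = bst_gpair((preds[i] - info.labels[i]) * w, w);
//       }
//     }
//     virtual const char* DefaultEvalMetric(void) const { return "rmse"; }
//   };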
} // namespace learner
} // namespace xgboost
// these are the implementations of the objective functions
#include "objective-inl.hpp"
// factory function
namespace xgboost {
namespace learner {
/*! \brief factory function to create objective function by name */
inline IObjFunction* CreateObjFunction(const char *name) {
using namespace std;
if (!strcmp("reg:linear", name)) return new RegLossObj(LossType::kLinearSquare);
if (!strcmp("reg:logistic", name)) return new RegLossObj(LossType::kLogisticNeglik);
if (!strcmp("binary:logistic", name)) return new RegLossObj(LossType::kLogisticClassify);
if (!strcmp("binary:logitraw", name)) return new RegLossObj(LossType::kLogisticRaw);
if (!strcmp("count:poisson", name)) return new PoissonRegression();
if (!strcmp("multi:softmax", name)) return new SoftmaxMultiClassObj(0);
if (!strcmp("multi:softprob", name)) return new SoftmaxMultiClassObj(1);
if (!strcmp("rank:pairwise", name )) return new PairwiseRankObj();
if (!strcmp("rank:ndcg", name)) return new LambdaRankObjNDCG();
if (!strcmp("rank:map", name)) return new LambdaRankObjMAP();
utils::Error("unknown objective function type: %s", name);
return NULL;
}
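// Example usage (an illustrative sketch; the parameter values are made up):
//   IObjFunction *obj = CreateObjFunction("multi:softmax");
//   obj->SetParam("num_class", "3");
//   std::vector<bst_gpair> gpair;
//   obj->GetGradient(preds, info, iter, &gpair);  // preds/info from the caller
//   delete obj;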
} // namespace learner
} // namespace xgboost
#endif // XGBOOST_LEARNER_OBJECTIVE_H_