Fix #3663: Allow sklearn API to use callbacks (#3682)

* Fix #3663: Allow sklearn API to use callbacks

* Fix lint

* Add Callback API to Python API doc
mrgutkun 2018-09-07 23:51:26 +03:00 committed by Philip Hyunsu Cho
parent 5a8bbb39a1
commit 4b43810f51
4 changed files with 104 additions and 53 deletions


@@ -53,3 +53,15 @@ Plotting API
 .. autofunction:: xgboost.plot_tree
 .. autofunction:: xgboost.to_graphviz
+.. _callback_api:
+
+Callback API
+------------
+.. autofunction:: xgboost.callback.print_evaluation
+.. autofunction:: xgboost.callback.record_evaluation
+.. autofunction:: xgboost.callback.reset_learning_rate
+.. autofunction:: xgboost.callback.early_stop
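For context, a minimal sketch of how these predefined callbacks combine with ``xgb.train`` (synthetic data and illustrative parameter values only, not part of this diff):

.. code-block:: python

    import numpy as np
    import xgboost as xgb

    # Synthetic data, purely for illustration.
    X = np.random.rand(100, 5)
    y = np.random.randint(2, size=100)
    dtrain = xgb.DMatrix(X[:80], label=y[:80])
    dvalid = xgb.DMatrix(X[80:], label=y[80:])

    history = {}
    bst = xgb.train(
        {'objective': 'binary:logistic'},
        dtrain,
        num_boost_round=50,
        evals=[(dvalid, 'valid')],
        callbacks=[
            xgb.callback.print_evaluation(period=10),    # log every 10 rounds
            xgb.callback.record_evaluation(history),     # collect metrics into `history`
            xgb.callback.early_stop(stopping_rounds=5),  # stop if no improvement
        ])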


@@ -32,7 +32,7 @@ def _fmt_metric(value, show_stdv=True):
 def print_evaluation(period=1, show_stdv=True):
     """Create a callback that print evaluation result.
-    We print the evaluation results every ``period`` iterations
+    We print the evaluation results every **period** iterations
     and on the first and the last iterations.
     Parameters
@@ -60,7 +60,7 @@ def print_evaluation(period=1, show_stdv=True):
 def record_evaluation(eval_result):
-    """Create a call back that records the evaluation history into eval_result.
+    """Create a call back that records the evaluation history into **eval_result**.
     Parameters
     ----------
@@ -109,10 +109,11 @@ def reset_learning_rate(learning_rates):
     learning_rates: list or function
         List of learning rate for each boosting round
        or a customized function that calculates eta in terms of
-        current number of round and the total number of boosting round (e.g. yields
-        learning rate decay)
-        - list l: eta = l[boosting_round]
-        - function f: eta = f(boosting_round, num_boost_round)
+        current number of round and the total number of boosting round (e.g.
+        yields learning rate decay)
+        * list ``l``: ``eta = l[boosting_round]``
+        * function ``f``: ``eta = f(boosting_round, num_boost_round)``
     Returns
     -------
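A sketch of the two forms described above, a per-round list and a decay function ``f(boosting_round, num_boost_round)`` (names and rates are illustrative):

.. code-block:: python

    import xgboost as xgb

    # Either give one learning rate per boosting round
    # (the list length must equal num_boost_round) ...
    rates = [0.3, 0.2, 0.1, 0.05, 0.05]
    lr_from_list = xgb.callback.reset_learning_rate(rates)

    # ... or a function of the current round and the total number of rounds.
    def eta_decay(boosting_round, num_boost_round):
        return 0.3 * (0.99 ** boosting_round)

    lr_from_func = xgb.callback.reset_learning_rate(eta_decay)
    # Pass either callback via callbacks=[...] to xgb.train / xgb.cv, or, with
    # this change, to the sklearn wrappers' fit().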
@@ -150,14 +151,14 @@ def early_stop(stopping_rounds, maximize=False, verbose=True):
     """Create a callback that activates early stoppping.
     Validation error needs to decrease at least
-    every <stopping_rounds> round(s) to continue training.
-    Requires at least one item in evals.
+    every **stopping_rounds** round(s) to continue training.
+    Requires at least one item in **evals**.
     If there's more than one, will use the last.
     Returns the model from the last iteration (not the best one).
     If early stopping occurs, the model will have three additional fields:
-    bst.best_score, bst.best_iteration and bst.best_ntree_limit.
-    (Use bst.best_ntree_limit to get the correct value if num_parallel_tree
-    and/or num_class appears in the parameters)
+    ``bst.best_score``, ``bst.best_iteration`` and ``bst.best_ntree_limit``.
+    (Use ``bst.best_ntree_limit`` to get the correct value if ``num_parallel_tree``
+    and/or ``num_class`` appears in the parameters)
     Parameters
     ----------
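A short sketch of the behaviour this docstring describes: train with the ``early_stop`` callback, then predict with ``best_ntree_limit`` (synthetic data; exact attribute availability when early stopping never triggers may vary by version):

.. code-block:: python

    import numpy as np
    import xgboost as xgb

    X = np.random.rand(200, 4)
    y = np.random.rand(200)
    dtrain = xgb.DMatrix(X[:150], label=y[:150])
    dvalid = xgb.DMatrix(X[150:], label=y[150:])

    bst = xgb.train({'objective': 'reg:linear'}, dtrain, num_boost_round=100,
                    evals=[(dvalid, 'valid')],
                    callbacks=[xgb.callback.early_stop(stopping_rounds=10)])

    # The returned model is from the last iteration; use best_ntree_limit to
    # predict with the best iteration found by early stopping.
    preds = bst.predict(dvalid, ntree_limit=bst.best_ntree_limit)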


@@ -1,5 +1,5 @@
 # coding: utf-8
-# pylint: disable=too-many-arguments, too-many-locals, invalid-name, fixme, E0012, R0912
+# pylint: disable=too-many-arguments, too-many-locals, invalid-name, fixme, E0012, R0912, C0302
 """Scikit-Learn Wrapper interface for XGBoost."""
 from __future__ import absolute_import
@@ -69,9 +69,9 @@ class XGBModel(XGBModelBase):
     booster: string
         Specify which booster to use: gbtree, gblinear or dart.
     nthread : int
-        Number of parallel threads used to run xgboost. (Deprecated, please use n_jobs)
+        Number of parallel threads used to run xgboost. (Deprecated, please use ``n_jobs``)
     n_jobs : int
-        Number of parallel threads used to run xgboost. (replaces nthread)
+        Number of parallel threads used to run xgboost. (replaces ``nthread``)
     gamma : float
         Minimum loss reduction required to make a further partition on a leaf node of the tree.
     min_child_weight : int
@@ -242,7 +242,7 @@ class XGBModel(XGBModelBase):
     def fit(self, X, y, sample_weight=None, eval_set=None, eval_metric=None,
             early_stopping_rounds=None, verbose=True, xgb_model=None,
-            sample_weight_eval_set=None):
+            sample_weight_eval_set=None, callbacks=None):
         # pylint: disable=missing-docstring,invalid-name,attribute-defined-outside-init
         """
         Fit the gradient boosting model
@@ -285,6 +285,14 @@ class XGBModel(XGBModelBase):
         xgb_model : str
             file name of stored xgb model or 'Booster' instance Xgb model to be
             loaded before training (allows training continuation).
+        callbacks : list of callback functions
+            List of callback functions that are applied at end of each iteration.
+            It is possible to use predefined callbacks by using :ref:`callback_api`.
+            Example:
+            .. code-block:: python
+                [xgb.callback.reset_learning_rate(custom_rates)]
         """
         if sample_weight is not None:
             trainDmatrix = DMatrix(X, label=y, weight=sample_weight,
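Since this new ``callbacks`` argument is the core of the change, a minimal sketch of the sklearn-style usage it enables (synthetic data; parameter values are only illustrative):

.. code-block:: python

    import numpy as np
    import xgboost as xgb

    X = np.random.rand(120, 6)
    y = np.random.rand(120)
    X_train, X_val = X[:100], X[100:]
    y_train, y_val = y[:100], y[100:]

    reg = xgb.XGBRegressor(n_estimators=50)
    custom_rates = [0.3] * 25 + [0.1] * 25   # one rate per boosting round
    reg.fit(X_train, y_train,
            eval_set=[(X_val, y_val)],
            eval_metric='rmse',
            callbacks=[xgb.callback.reset_learning_rate(custom_rates)])
    print(reg.evals_result())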
@@ -325,7 +333,8 @@ class XGBModel(XGBModelBase):
             self.n_estimators, evals=evals,
             early_stopping_rounds=early_stopping_rounds,
             evals_result=evals_result, obj=obj, feval=feval,
-            verbose_eval=verbose, xgb_model=xgb_model)
+            verbose_eval=verbose, xgb_model=xgb_model,
+            callbacks=callbacks)
         if evals_result:
             for val in evals_result.items():
@@ -413,10 +422,10 @@ class XGBModel(XGBModelBase):
     def evals_result(self):
         """Return the evaluation results.
-        If ``eval_set`` is passed to the `fit` function, you can call ``evals_result()`` to
-        get evaluation results for all passed eval_sets. When ``eval_metric`` is also
-        passed to the ``fit`` function, the ``evals_result`` will contain the ``eval_metrics``
-        passed to the ``fit`` function
+        If **eval_set** is passed to the `fit` function, you can call
+        ``evals_result()`` to get evaluation results for all passed **eval_sets**.
+        When **eval_metric** is also passed to the `fit` function, the
+        **evals_result** will contain the **eval_metrics** passed to the `fit` function.
         Returns
         -------
@@ -438,9 +447,9 @@ class XGBModel(XGBModelBase):
             evals_result = clf.evals_result()
-        The variable evals_result will contain:
-        .. code-block:: none
+        The variable **evals_result** will contain:
+        .. code-block:: python
             {'validation_0': {'logloss': ['0.604835', '0.531479']},
              'validation_1': {'logloss': ['0.41965', '0.17686']}}
@@ -492,7 +501,7 @@ class XGBClassifier(XGBModel, XGBClassifierBase):
     def fit(self, X, y, sample_weight=None, eval_set=None, eval_metric=None,
             early_stopping_rounds=None, verbose=True, xgb_model=None,
-            sample_weight_eval_set=None):
+            sample_weight_eval_set=None, callbacks=None):
         # pylint: disable = attribute-defined-outside-init,arguments-differ
         """
         Fit gradient boosting classifier
@@ -535,6 +544,14 @@ class XGBClassifier(XGBModel, XGBClassifierBase):
         xgb_model : str
             file name of stored xgb model or 'Booster' instance Xgb model to be
             loaded before training (allows training continuation).
+        callbacks : list of callback functions
+            List of callback functions that are applied at end of each iteration.
+            It is possible to use predefined callbacks by using :ref:`callback_api`.
+            Example:
+            .. code-block:: python
+                [xgb.callback.reset_learning_rate(custom_rates)]
         """
         evals_result = {}
         self.classes_ = np.unique(y)
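The classifier gains the same argument; a sketch that records per-iteration metrics with ``record_evaluation`` (hypothetical data):

.. code-block:: python

    import numpy as np
    import xgboost as xgb

    X = np.random.rand(150, 4)
    y = np.random.randint(2, size=150)

    history = {}
    clf = xgb.XGBClassifier(n_estimators=20)
    clf.fit(X[:120], y[:120],
            eval_set=[(X[120:], y[120:])],
            eval_metric='logloss',
            callbacks=[xgb.callback.record_evaluation(history)])
    # history now holds {'validation_0': {'logloss': [...]}}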
@@ -592,7 +609,8 @@ class XGBClassifier(XGBModel, XGBClassifierBase):
             evals=evals,
             early_stopping_rounds=early_stopping_rounds,
             evals_result=evals_result, obj=obj, feval=feval,
-            verbose_eval=verbose, xgb_model=None)
+            verbose_eval=verbose, xgb_model=None,
+            callbacks=callbacks)
         self.objective = xgb_options["objective"]
         if evals_result:
@@ -705,10 +723,10 @@ class XGBClassifier(XGBModel, XGBClassifierBase):
     def evals_result(self):
         """Return the evaluation results.
-        If eval_set is passed to the `fit` function, you can call evals_result() to
-        get evaluation results for all passed eval_sets. When eval_metric is also
-        passed to the `fit` function, the evals_result will contain the eval_metrics
-        passed to the `fit` function
+        If **eval_set** is passed to the `fit` function, you can call
+        ``evals_result()`` to get evaluation results for all passed **eval_sets**.
+        When **eval_metric** is also passed to the `fit` function, the
+        **evals_result** will contain the **eval_metrics** passed to the `fit` function.
         Returns
         -------
@@ -730,9 +748,9 @@ class XGBClassifier(XGBModel, XGBClassifierBase):
             evals_result = clf.evals_result()
-        The variable ``evals_result`` will contain
-        .. code-block:: none
+        The variable **evals_result** will contain
+        .. code-block:: python
             {'validation_0': {'logloss': ['0.604835', '0.531479']},
              'validation_1': {'logloss': ['0.41965', '0.17686']}}
@@ -771,9 +789,9 @@ class XGBRanker(XGBModel):
     booster: string
         Specify which booster to use: gbtree, gblinear or dart.
     nthread : int
-        Number of parallel threads used to run xgboost. (Deprecated, please use n_jobs)
+        Number of parallel threads used to run xgboost. (Deprecated, please use ``n_jobs``)
     n_jobs : int
-        Number of parallel threads used to run xgboost. (replaces nthread)
+        Number of parallel threads used to run xgboost. (replaces ``nthread``)
     gamma : float
         Minimum loss reduction required to make a further partition on a leaf node of the tree.
     min_child_weight : int
@@ -816,8 +834,12 @@ class XGBRanker(XGBModel):
     ----
     A custom objective function is currently not supported by XGBRanker.
-    Group information is required for ranking tasks. Before fitting the model, your data need to
-    be sorted by group. When fitting the model, you need to provide an additional array that
+    Note
+    ----
+    Group information is required for ranking tasks.
+    Before fitting the model, your data need to be sorted by group. When
+    fitting the model, you need to provide an additional array that
     contains the size of each group.
     For example, if your original data look like:
@@ -863,7 +885,7 @@ class XGBRanker(XGBModel):
     def fit(self, X, y, group, sample_weight=None, eval_set=None, sample_weight_eval_set=None,
             eval_group=None, eval_metric=None, early_stopping_rounds=None,
-            verbose=False, xgb_model=None):
+            verbose=False, xgb_model=None, callbacks=None):
         # pylint: disable = attribute-defined-outside-init,arguments-differ
         """
         Fit the gradient boosting model
@@ -911,6 +933,14 @@ class XGBRanker(XGBModel):
         xgb_model : str
             file name of stored xgb model or 'Booster' instance Xgb model to be
             loaded before training (allows training continuation).
+        callbacks : list of callback functions
+            List of callback functions that are applied at end of each iteration.
+            It is possible to use predefined callbacks by using :ref:`callback_api`.
+            Example:
+            .. code-block:: python
+                [xgb.callback.reset_learning_rate(custom_rates)]
         """
         # check if group information is provided
         if group is None:
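A sketch tying together the group requirement documented above and the new ``callbacks`` argument (toy data, already sorted by group; the group sizes and the decay function are illustrative):

.. code-block:: python

    import numpy as np
    import xgboost as xgb

    # 3 queries with 4, 3 and 5 documents each; rows must be sorted by group.
    X = np.random.rand(12, 5)
    y = np.random.randint(3, size=12)   # relevance labels
    group = [4, 3, 5]                   # sizes sum to the number of rows

    ranker = xgb.XGBRanker(n_estimators=10)
    ranker.fit(X, y, group,
               callbacks=[xgb.callback.reset_learning_rate(
                   lambda cur, total: 0.1 * (0.95 ** cur))])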
@@ -963,7 +993,8 @@ class XGBRanker(XGBModel):
             self.n_estimators,
             early_stopping_rounds=early_stopping_rounds, evals=evals,
             evals_result=evals_result, feval=feval,
-            verbose_eval=verbose, xgb_model=xgb_model)
+            verbose_eval=verbose, xgb_model=xgb_model,
+            callbacks=callbacks)
         self.objective = params["objective"]


@@ -137,34 +137,35 @@ def train(params, dtrain, num_boost_round=10, evals=(), obj=None, feval=None,
         Whether to maximize feval.
     early_stopping_rounds: int
         Activates early stopping. Validation error needs to decrease at least
-        every <early_stopping_rounds> round(s) to continue training.
-        Requires at least one item in evals.
+        every **early_stopping_rounds** round(s) to continue training.
+        Requires at least one item in **evals**.
         If there's more than one, will use the last.
         Returns the model from the last iteration (not the best one).
         If early stopping occurs, the model will have three additional fields:
-        bst.best_score, bst.best_iteration and bst.best_ntree_limit.
-        (Use bst.best_ntree_limit to get the correct value if num_parallel_tree
-        and/or num_class appears in the parameters)
+        ``bst.best_score``, ``bst.best_iteration`` and ``bst.best_ntree_limit``.
+        (Use ``bst.best_ntree_limit`` to get the correct value if
+        ``num_parallel_tree`` and/or ``num_class`` appears in the parameters)
     evals_result: dict
         This dictionary stores the evaluation results of all the items in watchlist.
-        Example: with a watchlist containing [(dtest,'eval'), (dtrain,'train')] and
-        a parameter containing ('eval_metric': 'logloss'), the **evals_result**
-        returns
-        .. code-block:: none
+        Example: with a watchlist containing
+        ``[(dtest,'eval'), (dtrain,'train')]`` and
+        a parameter containing ``('eval_metric': 'logloss')``,
+        the **evals_result** returns
+        .. code-block:: python
            {'train': {'logloss': ['0.48253', '0.35953']},
             'eval': {'logloss': ['0.480385', '0.357756']}}
     verbose_eval : bool or int
-        Requires at least one item in evals.
+        Requires at least one item in **evals**.
         If **verbose_eval** is True then the evaluation metric on the validation set is
         printed at each boosting stage.
         If **verbose_eval** is an integer then the evaluation metric on the validation set
         is printed at every given **verbose_eval** boosting stage. The last boosting stage
        / the boosting stage found by using **early_stopping_rounds** is also printed.
-        Example: with ``verbose_eval=4`` and at least one item in evals, an evaluation metric
+        Example: with ``verbose_eval=4`` and at least one item in **evals**, an evaluation metric
        is printed every 4 boosting stages, instead of every boosting stage.
     learning_rates: list or function (deprecated - use callback API instead)
         List of learning rate for each boosting round
@@ -175,12 +176,17 @@ def train(params, dtrain, num_boost_round=10, evals=(), obj=None, feval=None,
         Xgb model to be loaded before training (allows training continuation).
     callbacks : list of callback functions
         List of callback functions that are applied at end of each iteration.
-        It is possible to use predefined callbacks by using xgb.callback module.
-        Example: [xgb.callback.reset_learning_rate(custom_rates)]
+        It is possible to use predefined callbacks by using
+        :ref:`Callback API <callback_api>`.
+        Example:
+        .. code-block:: python
+            [xgb.callback.reset_learning_rate(custom_rates)]
     Returns
     -------
-    booster : a trained booster model
+    Booster : a trained booster model
     """
     callbacks = [] if callbacks is None else callbacks
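Callbacks passed to ``train`` are simply callables invoked at the end of each iteration; a sketch mixing a hypothetical custom callback (``log_iteration``) with a predefined one (synthetic data, made-up rates):

.. code-block:: python

    import numpy as np
    import xgboost as xgb

    X = np.random.rand(100, 5)
    y = np.random.rand(100)
    dtrain = xgb.DMatrix(X, label=y)

    def log_iteration(env):
        # A callback is just a callable taking the callback environment;
        # the predefined ones in xgb.callback follow the same convention.
        if env.iteration % 10 == 0:
            print('finished round', env.iteration)

    custom_rates = list(np.linspace(0.3, 0.05, 30))  # one rate per round
    bst = xgb.train({'objective': 'reg:linear'}, dtrain, num_boost_round=30,
                    callbacks=[log_iteration,
                               xgb.callback.reset_learning_rate(custom_rates)])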
@@ -334,7 +340,7 @@ def cv(params, dtrain, num_boost_round=10, nfold=3, stratified=False, folds=None
     folds : a KFold or StratifiedKFold instance or list of fold indices
         Sklearn KFolds or StratifiedKFolds object.
         Alternatively may explicitly pass sample indices for each fold.
-        For ``n`` folds, ``folds`` should be a length ``n`` list of tuples.
+        For ``n`` folds, **folds** should be a length ``n`` list of tuples.
         Each tuple is ``(in,out)`` where ``in`` is a list of indices to be used
         as the training samples for the ``n`` th fold and ``out`` is a list of
         indices to be used as the testing samples for the ``n`` th fold.
@@ -368,10 +374,11 @@ def cv(params, dtrain, num_boost_round=10, nfold=3, stratified=False, folds=None
         Seed used to generate the folds (passed to numpy.random.seed).
     callbacks : list of callback functions
         List of callback functions that are applied at end of each iteration.
-        It is possible to use predefined callbacks by using xgb.callback module.
+        It is possible to use predefined callbacks by using
+        :ref:`Callback API <callback_api>`.
         Example:
-        .. code-block:: none
+        .. code-block:: python
             [xgb.callback.reset_learning_rate(custom_rates)]
     shuffle : bool
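Finally, a sketch of the same ``callbacks`` argument on ``xgb.cv`` (synthetic data; the returned table holds the per-round cross-validation metrics):

.. code-block:: python

    import numpy as np
    import xgboost as xgb

    X = np.random.rand(200, 5)
    y = np.random.randint(2, size=200)
    dtrain = xgb.DMatrix(X, label=y)

    cv_results = xgb.cv({'objective': 'binary:logistic'}, dtrain,
                        num_boost_round=30, nfold=3,
                        callbacks=[xgb.callback.print_evaluation(period=10,
                                                                 show_stdv=True),
                                   xgb.callback.early_stop(stopping_rounds=5)])
    print(cv_results)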