Remove the deprecated Python rabit module. (#9523)
parent aa86bd5207
commit 209335b18c
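
Migration sketch (illustrative, not part of the diff): the removed xgboost.rabit shim only forwarded to xgboost.collective, so existing callers can switch to the collective API directly. The sketch below is modelled on the test removed later in this diff; it assumes RabitTracker is importable from xgboost.tracker and that CommunicatorContext accepts the tracker's environment as keyword arguments, which mirrors what the removed shim's init() passed through to collective.init().

# A minimal rabit -> collective migration sketch, modelled on the removed
# test_rabit_api further down in this diff. Assumptions: RabitTracker lives in
# xgboost.tracker, and CommunicatorContext forwards its keyword arguments to
# collective.init() the same way the deleted shim did.
import multiprocessing

import numpy as np
import xgboost as xgb
from xgboost.tracker import RabitTracker  # assumption: tracker module location


def worker(env, world_size):
    # Old code wrapped this in xgb.rabit.RabitContext([b"key=value", ...]);
    # the collective API takes the same settings as keyword arguments instead.
    with xgb.collective.CommunicatorContext(**env):
        assert xgb.collective.get_world_size() == world_size
        ret = xgb.collective.broadcast("test1234", 0)   # replaces xgb.rabit.broadcast
        assert str(ret) == "test1234"
        ret = xgb.collective.allreduce(                 # replaces xgb.rabit.allreduce
            np.asarray([1, 2, 3]), xgb.collective.Op.SUM
        )
        assert np.array_equal(ret, np.asarray([2, 4, 6]))


if __name__ == "__main__":
    world_size = 2
    tracker = RabitTracker(host_ip="127.0.0.1", n_workers=world_size)
    tracker.start(world_size)
    env = tracker.worker_envs()  # key/value pairs the shim used to encode as bytes
    workers = [
        multiprocessing.Process(target=worker, args=(env, world_size))
        for _ in range(world_size)
    ]
    for w in workers:
        w.start()
    for w in workers:
        w.join()
        assert w.exitcode == 0
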
@@ -4,7 +4,7 @@ Contributors: https://github.com/dmlc/xgboost/blob/master/CONTRIBUTORS.md
 """

 from . import tracker  # noqa
-from . import collective, dask, rabit
+from . import collective, dask
 from .core import (
     Booster,
     DataIter,
@@ -1,169 +0,0 @@
-"""Compatibility shim for xgboost.rabit; to be removed in 2.0"""
-import logging
-import warnings
-from enum import IntEnum, unique
-from typing import Any, Callable, List, Optional, TypeVar
-
-import numpy as np
-
-from . import collective
-
-LOGGER = logging.getLogger("[xgboost.rabit]")
-
-
-def _deprecation_warning() -> str:
-    return (
-        "The xgboost.rabit submodule is marked as deprecated in 1.7 and will be removed "
-        "in 2.0. Please use xgboost.collective instead."
-    )
-
-
-def init(args: Optional[List[bytes]] = None) -> None:
-    """Initialize the rabit library with arguments"""
-    warnings.warn(_deprecation_warning(), FutureWarning)
-    parsed = {}
-    if args:
-        for arg in args:
-            kv = arg.decode().split("=")
-            if len(kv) == 2:
-                parsed[kv[0]] = kv[1]
-    collective.init(**parsed)
-
-
-def finalize() -> None:
-    """Finalize the process, notify tracker everything is done."""
-    collective.finalize()
-
-
-def get_rank() -> int:
-    """Get rank of current process.
-    Returns
-    -------
-    rank : int
-        Rank of current process.
-    """
-    return collective.get_rank()
-
-
-def get_world_size() -> int:
-    """Get total number workers.
-    Returns
-    -------
-    n : int
-        Total number of process.
-    """
-    return collective.get_world_size()
-
-
-def is_distributed() -> int:
-    """If rabit is distributed."""
-    return collective.is_distributed()
-
-
-def tracker_print(msg: Any) -> None:
-    """Print message to the tracker.
-    This function can be used to communicate the information of
-    the progress to the tracker
-    Parameters
-    ----------
-    msg : str
-        The message to be printed to tracker.
-    """
-    collective.communicator_print(msg)
-
-
-def get_processor_name() -> bytes:
-    """Get the processor name.
-    Returns
-    -------
-    name : str
-        the name of processor(host)
-    """
-    return collective.get_processor_name().encode()
-
-
-T = TypeVar("T")  # pylint:disable=invalid-name
-
-
-def broadcast(data: T, root: int) -> T:
-    """Broadcast object from one node to all other nodes.
-    Parameters
-    ----------
-    data : any type that can be pickled
-        Input data, if current rank does not equal root, this can be None
-    root : int
-        Rank of the node to broadcast data from.
-    Returns
-    -------
-    object : int
-        the result of broadcast.
-    """
-    return collective.broadcast(data, root)
-
-
-@unique
-class Op(IntEnum):
-    """Supported operations for rabit."""
-
-    MAX = 0
-    MIN = 1
-    SUM = 2
-    OR = 3
-
-
-def allreduce(  # pylint:disable=invalid-name
-    data: np.ndarray, op: Op, prepare_fun: Optional[Callable[[np.ndarray], None]] = None
-) -> np.ndarray:
-    """Perform allreduce, return the result.
-    Parameters
-    ----------
-    data :
-        Input data.
-    op :
-        Reduction operators, can be MIN, MAX, SUM, BITOR
-    prepare_fun :
-        Lazy preprocessing function, if it is not None, prepare_fun(data)
-        will be called by the function before performing allreduce, to initialize the data
-        If the result of Allreduce can be recovered directly,
-        then prepare_fun will NOT be called
-    Returns
-    -------
-    result :
-        The result of allreduce, have same shape as data
-    Notes
-    -----
-    This function is not thread-safe.
-    """
-    if prepare_fun is None:
-        return collective.allreduce(data, collective.Op(op))
-    raise ValueError("preprocessing function is no longer supported")
-
-
-def version_number() -> int:
-    """Returns version number of current stored model.
-    This means how many calls to CheckPoint we made so far.
-    Returns
-    -------
-    version : int
-        Version number of currently stored model
-    """
-    return 0
-
-
-class RabitContext:
-    """A context controlling rabit initialization and finalization."""
-
-    def __init__(self, args: Optional[List[bytes]] = None) -> None:
-        if args is None:
-            args = []
-        self.args = args
-
-    def __enter__(self) -> None:
-        init(self.args)
-        assert is_distributed()
-        LOGGER.warning(_deprecation_warning())
-        LOGGER.debug("-------------- rabit say hello ------------------")
-
-    def __exit__(self, *args: List) -> None:
-        finalize()
-        LOGGER.debug("--------------- rabit say bye ------------------")
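
As the removed shim shows, rabit's byte-string arguments were simply decoded into keyword arguments for collective.init(), and every other call forwarded one-to-one. For code that managed the lifecycle explicitly rather than through a context manager, here is a minimal sketch of the direct replacement, using only functions the shim itself calls; the DMLC_* key/value pairs are illustrative placeholders for whatever the tracker provides, not documented defaults.

# Direct equivalent of the removed init()/finalize() pair, assuming a tracker is
# already listening at the (illustrative) address and port below.
from xgboost import collective

# Old: xgb.rabit.init([b"DMLC_TRACKER_URI=...", b"DMLC_TRACKER_PORT=..."])
# New: decode the "key=value" pairs (as the shim did) and call collective.init.
args = [b"DMLC_TRACKER_URI=127.0.0.1", b"DMLC_TRACKER_PORT=9091"]  # placeholder values
parsed = dict(arg.decode().split("=", 1) for arg in args)
collective.init(**parsed)
try:
    collective.communicator_print(
        f"worker {collective.get_rank()} of {collective.get_world_size()}\n"
    )
finally:
    collective.finalize()  # replaces xgb.rabit.finalize()
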
@@ -39,37 +39,6 @@ def test_rabit_communicator():
         assert worker.exitcode == 0


-# TODO(rongou): remove this once we remove the rabit api.
-def run_rabit_api_worker(rabit_env, world_size):
-    with xgb.rabit.RabitContext(rabit_env):
-        assert xgb.rabit.get_world_size() == world_size
-        assert xgb.rabit.is_distributed()
-        assert xgb.rabit.get_processor_name().decode() == socket.gethostname()
-        ret = xgb.rabit.broadcast('test1234', 0)
-        assert str(ret) == 'test1234'
-        ret = xgb.rabit.allreduce(np.asarray([1, 2, 3]), xgb.rabit.Op.SUM)
-        assert np.array_equal(ret, np.asarray([2, 4, 6]))
-
-
-# TODO(rongou): remove this once we remove the rabit api.
-def test_rabit_api():
-    world_size = 2
-    tracker = RabitTracker(host_ip='127.0.0.1', n_workers=world_size)
-    tracker.start(world_size)
-    rabit_env = []
-    for k, v in tracker.worker_envs().items():
-        rabit_env.append(f"{k}={v}".encode())
-    workers = []
-    for _ in range(world_size):
-        worker = multiprocessing.Process(target=run_rabit_api_worker,
-                                         args=(rabit_env, world_size))
-        workers.append(worker)
-        worker.start()
-    for worker in workers:
-        worker.join()
-        assert worker.exitcode == 0
-
-
 def run_federated_worker(port, world_size, rank):
     with xgb.collective.CommunicatorContext(xgboost_communicator='federated',
                                             federated_server_address=f'localhost:{port}',