From 8ba4722d0484a891e4f9ceba11ccbb5042809f22 Mon Sep 17 00:00:00 2001 From: Jiaming Yuan Date: Wed, 11 May 2022 20:54:48 +0800 Subject: [PATCH] Remove pyarrow workaround. (#7884) --- python-package/xgboost/data.py | 9 +-------- 1 file changed, 1 insertion(+), 8 deletions(-) diff --git a/python-package/xgboost/data.py b/python-package/xgboost/data.py index 47c41d994..d21c97910 100644 --- a/python-package/xgboost/data.py +++ b/python-package/xgboost/data.py @@ -2,7 +2,6 @@ # pylint: disable=too-many-return-statements, import-error '''Data dispatching for DMatrix.''' import ctypes -from distutils import version import json import warnings import os @@ -590,13 +589,7 @@ def _from_arrow( if enable_categorical: raise ValueError("categorical data in arrow is not supported yet.") - major, _, _ = version.StrictVersion(pa.__version__).version - if major == 4: - rb_iter = iter(data.to_batches()) - else: - # use_async=True to workaround pyarrow 6.0.1 hang, - # see Modin-3982 and ARROW-15362 - rb_iter = iter(data.to_batches(use_async=True)) + rb_iter = iter(data.to_batches()) it = record_batch_data_iter(rb_iter) next_callback = ctypes.CFUNCTYPE(ctypes.c_int, ctypes.c_void_p)(it) handle = ctypes.c_void_p()