Merge pull request #450 from phunterlau/master

add necessary configrations for pip installation
This commit is contained in:
Tianqi Chen 2015-08-20 18:45:30 -07:00
commit 19eef1d0da
9 changed files with 114 additions and 7 deletions

View File

@ -43,4 +43,5 @@ on going at master
* Python module now has importance plot and tree plot functions. * Python module now has importance plot and tree plot functions.
* Java api is ready for use * Java api is ready for use
* Added more test cases and continuous integration to make each build more robust * Added more test cases and continuous integration to make each build more robust
* Improvements in sklearn compatible module * Improvements in sklearn compatible module
* Added pip installation functionality for python module

View File

@ -45,4 +45,6 @@ List of Contributors
- Jamie is the initial creator of xgboost sklearn modue. - Jamie is the initial creator of xgboost sklearn modue.
* [Yen-Ying Lee](https://github.com/white1033) * [Yen-Ying Lee](https://github.com/white1033)
* [Masaaki Horikoshi](https://github.com/sinhrks) * [Masaaki Horikoshi](https://github.com/sinhrks)
- Masaaki is the initial creator of xgboost python plotting module. - Masaaki is the initial creator of xgboost python plotting module.
* [Hongliang Liu](https://github.com/phunterlau)
- Hongliang is the maintainer of xgboost python PyPI package for pip installation.

View File

@ -1,4 +1,5 @@
export CC = gcc export CC = gcc
#build on the fly
export CXX = g++ export CXX = g++
export MPICXX = mpicxx export MPICXX = mpicxx
export LDFLAGS= -pthread -lm export LDFLAGS= -pthread -lm
@ -167,6 +168,30 @@ Rcheck:
make Rbuild make Rbuild
R CMD check --as-cran xgboost*.tar.gz R CMD check --as-cran xgboost*.tar.gz
pythonpack:
#make clean
cd subtree/rabit;make clean;cd ..
rm -rf xgboost-deploy xgboost*.tar.gz
cp -r python-package xgboost-deploy
cp *.md xgboost-deploy/
cp LICENSE xgboost-deploy/
cp Makefile xgboost-deploy/xgboost
cp -r wrapper xgboost-deploy/xgboost
cp -r subtree xgboost-deploy/xgboost
cp -r multi-node xgboost-deploy/xgboost
cp -r windows xgboost-deploy/xgboost
cp -r src xgboost-deploy/xgboost
#make python
pythonbuild:
make pythonpack
python setup.py install
pythoncheck:
make pythonbuild
python -c 'import xgboost;print xgboost.core.find_lib_path()'
# lint requires dmlc to be in current folder # lint requires dmlc to be in current folder
lint: lint:
dmlc-core/scripts/lint.py xgboost $(LINT_LANG) src wrapper R-package python-package dmlc-core/scripts/lint.py xgboost $(LINT_LANG) src wrapper R-package python-package

View File

@ -0,0 +1,7 @@
include *.sh *.md
recursive-include xgboost *
recursive-include xgboost/wrapper *
recursive-include xgboost/windows *
recursive-include xgboost/subtree *
recursive-include xgboost/src *
recursive-include xgboost/multi-node *

View File

@ -1,7 +1,26 @@
XGBoost Python Package XGBoost Python Package
====================== ======================
Installation
------------
We are on [PyPI](https://pypi.python.org/pypi/xgboost) now. For stable version, please install using pip:
* ```pip install xgboost```
* Note for windows users: this pip installation may not work on some windows environment. Please install from github if pip doesn't work on windows.
For up-to-date version, please install from github.
* To make the python module, type ```./build.sh``` in the root directory of project * To make the python module, type ```./build.sh``` in the root directory of project
* Make sure you have [setuptools](https://pypi.python.org/pypi/setuptools) * Make sure you have [setuptools](https://pypi.python.org/pypi/setuptools)
* Install with `python setup.py install` from this directory. * Install with `python setup.py install` from this directory.
Examples
------
* Refer also to the walk through example in [demo folder](../demo/guide-python) * Refer also to the walk through example in [demo folder](../demo/guide-python)
* **NOTE**: if you want to run XGBoost process in parallel using the fork backend for joblib/multiprocessing, you must build XGBoost without support for OpenMP by `make no_omp=1`. Otherwise, use the forkserver (in Python 3.4) or spawn backend. See the sklearn_parallel.py demo. * See also the [example scripts](../demo/kaggle-higgs) for Kaggle Higgs Challenge, including [speedtest script](../demo/kaggle-higgs/speedtest.py) on this dataset.
Note
-----
* If you want to build xgboost on Mac OS X with multiprocessing support where clang in XCode by default doesn't support, please install gcc 4.9 or higher using [homebrew](http://brew.sh/) ```brew tap homebrew/versions; brew install gcc49```
* If you want to run XGBoost process in parallel using the fork backend for joblib/multiprocessing, you must build XGBoost without support for OpenMP by `make no_omp=1`. Otherwise, use the forkserver (in Python 3.4) or spawn backend. See the [sklearn_parallel.py](../demo/guide-python/sklearn_parallel.py) demo.

2
python-package/setup.cfg Normal file
View File

@ -0,0 +1,2 @@
[metadata]
description-file = README.md

View File

@ -2,20 +2,43 @@
"""Setup xgboost package.""" """Setup xgboost package."""
from __future__ import absolute_import from __future__ import absolute_import
import sys import sys
from setuptools import setup from setuptools import setup, find_packages
import subprocess
sys.path.insert(0, '.') sys.path.insert(0, '.')
#build on the fly
build_sh = subprocess.Popen(['sh', 'xgboost/build-python.sh'])
build_sh.wait()
output = build_sh.communicate()
print output
import xgboost import xgboost
LIB_PATH = xgboost.core.find_lib_path() LIB_PATH = xgboost.core.find_lib_path()
#print LIB_PATH
#to deploy to pip, please use
#make pythonpack
#python setup.py register sdist upload
#and be sure to test it firstly using "python setup.py register sdist upload -r pypitest"
setup(name='xgboost', setup(name='xgboost',
version=xgboost.__version__, version=xgboost.__version__,
#version='0.4a12',
description=xgboost.__doc__, description=xgboost.__doc__,
install_requires=[ install_requires=[
'numpy', 'numpy',
'scipy', 'scipy',
], ],
maintainer='Hongliang Liu',
maintainer_email='phunter.lau@gmail.com',
zip_safe=False, zip_safe=False,
packages=['xgboost'], packages=find_packages(),
data_files=[('xgboost', [LIB_PATH[0]])], #don't need this and don't use this, give everything to MANIFEST.in
#package_dir = {'':'xgboost'},
#package_data = {'': ['*.txt','*.md','*.sh'],
# }
#this will use MANIFEST.in during install where we specify additional files,
#this is the golden line
include_package_data=True,
data_files=[('xgboost', LIB_PATH)],
url='https://github.com/dmlc/xgboost') url='https://github.com/dmlc/xgboost')

View File

@ -0,0 +1,26 @@
#!/bin/bash
# This is a simple script to make xgboost in MAC and Linux for python wrapper only
# Basically, it first try to make with OpenMP, if fails, disable OpenMP and make it again.
# This will automatically make xgboost for MAC users who don't have OpenMP support.
# In most cases, type make will give what you want.
# See additional instruction in doc/build.md
# note: this script is build for python package only, and it might have some filename
# conflict with build.sh which is for everything.
pushd xgboost
if make python; then
echo "Successfully build multi-thread xgboost"
else
echo "-----------------------------"
echo "Building multi-thread xgboost failed"
echo "Start to build single-thread xgboost"
make clean
make python no_omp=1
echo "Successfully build single-thread xgboost"
echo "If you want multi-threaded version"
echo "See additional instructions in doc/build.md"
fi
popd

View File

@ -39,7 +39,9 @@ def find_lib_path():
List of all found library path to xgboost List of all found library path to xgboost
""" """
curr_path = os.path.dirname(os.path.abspath(os.path.expanduser(__file__))) curr_path = os.path.dirname(os.path.abspath(os.path.expanduser(__file__)))
dll_path = [curr_path, os.path.join(curr_path, '../../wrapper/')] #make pythonpack hack: copy this directory one level upper for setup.py
dll_path = [curr_path, os.path.join(curr_path, '../../wrapper/')
, os.path.join(curr_path, './wrapper/')]
if os.name == 'nt': if os.name == 'nt':
if platform.architecture()[0] == '64bit': if platform.architecture()[0] == '64bit':
dll_path.append(os.path.join(curr_path, '../../windows/x64/Release/')) dll_path.append(os.path.join(curr_path, '../../windows/x64/Release/'))