xgboost/multi-node/hadoop/run_hadoop_mushroom.sh
2015-01-11 16:06:19 +08:00

26 lines
1.0 KiB
Bash
Executable File

#!/bin/bash
if [ "$#" -lt 2 ];
then
echo "Usage: <num_of_slave_nodes> <path_in_HDFS>"
exit -1
fi
# put the local training file to HDFS
hadoop fs -mkdir $2/data
hadoop fs -put ../../demo/data/agaricus.txt.train $2/data
# training and output the final model file
../../rabit/tracker/rabit_hadoop.py -n $1 -i $2/data/agaricus.txt.train -o $2/mushroom.final.model ../../xgboost mushroom.hadoop.conf
# get the final model file
hadoop fs -get $2/mushroom.final.model/part-00000 ./mushroom.final.model
# output prediction task=pred of test:data
../../xgboost mushroom.hadoop.conf task=pred model_in=mushroom.final.model test:data=../../demo/data/agaricus.txt.test
# print the boosters of final.model in dump.raw.txt
../../xgboost mushroom.hadoop.conf task=dump model_in=mushroom.final.model name_dump=dump.raw.txt
# use the feature map in printing for better visualization
../../xgboost mushroom.hadoop.conf task=dump model_in=mushroom.final.model fmap=../../demo/data/featmap.txt name_dump=dump.nice.txt
cat dump.nice.txt