From 2f95968a1ca46e4ade45765a612e473cb917a45f Mon Sep 17 00:00:00 2001
From: Boliang Chen
Date: Sun, 11 Jan 2015 15:34:55 +0800
Subject: [PATCH] ok

---
NOTE(review): the script below was edited in review; the blob id on the
"index" line predates that edit.

 multi-node/hadoop/run_hadoop_mushroom.sh | 45 ++++++++++++++++++++++++
 1 file changed, 45 insertions(+)
 create mode 100755 multi-node/hadoop/run_hadoop_mushroom.sh

diff --git a/multi-node/hadoop/run_hadoop_mushroom.sh b/multi-node/hadoop/run_hadoop_mushroom.sh
new file mode 100755
index 000000000..2f095ff25
--- /dev/null
+++ b/multi-node/hadoop/run_hadoop_mushroom.sh
@@ -0,0 +1,45 @@
+#!/bin/bash
+#
+# Train xgboost on the mushroom (agaricus) demo data through rabit_hadoop.py,
+# then fetch the model from HDFS and run prediction and model dumps locally.
+#
+# Usage: run_hadoop_mushroom.sh <nworkers> <path_in_HDFS>
+#   $1  forwarded to rabit_hadoop.py as -n (presumably the worker count)
+#   $2  HDFS directory; data is stored in $2/data, the model in $2/model
+#
+# All paths are relative, so run this from multi-node/hadoop.
+
+if [ "$#" -lt 2 ]; then
+    echo "Usage: $0 <nworkers> <path_in_HDFS>" >&2
+    exit 1
+fi
+
+nworkers=$1
+hdfs_dir=$2
+
+# put the local training file to HDFS
+# (kept non-fatal: on a re-run the directory or file may already be there)
+hadoop fs -mkdir "$hdfs_dir/data"
+hadoop fs -put ../../demo/data/agaricus.txt.train "$hdfs_dir/data"
+
+# training and output the final model file; stop here on failure, since
+# every later step needs the model this job produces
+../../rabit/tracker/rabit_hadoop.py -n "$nworkers" \
+    -i "$hdfs_dir/data/agaricus.txt.train" \
+    -o "$hdfs_dir/model" -f ../../demo/data/agaricus.txt.test \
+    ../../xgboost mushroom.hadoop.conf dsplit=row || exit 1
+
+# get the final model file; drop any stale local copy first so the steps
+# below can only ever see the model that was just trained
+rm -f ./final.model
+hadoop fs -get "$hdfs_dir/model/part-00000" ./final.model || exit 1
+
+# output prediction task=pred
+../../xgboost mushroom.hadoop.conf task=pred model_in=final.model \
+    test:data=../../demo/data/agaricus.txt.test
+# print the boosters of final.model in dump.raw.txt
+../../xgboost mushroom.hadoop.conf task=dump model_in=final.model name_dump=dump.raw.txt
+# use the feature map in printing for better visualization
+../../xgboost mushroom.hadoop.conf task=dump model_in=final.model \
+    fmap=../../demo/data/featmap.txt name_dump=dump.nice.txt
+cat dump.nice.txt