diff --git a/multi-node/hadoop/mushroom.hadoop.conf b/multi-node/hadoop/mushroom.hadoop.conf
new file mode 100644
index 000000000..305b82dd3
--- /dev/null
+++ b/multi-node/hadoop/mushroom.hadoop.conf
@@ -0,0 +1,30 @@
+# General Parameters, see comment for each definition
+# choose the booster, can be gbtree or gblinear
+booster = gbtree
+# choose logistic regression loss function for binary classification
+objective = binary:logistic
+
+# Tree Booster Parameters
+# step size shrinkage
+eta = 1.0
+# minimum loss reduction required to make a further partition
+gamma = 1.0
+# minimum sum of instance weight (hessian) needed in a child
+min_child_weight = 1
+# maximum depth of a tree
+max_depth = 3
+
+# Task Parameters
+# the number of boosting rounds to run
+num_round = 2
+# 0 means do not save any model except the final round model
+save_period = 0
+# The path of training data
+data = stdin
+# The path of model file
+model_out = stdout
+
+# The path of validation data, used to monitor training process, here [test] sets name of the validation set
+eval[test] = "agaricus.txt.test"
+# also evaluate on the training data each round
+eval_train = 1