add mushroom classification

2014-02-24 22:25:43 -08:00 · 2014-02-24 22:25:43 -08:00 · 9d6ef11eb5
commit 9d6ef11eb5
parent 4aa4faa625
2 changed files with 26 additions and 3 deletions
--- a/demo/mushroom/mushroom.conf
+++ b/demo/mushroom/mushroom.conf
@ -1,4 +1,4 @@
-num_round=10
+num_round=2

 save_period=0

@ -6,7 +6,7 @@ data = "agaricus.txt.train"
 eval[test] = "agaricus.txt.test"

 booster_type = 0
-loss_type = 1
+loss_type = 2

 bst:num_feature=126
 bst:eta=1.0
--- a/regression/xgboost_reg.h
+++ b/regression/xgboost_reg.h
@ -172,6 +172,7 @@ namespace xgboost{
            enum LossType{
                kLinearSquare = 0,
                kLogisticNeglik = 1,
+                kLogisticClassify = 2
            };

            /*! \brief training parameter for regression */
@ -211,6 +212,7 @@ namespace xgboost{
                inline float PredTransform( float x ){
                    switch( loss_type ){                        
                    case kLinearSquare: return x;
+                    case kLogisticClassify:
                    case kLogisticNeglik: return 1.0f/(1.0f + expf(-x));
                    default: utils::Error("unknown loss_type"); return 0.0f;
                    }
@ -225,7 +227,8 @@ namespace xgboost{
                inline float FirstOrderGradient( float predt, float label ) const{
                    switch( loss_type ){                        
                    case kLinearSquare: return predt - label;
-                    case 1: return predt - label;
+                    case kLogisticClassify:
+                    case kLogisticNeglik: return predt - label;
                    default: utils::Error("unknown loss_type"); return 0.0f;
                    }
                }
@ -238,6 +241,7 @@ namespace xgboost{
                inline float SecondOrderGradient( float predt, float label ) const{
                    switch( loss_type ){                        
                    case kLinearSquare: return 1.0f;
+                    case kLogisticClassify:
                    case kLogisticNeglik: return predt * ( 1 - predt );
                    default: utils::Error("unknown loss_type"); return 0.0f;
                    }
@ -253,6 +257,7 @@ namespace xgboost{
                    switch( loss_type ){
                    case kLinearSquare: return SquareLoss(preds,labels);
                    case kLogisticNeglik: return NegLoglikelihoodLoss(preds,labels);
+                    case kLogisticClassify: return ClassificationError(preds, labels);
                    default: utils::Error("unknown loss_type"); return 0.0f;
                    }
                }
@ -284,6 +289,24 @@ namespace xgboost{
                        ans -= labels[i] * logf(preds[i]) + ( 1 - labels[i] ) * logf(1 - preds[i]);
                    return ans;
                }
+
+                /*!
+                * \brief calculating the ClassificationError  loss, given the predictions and labels
+                * \param preds the given predictions
+                * \param labels the given labels
+                * \return the summation of square loss
+                */
+                inline float ClassificationError(const std::vector<float> &preds, const std::vector<float> &labels) const{
+                    int nerr = 0;
+                    for(size_t i = 0; i < preds.size(); i++){
+                        if( preds[i] > 0.5f ){
+                            if( labels[i] < 0.5f ) nerr ++;
+                        }else{
+                            if( labels[i] > 0.5f ) nerr ++;
+                        }
+                    }
+                    return (float)nerr/preds.size();
+                }                
            };
        private:
            int silent;