10 ani în urmă · 0b24ddffa8
--- a/classifier/fpclassifier/randomforest/DTBRandomOblique.cpp
+++ b/classifier/fpclassifier/randomforest/DTBRandomOblique.cpp
@@ -25,13 +25,13 @@ using namespace NICE;
 
															 DTBRandomOblique::DTBRandomOblique ( const Config *conf, string section )
														
 
															 {
														
 
															     random_split_tests = conf->gI(section, "random_split_tests", 10 );
														
 
															-    random_features = conf->gI(section, "random_features", 500 );
														
 
															     max_depth = conf->gI(section, "max_depth", 10 );
														
 
															     minimum_information_gain = conf->gD(section, "minimum_information_gain", 10e-7 );
														
 
															     minimum_entropy = conf->gD(section, "minimum_entropy", 10e-5 );
														
 
															     use_shannon_entropy = conf->gB(section, "use_shannon_entropy", false );
														
 
															     min_examples = conf->gI(section, "min_examples", 50);
														
 
															     save_indices = conf->gB(section, "save_indices", false);
														
 
															+    lambda = conf->gD(section, "lambda", 0.5 );
														
 
															     if ( conf->gB(section, "start_random_generator", false ) )
														
 
															         srand(time(NULL));
														
@@ -115,8 +115,14 @@ void DTBRandomOblique::getDataAndLabel(
 
															         const Example & ce = p.second;
														
 
															         NICE::Vector pixelRepr = f->getFeatureVector( &ce );
														
 
															+        pixelRepr /= pixelRepr.Max();
														
 
															         X.setRow(matIndex,pixelRepr);
														
 
															-        y.set(matIndex,(double)classno);
														
 
															+
														
 
															+        // TODO: multiclass scenarios need a one-vs-all scheme; labels are currently binarized (class 0 -> -1, otherwise +1)
														
 
															+        if ( classno == 0 )
														
 
															+            y.set(matIndex,-1.0);
														
 
															+        else
														
 
															+            y.set(matIndex, 1.0);
														
 
															         matIndex++;
														
 
															     }
														
@@ -163,13 +169,18 @@ DecisionNode *DTBRandomOblique::buildRecursive(
 
															     NICE::Vector y;
														
 
															     getDataAndLabel(fp, examples, examples_selection, X, y);
														
 
															     NICE::Matrix XTX = X.transpose()*X;
														
 
															-    XTX = NICE::invert(XTX);
														
 
															+    XTX.addDiagonal ( NICE::Vector( XTX.rows(), lambda) );
														
 
															+
														
 
															+    // TODO: incorporate weighting according to the class distribution
														
 
															+
														
 
															+    NICE::Matrix G;
														
 
															+    choleskyDecomp(XTX, G);
														
 
															+    choleskyInvert(G, XTX);
														
 
															     NICE::Matrix temp = XTX * X.transpose();
														
 
															-    NICE::Vector params;
														
 
															-    params.multiply(temp,y,false);
														
 
															-    params.normalizeL2();
														
 
															+    NICE::Vector beta;
														
 
															+    beta.multiply(temp,y,false);
														
 
															-    Feature *best_feature = NULL;
														
 
															+    // variables
														
 
															     double best_threshold = 0.0;
														
 
															     double best_ig = -1.0;
														
 
															     FeatureValuesUnsorted values;
														
@@ -180,76 +191,69 @@ DecisionNode *DTBRandomOblique::buildRecursive(
 
															     double best_entropy_left = 0.0;
														
 
															     double best_entropy_right = 0.0;
														
 
															-    // random parameter vectors
														
 
															-    for ( int k = 0 ; k < random_features ; k++ )
														
 
															-    {
														
 
															-        /** Create random parameter vector */
														
 
															-#ifdef DETAILTREE
														
 
															-        std::cerr << "Calculating random parameter vector #" << k << std::endl;
														
 
															-#endif
														
 
															-        ConvolutionFeature *f = (ConvolutionFeature*)fp.begin()->second;
														
 
															-
														
 
															-        f->setParameterVector( params );
														
 
															+    // Setting Convolutional Feature
														
 
															+    ConvolutionFeature *f = (ConvolutionFeature*)fp.begin()->second;
														
 
															+    f->setParameterVector( beta );
														
 
															-        /** Compute feature values for current parameters */
														
 
															-        values.clear();
														
 
															-        f->calcFeatureValues( examples, examples_selection, values);
														
 
															+    // Feature Values
														
 
															+    values.clear();
														
 
															+    f->calcFeatureValues( examples, examples_selection, values);
														
 
															-        double minValue = (min_element ( values.begin(), values.end() ))->first;
														
 
															-        double maxValue = (max_element ( values.begin(), values.end() ))->first;
														
 
															+    double minValue = (min_element ( values.begin(), values.end() ))->first;
														
 
															+    double maxValue = (max_element ( values.begin(), values.end() ))->first;
														
 
															-        if ( maxValue - minValue < 1e-7 ) continue;
														
 
															+    if ( maxValue - minValue < 1e-7 )
														
 
															+        std::cerr << "DTBRandomOblique: Difference between min and max of features values to small!" << std::endl;
														
 
															-        // randomly chosen thresholds
														
 
															-        for ( int i = 0; i < random_split_tests; i++ )
														
 
															-        {
														
 
															-            double threshold = rand() * (maxValue - minValue ) / RAND_MAX + minValue;
														
 
															+    // candidate thresholds derived from the feature value range (no longer drawn with rand())
														
 
															+    for ( int i = 0; i < random_split_tests; i++ )
														
 
															+    {
														
 
															+        double threshold = ((maxValue - minValue ) / (double)random_split_tests)
														
 
															+                            + minValue;
														
 
															 #ifdef DETAILTREE
														
 
															-            std::cerr << "Testing split #" << i << " for vector #" << k
														
 
															-                      << ": t=" << threshold <<  std::endl;
														
 
															+        std::cerr << "Testing split #" << i << " for vector #" << k
														
 
															+                   << ": t=" << threshold <<  std::endl;
														
 
															 #endif
														
 
															-            // preparations
														
 
															-            double el, er;
														
 
															-            for ( int k = 0 ; k <= maxClassNo ; k++ )
														
 
															-            {
														
 
															-                distribution_left[k] = 0;
														
 
															-                distribution_right[k] = 0;
														
 
															-            }
														
 
															+        // preparations
														
 
															+        double el, er;
														
 
															+        for ( int k = 0 ; k <= maxClassNo ; k++ )
														
 
															+        {
														
 
															+            distribution_left[k] = 0.0;
														
 
															+            distribution_right[k] = 0.0;
														
 
															+        }
														
 
															-            /** Test the current split */
														
 
															-            // Does another split make sense?
														
 
															-            double count_left;
														
 
															-            double count_right;
														
 
															-            if ( ! entropyLeftRight ( values, threshold,
														
 
															-                                      distribution_left, distribution_right,
														
 
															-                                      el, er, count_left, count_right, maxClassNo ) )
														
 
															-                continue;
														
 
															+        /** Test the current split */
														
 
															+        // Does another split make sense?
														
 
															+        double count_left;
														
 
															+        double count_right;
														
 
															+        if ( ! entropyLeftRight ( values, threshold,
														
 
															+                                  distribution_left, distribution_right,
														
 
															+                                  el, er, count_left, count_right, maxClassNo ) )
														
 
															+            continue;
														
 
															-            // information gain and entropy
														
 
															-            double pl = (count_left) / (count_left + count_right);
														
 
															-            double ig = e - pl*el - (1-pl)*er;
														
 
															+        // information gain and entropy
														
 
															+        double pl = (count_left) / (count_left + count_right);
														
 
															+        double ig = e - pl*el - (1-pl)*er;
														
 
															-            if ( use_shannon_entropy )
														
 
															-            {
														
 
															-                double esplit = - ( pl*log(pl) + (1-pl)*log(1-pl) );
														
 
															-                ig = 2*ig / ( e + esplit );
														
 
															-            }
														
 
															+        if ( use_shannon_entropy )
														
 
															+        {
														
 
															+            double esplit = - ( pl*log(pl) + (1-pl)*log(1-pl) );
														
 
															+            ig = 2*ig / ( e + esplit );
														
 
															+        }
														
 
															+
														
 
															+        if ( ig > best_ig )
														
 
															+        {
														
 
															+            best_ig = ig;
														
 
															+            best_threshold = threshold;
														
 
															-            if ( ig > best_ig )
														
 
															+            for ( int k = 0 ; k <= maxClassNo ; k++ )
														
 
															             {
														
 
															-                best_ig = ig;
														
 
															-                best_threshold = threshold;
														
 
															-
														
 
															-                best_feature = f;
														
 
															-                for ( int k = 0 ; k <= maxClassNo ; k++ )
														
 
															-                {
														
 
															-                    best_distribution_left[k] = distribution_left[k];
														
 
															-                    best_distribution_right[k] = distribution_right[k];
														
 
															-                }
														
 
															-                best_entropy_left = el;
														
 
															-                best_entropy_right = er;
														
 
															+                best_distribution_left[k] = distribution_left[k];
														
 
															+                best_distribution_right[k] = distribution_right[k];
														
 
															             }
														
 
															+            best_entropy_left = el;
														
 
															+            best_entropy_right = er;
														
 
															         }
														
 
															     }
														
@@ -270,25 +274,23 @@ DecisionNode *DTBRandomOblique::buildRecursive(
 
															     }
														
 
															     /** Save the best split to current node */
														
 
															-    node->f = best_feature->clone();
														
 
															+    node->f = f->clone();
														
 
															     node->threshold = best_threshold;
														
 
															-    /** Recalculate examples using best split */
														
 
															-    vector<int> best_examples_left;
														
 
															-    vector<int> best_examples_right;
														
 
															-    values.clear();
														
 
															-    best_feature->calcFeatureValues ( examples, examples_selection, values );
														
 
															+    /** Split examples according to split function */
														
 
															+    vector<int> examples_left;
														
 
															+    vector<int> examples_right;
														
 
															-    best_examples_left.reserve ( values.size() / 2 );
														
 
															-    best_examples_right.reserve ( values.size() / 2 );
														
 
															+    examples_left.reserve ( values.size() / 2 );
														
 
															+    examples_right.reserve ( values.size() / 2 );
														
 
															     for ( FeatureValuesUnsorted::const_iterator i = values.begin();
														
 
															           i != values.end(); i++ )
														
 
															     {
														
 
															         double value = i->first;
														
 
															         if ( value < best_threshold )
														
 
															-            best_examples_left.push_back ( i->third );
														
 
															+            examples_left.push_back ( i->third );
														
 
															         else
														
 
															-            best_examples_right.push_back ( i->third );
														
 
															+            examples_right.push_back ( i->third );
														
 
															     }
														
 
															 #ifdef DEBUGTREE
														
@@ -299,16 +301,16 @@ DecisionNode *DTBRandomOblique::buildRecursive(
 
															               << best_entropy_right << std::endl;
														
 
															 #endif
														
 
															-    FullVector best_distribution_left_sparse ( distribution.size() );
														
 
															-    FullVector best_distribution_right_sparse ( distribution.size() );
														
 
															+    FullVector distribution_left_sparse ( distribution.size() );
														
 
															+    FullVector distribution_right_sparse ( distribution.size() );
														
 
															     for ( int k = 0 ; k <= maxClassNo ; k++ )
														
 
															     {
														
 
															         double l = best_distribution_left[k];
														
 
															         double r = best_distribution_right[k];
														
 
															         if ( l != 0 )
														
 
															-            best_distribution_left_sparse[k] = l;
														
 
															+            distribution_left_sparse[k] = l;
														
 
															         if ( r != 0 )
														
 
															-            best_distribution_right_sparse[k] = r;
														
 
															+            distribution_right_sparse[k] = r;
														
 
															 #ifdef DEBUGTREE
														
 
															         if ( (l>0)||(r>0) )
														
 
															         {
														
@@ -323,11 +325,13 @@ DecisionNode *DTBRandomOblique::buildRecursive(
 
															     /** Recursion */
														
 
															     // left child
														
 
															-    node->left = buildRecursive ( fp, examples, best_examples_left,
														
 
															-                                  best_distribution_left_sparse, best_entropy_left, maxClassNo, depth+1 );
														
 
															+    node->left  = buildRecursive ( fp, examples, examples_left,
														
 
															+                                   distribution_left_sparse, best_entropy_left,
														
 
															+                                   maxClassNo, depth+1 );
														
 
															     // right child
														
 
															-    node->right = buildRecursive ( fp, examples, best_examples_right,
														
 
															-                                   best_distribution_right_sparse, best_entropy_right, maxClassNo, depth+1 );
														
 
															+    node->right = buildRecursive ( fp, examples, examples_right,
														
 
															+                                   distribution_right_sparse, best_entropy_right,
														
 
															+                                   maxClassNo, depth+1 );
														
 
															     return node;
														
 
															 }
														
--- a/classifier/fpclassifier/randomforest/DTBRandomOblique.h
+++ b/classifier/fpclassifier/randomforest/DTBRandomOblique.h
@@ -32,9 +32,6 @@ class DTBRandomOblique : public DecisionTreeBuilder
 
															     /** Amount of randomly chosen thresholds */
														
 
															     int random_split_tests;
														
 
															-    /** Amount of randomly chosen features */
														
 
															-    int random_features;
														
 
															-
														
 
															     /** Maximum allowed depth of a tree */
														
 
															     int max_depth;
														
@@ -53,6 +50,9 @@ class DTBRandomOblique : public DecisionTreeBuilder
 
															     /** Whether to save indices in leaves or not */
														
 
															     bool save_indices;
														
 
															+    /** Regularization parameter added to the diagonal of X^T X before inversion */
														
 
															+    double lambda;
														
 
															+
														
 
															     /////////////////////////
														
 
															     /////////////////////////
														
 
															     //  PROTECTED METHODS  //