object DecisionTree extends Serializable with Logging
- Annotations
- @Since( "1.0.0" )
- Source
- DecisionTree.scala
- Alphabetic
- By Inheritance
- DecisionTree
- Logging
- Serializable
- Serializable
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Value Members
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        !=(arg0: Any): Boolean
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        ##(): Int
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        ==(arg0: Any): Boolean
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        asInstanceOf[T0]: T0
      
      
      - Definition Classes
- Any
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        clone(): AnyRef
      
      
      - Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        eq(arg0: AnyRef): Boolean
      
      
      - Definition Classes
- AnyRef
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        equals(arg0: Any): Boolean
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        finalize(): Unit
      
      
      - Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( classOf[java.lang.Throwable] )
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        getClass(): Class[_]
      
      
      - Definition Classes
- AnyRef → Any
- Annotations
- @native()
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        hashCode(): Int
      
      
      - Definition Classes
- AnyRef → Any
- Annotations
- @native()
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        initializeLogIfNecessary(isInterpreter: Boolean): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        isInstanceOf[T0]: Boolean
      
      
      - Definition Classes
- Any
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        isTraceEnabled(): Boolean
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        log: Logger
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logDebug(msg: ⇒ String, throwable: Throwable): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logDebug(msg: ⇒ String): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logError(msg: ⇒ String, throwable: Throwable): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logError(msg: ⇒ String): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logInfo(msg: ⇒ String, throwable: Throwable): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logInfo(msg: ⇒ String): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logName: String
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logTrace(msg: ⇒ String, throwable: Throwable): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logTrace(msg: ⇒ String): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logWarning(msg: ⇒ String, throwable: Throwable): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        logWarning(msg: ⇒ String): Unit
      
      
      - Attributes
- protected
- Definition Classes
- Logging
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        ne(arg0: AnyRef): Boolean
      
      
      - Definition Classes
- AnyRef
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        notify(): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @native()
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        notifyAll(): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @native()
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        synchronized[T0](arg0: ⇒ T0): T0
      
      
      - Definition Classes
- AnyRef
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        toString(): String
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        train(input: RDD[LabeledPoint], algo: Algo, impurity: Impurity, maxDepth: Int, numClasses: Int, maxBins: Int, quantileCalculationStrategy: QuantileStrategy, categoricalFeaturesInfo: Map[Int, Int]): DecisionTreeModel
      
      
      Method to train a decision tree model. The method supports binary and multiclass classification and regression.
- input
- Training dataset: RDD of org.apache.spark.mllib.regression.LabeledPoint. For classification, labels should take values {0, 1, ..., numClasses-1}. For regression, labels are real numbers. 
- algo
- Type of decision tree, either classification or regression. 
- impurity
- Criterion used for information gain calculation. 
- maxDepth
- Maximum depth of the tree (e.g. depth 0 means 1 leaf node, depth 1 means 1 internal node + 2 leaf nodes). 
- numClasses
- Number of classes for classification. Default value of 2. 
- maxBins
- Maximum number of bins used for splitting features. 
- quantileCalculationStrategy
- Algorithm for calculating quantiles. 
- categoricalFeaturesInfo
- Map storing arity of categorical features. An entry (n to k) indicates that feature n is categorical with k categories indexed from 0: {0, 1, ..., k-1}. 
- returns
- DecisionTreeModel that can be used for prediction. 
 - Annotations
- @Since( "1.0.0" )
- Note
- Using org.apache.spark.mllib.tree.DecisionTree.trainClassifier and org.apache.spark.mllib.tree.DecisionTree.trainRegressor is recommended to clearly separate classification and regression.
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        train(input: RDD[LabeledPoint], algo: Algo, impurity: Impurity, maxDepth: Int, numClasses: Int): DecisionTreeModel
      
      
      Method to train a decision tree model. The method supports binary and multiclass classification and regression.
- input
- Training dataset: RDD of org.apache.spark.mllib.regression.LabeledPoint. For classification, labels should take values {0, 1, ..., numClasses-1}. For regression, labels are real numbers. 
- algo
- Type of decision tree, either classification or regression. 
- impurity
- Criterion used for information gain calculation. 
- maxDepth
- Maximum depth of the tree (e.g. depth 0 means 1 leaf node, depth 1 means 1 internal node + 2 leaf nodes). 
- numClasses
- Number of classes for classification. Default value of 2. 
- returns
- DecisionTreeModel that can be used for prediction. 
 - Annotations
- @Since( "1.2.0" )
- Note
- Using org.apache.spark.mllib.tree.DecisionTree.trainClassifier and org.apache.spark.mllib.tree.DecisionTree.trainRegressor is recommended to clearly separate classification and regression.
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        train(input: RDD[LabeledPoint], algo: Algo, impurity: Impurity, maxDepth: Int): DecisionTreeModel
      
      
      Method to train a decision tree model. The method supports binary and multiclass classification and regression.
- input
- Training dataset: RDD of org.apache.spark.mllib.regression.LabeledPoint. For classification, labels should take values {0, 1, ..., numClasses-1}. For regression, labels are real numbers. 
- algo
- Type of decision tree, either classification or regression. 
- impurity
- Criterion used for information gain calculation. 
- maxDepth
- Maximum depth of the tree (e.g. depth 0 means 1 leaf node, depth 1 means 1 internal node + 2 leaf nodes). 
- returns
- DecisionTreeModel that can be used for prediction. 
 - Annotations
- @Since( "1.0.0" )
- Note
- Using org.apache.spark.mllib.tree.DecisionTree.trainClassifier and org.apache.spark.mllib.tree.DecisionTree.trainRegressor is recommended to clearly separate classification and regression.
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        train(input: RDD[LabeledPoint], strategy: Strategy): DecisionTreeModel
      
      
      Method to train a decision tree model. The method supports binary and multiclass classification and regression.
- input
- Training dataset: RDD of org.apache.spark.mllib.regression.LabeledPoint. For classification, labels should take values {0, 1, ..., numClasses-1}. For regression, labels are real numbers. 
- strategy
- The configuration parameters for the tree algorithm which specify the type of decision tree (classification or regression), feature type (continuous, categorical), depth of the tree, quantile calculation strategy, etc. 
- returns
- DecisionTreeModel that can be used for prediction. 
 - Annotations
- @Since( "1.0.0" )
- Note
- Using org.apache.spark.mllib.tree.DecisionTree.trainClassifier and org.apache.spark.mllib.tree.DecisionTree.trainRegressor is recommended to clearly separate classification and regression.
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        trainClassifier(input: JavaRDD[LabeledPoint], numClasses: Int, categoricalFeaturesInfo: Map[Integer, Integer], impurity: String, maxDepth: Int, maxBins: Int): DecisionTreeModel
      
      
      Java-friendly API for org.apache.spark.mllib.tree.DecisionTree.trainClassifier
- Annotations
- @Since( "1.1.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        trainClassifier(input: RDD[LabeledPoint], numClasses: Int, categoricalFeaturesInfo: Map[Int, Int], impurity: String, maxDepth: Int, maxBins: Int): DecisionTreeModel
      
      
      Method to train a decision tree model for binary or multiclass classification.
- input
- Training dataset: RDD of org.apache.spark.mllib.regression.LabeledPoint. Labels should take values {0, 1, ..., numClasses-1}. 
- numClasses
- Number of classes for classification. 
- categoricalFeaturesInfo
- Map storing arity of categorical features. An entry (n to k) indicates that feature n is categorical with k categories indexed from 0: {0, 1, ..., k-1}. 
- impurity
- Criterion used for information gain calculation. Supported values: "gini" (recommended) or "entropy". 
- maxDepth
- Maximum depth of the tree (e.g. depth 0 means 1 leaf node, depth 1 means 1 internal node + 2 leaf nodes). (suggested value: 5) 
- maxBins
- Maximum number of bins used for splitting features. (suggested value: 32) 
- returns
- DecisionTreeModel that can be used for prediction. 
 - Annotations
- @Since( "1.1.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        trainRegressor(input: JavaRDD[LabeledPoint], categoricalFeaturesInfo: Map[Integer, Integer], impurity: String, maxDepth: Int, maxBins: Int): DecisionTreeModel
      
      
      Java-friendly API for org.apache.spark.mllib.tree.DecisionTree.trainRegressor
- Annotations
- @Since( "1.1.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        trainRegressor(input: RDD[LabeledPoint], categoricalFeaturesInfo: Map[Int, Int], impurity: String, maxDepth: Int, maxBins: Int): DecisionTreeModel
      
      
      Method to train a decision tree model for regression.
- input
- Training dataset: RDD of org.apache.spark.mllib.regression.LabeledPoint. Labels are real numbers. 
- categoricalFeaturesInfo
- Map storing arity of categorical features. An entry (n to k) indicates that feature n is categorical with k categories indexed from 0: {0, 1, ..., k-1}. 
- impurity
- Criterion used for information gain calculation. The only supported value for regression is "variance". 
- maxDepth
- Maximum depth of the tree (e.g. depth 0 means 1 leaf node, depth 1 means 1 internal node + 2 leaf nodes). (suggested value: 5) 
- maxBins
- Maximum number of bins used for splitting features. (suggested value: 32) 
- returns
- DecisionTreeModel that can be used for prediction. 
 - Annotations
- @Since( "1.1.0" )
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @throws( ... )
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(arg0: Long, arg1: Int): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @throws( ... )
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(arg0: Long): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()