class ChiSqSelector extends Serializable
Creates a ChiSquared feature selector.
The selector supports different selection methods: numTopFeatures, percentile, fpr,
fdr, fwe.
`numTopFeatures` chooses a fixed number of top features according to a chi-squared test. `percentile` is similar but chooses a fraction of all features instead of a fixed number. `fpr` chooses all features whose p-values are below a threshold, thus controlling the false positive rate of selection. `fdr` uses the [Benjamini-Hochberg procedure](https://en.wikipedia.org/wiki/False_discovery_rate#Benjamini.E2.80.93Hochberg_procedure) to choose all features whose false discovery rate is below a threshold. `fwe` chooses all features whose p-values are below a threshold. The threshold is scaled by 1/numFeatures, thus controlling the family-wise error rate of selection. By default, the selection method is `numTopFeatures`, with the default number of top features set to 50.
- Annotations
 - @Since( "1.3.0" )
 - Source
 - ChiSqSelector.scala
 
- Alphabetic
 - By Inheritance
 
- ChiSqSelector
 - Serializable
 - Serializable
 - AnyRef
 - Any
 
- Hide All
 - Show All
 
- Public
 - All
 
Instance Constructors
Value Members
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        !=(arg0: Any): Boolean
      
      
      
- Definition Classes
 - AnyRef → Any
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        ##(): Int
      
      
      
- Definition Classes
 - AnyRef → Any
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        ==(arg0: Any): Boolean
      
      
      
- Definition Classes
 - AnyRef → Any
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        asInstanceOf[T0]: T0
      
      
      
- Definition Classes
 - Any
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        clone(): AnyRef
      
      
      
- Attributes
 - protected[lang]
 - Definition Classes
 - AnyRef
 - Annotations
 - @throws( ... ) @native()
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        eq(arg0: AnyRef): Boolean
      
      
      
- Definition Classes
 - AnyRef
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        equals(arg0: Any): Boolean
      
      
      
- Definition Classes
 - AnyRef → Any
 
 -  var fdr: Double
 - 
      
      
      
        
      
    
      
        
        def
      
      
        finalize(): Unit
      
      
      
- Attributes
 - protected[lang]
 - Definition Classes
 - AnyRef
 - Annotations
 - @throws( classOf[java.lang.Throwable] )
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        fit(data: RDD[LabeledPoint]): ChiSqSelectorModel
      
      
      
Returns a ChiSquared feature selector.
Returns a ChiSquared feature selector.
- data
 an `RDD[LabeledPoint]` containing the labeled dataset with categorical features. Real-valued features will be treated as categorical for each distinct value. Apply a feature discretizer before using this function.
- Annotations
 - @Since( "1.3.0" )
 
 -  var fpr: Double
 -  var fwe: Double
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        getClass(): Class[_]
      
      
      
- Definition Classes
 - AnyRef → Any
 - Annotations
 - @native()
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        hashCode(): Int
      
      
      
- Definition Classes
 - AnyRef → Any
 - Annotations
 - @native()
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        isInstanceOf[T0]: Boolean
      
      
      
- Definition Classes
 - Any
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        ne(arg0: AnyRef): Boolean
      
      
      
- Definition Classes
 - AnyRef
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        notify(): Unit
      
      
      
- Definition Classes
 - AnyRef
 - Annotations
 - @native()
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        notifyAll(): Unit
      
      
      
- Definition Classes
 - AnyRef
 - Annotations
 - @native()
 
 -  var numTopFeatures: Int
 -  var percentile: Double
 -  var selectorType: String
 - 
      
      
      
        
      
    
      
        
        def
      
      
        setFdr(value: Double): ChiSqSelector.this.type
      
      
      
- Annotations
 - @Since( "2.2.0" )
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        setFpr(value: Double): ChiSqSelector.this.type
      
      
      
- Annotations
 - @Since( "2.1.0" )
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        setFwe(value: Double): ChiSqSelector.this.type
      
      
      
- Annotations
 - @Since( "2.2.0" )
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        setNumTopFeatures(value: Int): ChiSqSelector.this.type
      
      
      
- Annotations
 - @Since( "1.6.0" )
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        setPercentile(value: Double): ChiSqSelector.this.type
      
      
      
- Annotations
 - @Since( "2.1.0" )
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        setSelectorType(value: String): ChiSqSelector.this.type
      
      
      
- Annotations
 - @Since( "2.1.0" )
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        synchronized[T0](arg0: ⇒ T0): T0
      
      
      
- Definition Classes
 - AnyRef
 
 - 
      
      
      
        
      
    
      
        
        def
      
      
        toString(): String
      
      
      
- Definition Classes
 - AnyRef → Any
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(): Unit
      
      
      
- Definition Classes
 - AnyRef
 - Annotations
 - @throws( ... )
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(arg0: Long, arg1: Int): Unit
      
      
      
- Definition Classes
 - AnyRef
 - Annotations
 - @throws( ... )
 
 - 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(arg0: Long): Unit
      
      
      
- Definition Classes
 - AnyRef
 - Annotations
 - @throws( ... ) @native()