class ChiSqSelector extends Serializable
Creates a ChiSquared feature selector.
The selector supports different selection methods: numTopFeatures, percentile, fpr,
fdr, fwe.
- numTopFeatures chooses a fixed number of top features according to a chi-squared test.
- percentile is similar but chooses a fraction of all features instead of a fixed number.
- fpr chooses all features whose p-values are below a threshold, thus controlling the false positive rate of selection.
- fdr uses the [Benjamini-Hochberg procedure](https://en.wikipedia.org/wiki/False_discovery_rate#Benjamini.E2.80.93Hochberg_procedure) to choose all features whose false discovery rate is below a threshold.
- fwe chooses all features whose p-values are below a threshold. The threshold is scaled by 1/numFeatures, thus controlling the family-wise error rate of selection.
By default, the selection method is numTopFeatures, with the default number of top features set to 50.
- Annotations
- @Since( "1.3.0" )
- Source
- ChiSqSelector.scala
- Alphabetic
- By Inheritance
- ChiSqSelector
- Serializable
- Serializable
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Instance Constructors
Value Members
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        !=(arg0: Any): Boolean
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        ##(): Int
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        ==(arg0: Any): Boolean
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        asInstanceOf[T0]: T0
      
      
      - Definition Classes
- Any
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        clone(): AnyRef
      
      
      - Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native() @IntrinsicCandidate()
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        eq(arg0: AnyRef): Boolean
      
      
      - Definition Classes
- AnyRef
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        equals(arg0: Any): Boolean
      
      
      - Definition Classes
- AnyRef → Any
 
-  var fdr: Double
- 
      
      
      
        
      
    
      
        
        def
      
      
        fit(data: RDD[LabeledPoint]): ChiSqSelectorModel
      
      
      Returns a ChiSquared feature selector.
- data: an RDD[LabeledPoint] containing the labeled dataset with categorical features. Real-valued features will be treated as categorical for each distinct value. Apply feature discretizer before using this function.
 - Annotations
- @Since( "1.3.0" )
 
-  var fpr: Double
-  var fwe: Double
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        getClass(): Class[_]
      
      
      - Definition Classes
- AnyRef → Any
- Annotations
- @native() @IntrinsicCandidate()
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        hashCode(): Int
      
      
      - Definition Classes
- AnyRef → Any
- Annotations
- @native() @IntrinsicCandidate()
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        isInstanceOf[T0]: Boolean
      
      
      - Definition Classes
- Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        ne(arg0: AnyRef): Boolean
      
      
      - Definition Classes
- AnyRef
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        notify(): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @native() @IntrinsicCandidate()
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        notifyAll(): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @native() @IntrinsicCandidate()
 
-  var numTopFeatures: Int
-  var percentile: Double
-  var selectorType: String
- 
      
      
      
        
      
    
      
        
        def
      
      
        setFdr(value: Double): ChiSqSelector.this.type
      
      
      - Annotations
- @Since( "2.2.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        setFpr(value: Double): ChiSqSelector.this.type
      
      
      - Annotations
- @Since( "2.1.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        setFwe(value: Double): ChiSqSelector.this.type
      
      
      - Annotations
- @Since( "2.2.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        setNumTopFeatures(value: Int): ChiSqSelector.this.type
      
      
      - Annotations
- @Since( "1.6.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        setPercentile(value: Double): ChiSqSelector.this.type
      
      
      - Annotations
- @Since( "2.1.0" )
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        setSelectorType(value: String): ChiSqSelector.this.type
      
      
      - Annotations
- @Since( "2.1.0" )
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        synchronized[T0](arg0: ⇒ T0): T0
      
      
      - Definition Classes
- AnyRef
 
- 
      
      
      
        
      
    
      
        
        def
      
      
        toString(): String
      
      
      - Definition Classes
- AnyRef → Any
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(arg0: Long, arg1: Int): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @throws( ... )
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(arg0: Long): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
 
- 
      
      
      
        
      
    
      
        final 
        def
      
      
        wait(): Unit
      
      
      - Definition Classes
- AnyRef
- Annotations
- @throws( ... )
 
Deprecated Value Members
- 
      
      
      
        
      
    
      
        
        def
      
      
        finalize(): Unit
      
      
      - Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( classOf[java.lang.Throwable] ) @Deprecated
- Deprecated