├── .gitignore ├── LICENSE ├── README.md ├── bin └── spark-featureselection_2.11-1.0.0.jar ├── project ├── build.properties └── plugins.sbt ├── src ├── main │ └── scala │ │ └── org │ │ └── apache │ │ └── spark │ │ └── ml │ │ └── feature │ │ └── selection │ │ ├── FeatureSelector.scala │ │ ├── FeatureSelectorParams.scala │ │ ├── embedded │ │ ├── ImportanceSelector.scala │ │ └── LRSelector.scala │ │ ├── filter │ │ ├── CorrelationSelector.scala │ │ ├── GiniSelector.scala │ │ └── InfoGainSelector.scala │ │ └── util │ │ └── VectorMerger.scala └── test │ ├── resources │ └── iris.data │ └── scala │ └── org │ └── apache │ └── spark │ └── ml │ └── feature │ └── selection │ ├── FeatureSelectionTestBase.scala │ ├── embedded │ ├── ImportanceSelectorSuite.scala │ └── LRSelectorSuite.scala │ ├── filter │ ├── CorrelationSelectorSuite.scala │ ├── GiniSelectorSuite.scala │ └── InfoGainSelectorSuite.scala │ ├── test_util │ ├── DefaultReadWriteTest.scala │ └── TempDirectory.scala │ └── util │ └── VectorMergerSuite.scala └── version.sbt /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/README.md -------------------------------------------------------------------------------- /bin/spark-featureselection_2.11-1.0.0.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/bin/spark-featureselection_2.11-1.0.0.jar -------------------------------------------------------------------------------- /project/build.properties: -------------------------------------------------------------------------------- 1 | sbt.version = 0.13.16 -------------------------------------------------------------------------------- /project/plugins.sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/project/plugins.sbt -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/FeatureSelector.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/FeatureSelector.scala -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/FeatureSelectorParams.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/FeatureSelectorParams.scala -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/embedded/ImportanceSelector.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/embedded/ImportanceSelector.scala -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/embedded/LRSelector.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/embedded/LRSelector.scala -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/filter/CorrelationSelector.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/filter/CorrelationSelector.scala -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/filter/GiniSelector.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/filter/GiniSelector.scala -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/filter/InfoGainSelector.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/filter/InfoGainSelector.scala -------------------------------------------------------------------------------- /src/main/scala/org/apache/spark/ml/feature/selection/util/VectorMerger.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/main/scala/org/apache/spark/ml/feature/selection/util/VectorMerger.scala -------------------------------------------------------------------------------- /src/test/resources/iris.data: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/resources/iris.data -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/FeatureSelectionTestBase.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/FeatureSelectionTestBase.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/embedded/ImportanceSelectorSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/embedded/ImportanceSelectorSuite.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/embedded/LRSelectorSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/embedded/LRSelectorSuite.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/filter/CorrelationSelectorSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/filter/CorrelationSelectorSuite.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/filter/GiniSelectorSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/filter/GiniSelectorSuite.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/filter/InfoGainSelectorSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/filter/InfoGainSelectorSuite.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/test_util/DefaultReadWriteTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/test_util/DefaultReadWriteTest.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/test_util/TempDirectory.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/test_util/TempDirectory.scala -------------------------------------------------------------------------------- /src/test/scala/org/apache/spark/ml/feature/selection/util/VectorMergerSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/MarcKaminski/spark-FeatureSelection/HEAD/src/test/scala/org/apache/spark/ml/feature/selection/util/VectorMergerSuite.scala -------------------------------------------------------------------------------- /version.sbt: -------------------------------------------------------------------------------- 1 | version in ThisBuild := "1.0.0-SNAPSHOT" --------------------------------------------------------------------------------