├── .gitignore ├── 01-introduction.ipynb ├── 02-supervised-learning.ipynb ├── 03-unsupervised-learning.ipynb ├── 04-scikit-learn-API-summary.ipynb ├── 05-representing-data-feature-engineering.ipynb ├── 06-model-evaluation-and-improvement.ipynb ├── 07-algorithm-chains-and-pipelines.ipynb ├── 08-working-with-text-data.ipynb ├── 09-conclusion.ipynb ├── data └── citibike.csv ├── images ├── 06_cross_val_selection.png ├── 06_cross_validation.png ├── 06_cross_validation.svg ├── 06_cross_validation2.png ├── 06_decision_threshold.png ├── 06_grid_search.png ├── 06_grid_search_overview.png ├── 06_label_kfold.png ├── 06_multi_label_confusion_matrix.png ├── 06_shuffle_split.png ├── 06_stratified_kfold.png ├── 06_stratified_kfold.svg ├── 06_threefold_split.png ├── api_table.png ├── bias.png ├── classifier_comparison.png ├── data_representation.svg ├── decision_tree.png ├── dendrogram.png ├── ds_workflow.png ├── fit.png ├── kmeans1.png ├── kmeans2.png ├── knn1.png ├── knn2.png ├── low.png ├── noise.png ├── overfitting_underfitting_cartoon.png ├── overfitting_underfitting_cartoon.svg ├── regression.png ├── sepal_petal.png ├── sepal_petal_small.png ├── supervised_workflow.svg ├── svm1.png ├── svm2.png ├── train_test_split_matrix.svg ├── variance.png └── voronoi.png ├── mglearn ├── __init__.py ├── datasets.py ├── make_blobs.py ├── plot_2d_separator.py ├── plot_agglomerative.py ├── plot_animal_tree.py ├── plot_decomposition.py ├── plot_helpers.py ├── plot_interactive_tree.py ├── plot_kmeans.py ├── plot_kneighbors_regularization.py ├── plot_knn_classification.py ├── plot_knn_regression.py ├── plot_linear_regression.py ├── plot_linear_svc_regularization.py ├── plot_nmf.py ├── plot_nn_graphs.py ├── plot_pca.py ├── plot_rbf_svm_parameters.py ├── plot_scaling.py ├── plot_tree_nonmonotonous.py ├── plots.py └── tools.py ├── preamble.py └── salary_lotto.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/.gitignore -------------------------------------------------------------------------------- /01-introduction.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/01-introduction.ipynb -------------------------------------------------------------------------------- /02-supervised-learning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/02-supervised-learning.ipynb -------------------------------------------------------------------------------- /03-unsupervised-learning.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/03-unsupervised-learning.ipynb -------------------------------------------------------------------------------- /04-scikit-learn-API-summary.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/04-scikit-learn-API-summary.ipynb -------------------------------------------------------------------------------- /05-representing-data-feature-engineering.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/05-representing-data-feature-engineering.ipynb -------------------------------------------------------------------------------- /06-model-evaluation-and-improvement.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/06-model-evaluation-and-improvement.ipynb -------------------------------------------------------------------------------- /07-algorithm-chains-and-pipelines.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/07-algorithm-chains-and-pipelines.ipynb -------------------------------------------------------------------------------- /08-working-with-text-data.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/08-working-with-text-data.ipynb -------------------------------------------------------------------------------- /09-conclusion.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/09-conclusion.ipynb -------------------------------------------------------------------------------- /data/citibike.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/data/citibike.csv -------------------------------------------------------------------------------- /images/06_cross_val_selection.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_cross_val_selection.png -------------------------------------------------------------------------------- /images/06_cross_validation.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_cross_validation.png -------------------------------------------------------------------------------- /images/06_cross_validation.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_cross_validation.svg -------------------------------------------------------------------------------- /images/06_cross_validation2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_cross_validation2.png -------------------------------------------------------------------------------- /images/06_decision_threshold.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_decision_threshold.png -------------------------------------------------------------------------------- /images/06_grid_search.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_grid_search.png -------------------------------------------------------------------------------- /images/06_grid_search_overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_grid_search_overview.png -------------------------------------------------------------------------------- /images/06_label_kfold.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_label_kfold.png -------------------------------------------------------------------------------- /images/06_multi_label_confusion_matrix.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_multi_label_confusion_matrix.png -------------------------------------------------------------------------------- /images/06_shuffle_split.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_shuffle_split.png -------------------------------------------------------------------------------- /images/06_stratified_kfold.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_stratified_kfold.png -------------------------------------------------------------------------------- /images/06_stratified_kfold.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_stratified_kfold.svg -------------------------------------------------------------------------------- /images/06_threefold_split.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/06_threefold_split.png -------------------------------------------------------------------------------- /images/api_table.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/api_table.png -------------------------------------------------------------------------------- /images/bias.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/bias.png -------------------------------------------------------------------------------- /images/classifier_comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/classifier_comparison.png -------------------------------------------------------------------------------- /images/data_representation.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/data_representation.svg -------------------------------------------------------------------------------- /images/decision_tree.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/decision_tree.png -------------------------------------------------------------------------------- /images/dendrogram.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/dendrogram.png -------------------------------------------------------------------------------- /images/ds_workflow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/ds_workflow.png -------------------------------------------------------------------------------- /images/fit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/fit.png -------------------------------------------------------------------------------- /images/kmeans1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/kmeans1.png -------------------------------------------------------------------------------- /images/kmeans2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/kmeans2.png -------------------------------------------------------------------------------- /images/knn1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/knn1.png -------------------------------------------------------------------------------- /images/knn2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/knn2.png -------------------------------------------------------------------------------- /images/low.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/low.png -------------------------------------------------------------------------------- /images/noise.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/noise.png -------------------------------------------------------------------------------- /images/overfitting_underfitting_cartoon.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/overfitting_underfitting_cartoon.png -------------------------------------------------------------------------------- /images/overfitting_underfitting_cartoon.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/overfitting_underfitting_cartoon.svg -------------------------------------------------------------------------------- /images/regression.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/regression.png -------------------------------------------------------------------------------- /images/sepal_petal.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/sepal_petal.png -------------------------------------------------------------------------------- /images/sepal_petal_small.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/sepal_petal_small.png -------------------------------------------------------------------------------- /images/supervised_workflow.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/supervised_workflow.svg -------------------------------------------------------------------------------- /images/svm1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/svm1.png -------------------------------------------------------------------------------- /images/svm2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/svm2.png -------------------------------------------------------------------------------- /images/train_test_split_matrix.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/train_test_split_matrix.svg -------------------------------------------------------------------------------- /images/variance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/variance.png -------------------------------------------------------------------------------- /images/voronoi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/images/voronoi.png -------------------------------------------------------------------------------- /mglearn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/__init__.py -------------------------------------------------------------------------------- /mglearn/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/datasets.py -------------------------------------------------------------------------------- /mglearn/make_blobs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/make_blobs.py -------------------------------------------------------------------------------- /mglearn/plot_2d_separator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_2d_separator.py -------------------------------------------------------------------------------- /mglearn/plot_agglomerative.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_agglomerative.py -------------------------------------------------------------------------------- /mglearn/plot_animal_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_animal_tree.py -------------------------------------------------------------------------------- /mglearn/plot_decomposition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_decomposition.py -------------------------------------------------------------------------------- /mglearn/plot_helpers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_helpers.py -------------------------------------------------------------------------------- /mglearn/plot_interactive_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_interactive_tree.py -------------------------------------------------------------------------------- /mglearn/plot_kmeans.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_kmeans.py -------------------------------------------------------------------------------- /mglearn/plot_kneighbors_regularization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_kneighbors_regularization.py -------------------------------------------------------------------------------- /mglearn/plot_knn_classification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_knn_classification.py -------------------------------------------------------------------------------- /mglearn/plot_knn_regression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_knn_regression.py -------------------------------------------------------------------------------- /mglearn/plot_linear_regression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_linear_regression.py -------------------------------------------------------------------------------- /mglearn/plot_linear_svc_regularization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_linear_svc_regularization.py -------------------------------------------------------------------------------- /mglearn/plot_nmf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_nmf.py -------------------------------------------------------------------------------- /mglearn/plot_nn_graphs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_nn_graphs.py -------------------------------------------------------------------------------- /mglearn/plot_pca.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_pca.py -------------------------------------------------------------------------------- /mglearn/plot_rbf_svm_parameters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_rbf_svm_parameters.py -------------------------------------------------------------------------------- /mglearn/plot_scaling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_scaling.py -------------------------------------------------------------------------------- /mglearn/plot_tree_nonmonotonous.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plot_tree_nonmonotonous.py -------------------------------------------------------------------------------- /mglearn/plots.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/plots.py -------------------------------------------------------------------------------- /mglearn/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/mglearn/tools.py -------------------------------------------------------------------------------- /preamble.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/preamble.py -------------------------------------------------------------------------------- /salary_lotto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/amueller/odsc_east_2016/HEAD/salary_lotto.py --------------------------------------------------------------------------------