{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": true }, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "# import seaborn as sns\n", "# import matplotlib.pyplot as plt\n", "import os\n", "from sklearn.datasets import load_breast_cancer\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.feature_selection import SelectFromModel\n", "from sklearn.ensemble import RandomForestClassifier\n", "# plt.style.use('seaborn-colorblind')\n", "# %matplotlib inline\n", "from feature_selection import feature_shuffle\n" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Load Dataset" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "collapsed": true }, "outputs": [], "source": [ "# Keep the raw sklearn Bunch under its own name so `data` only ever refers to the DataFrame.\n", "cancer = load_breast_cancer()\n", "\n", "# np.c_ appends the label vector as a final column next to the feature matrix;\n", "# the combined array is float, so `target` is stored as float (e.g. 0.0).\n", "data = pd.DataFrame(\n", "    np.c_[cancer['data'], cancer['target']],\n", "    columns=np.append(cancer['feature_names'], ['target']),\n", ")" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | mean radius | \n", "mean texture | \n", "mean perimeter | \n", "mean area | \n", "mean smoothness | \n", "mean compactness | \n", "mean concavity | \n", "mean concave points | \n", "mean symmetry | \n", "mean fractal dimension | \n", "... | \n", "worst texture | \n", "worst perimeter | \n", "worst area | \n", "worst smoothness | \n", "worst compactness | \n", "worst concavity | \n", "worst concave points | \n", "worst symmetry | \n", "worst fractal dimension | \n", "target | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "17.99 | \n", "10.38 | \n", "122.80 | \n", "1001.0 | \n", "0.11840 | \n", "0.27760 | \n", "0.3001 | \n", "0.14710 | \n", "0.2419 | \n", "0.07871 | \n", "... | \n", "17.33 | \n", "184.60 | \n", "2019.0 | \n", "0.1622 | \n", "0.6656 | \n", "0.7119 | \n", "0.2654 | \n", "0.4601 | \n", "0.11890 | \n", "0.0 | \n", "
| 1 | \n", "20.57 | \n", "17.77 | \n", "132.90 | \n", "1326.0 | \n", "0.08474 | \n", "0.07864 | \n", "0.0869 | \n", "0.07017 | \n", "0.1812 | \n", "0.05667 | \n", "... | \n", "23.41 | \n", "158.80 | \n", "1956.0 | \n", "0.1238 | \n", "0.1866 | \n", "0.2416 | \n", "0.1860 | \n", "0.2750 | \n", "0.08902 | \n", "0.0 | \n", "
| 2 | \n", "19.69 | \n", "21.25 | \n", "130.00 | \n", "1203.0 | \n", "0.10960 | \n", "0.15990 | \n", "0.1974 | \n", "0.12790 | \n", "0.2069 | \n", "0.05999 | \n", "... | \n", "25.53 | \n", "152.50 | \n", "1709.0 | \n", "0.1444 | \n", "0.4245 | \n", "0.4504 | \n", "0.2430 | \n", "0.3613 | \n", "0.08758 | \n", "0.0 | \n", "
| 3 | \n", "11.42 | \n", "20.38 | \n", "77.58 | \n", "386.1 | \n", "0.14250 | \n", "0.28390 | \n", "0.2414 | \n", "0.10520 | \n", "0.2597 | \n", "0.09744 | \n", "... | \n", "26.50 | \n", "98.87 | \n", "567.7 | \n", "0.2098 | \n", "0.8663 | \n", "0.6869 | \n", "0.2575 | \n", "0.6638 | \n", "0.17300 | \n", "0.0 | \n", "
| 4 | \n", "20.29 | \n", "14.34 | \n", "135.10 | \n", "1297.0 | \n", "0.10030 | \n", "0.13280 | \n", "0.1980 | \n", "0.10430 | \n", "0.1809 | \n", "0.05883 | \n", "... | \n", "16.67 | \n", "152.20 | \n", "1575.0 | \n", "0.1374 | \n", "0.2050 | \n", "0.4000 | \n", "0.1625 | \n", "0.2364 | \n", "0.07678 | \n", "0.0 | \n", "
5 rows × 31 columns
\n", "| \n", " | feature | \n", "auc_drop | \n", "
|---|---|---|
| 22 | \n", "worst perimeter | \n", "8.359457e-05 | \n", "
| 27 | \n", "worst concave points | \n", "3.134796e-05 | \n", "
| 23 | \n", "worst area | \n", "1.110223e-16 | \n", "
| 12 | \n", "perimeter error | \n", "1.110223e-16 | \n", "
| 0 | \n", "mean radius | \n", "0.000000e+00 | \n", "
| 16 | \n", "concavity error | \n", "0.000000e+00 | \n", "
| 28 | \n", "worst symmetry | \n", "0.000000e+00 | \n", "
| 26 | \n", "worst concavity | \n", "0.000000e+00 | \n", "
| 25 | \n", "worst compactness | \n", "0.000000e+00 | \n", "
| 24 | \n", "worst smoothness | \n", "0.000000e+00 | \n", "
| 21 | \n", "worst texture | \n", "0.000000e+00 | \n", "
| 20 | \n", "worst radius | \n", "0.000000e+00 | \n", "
| 19 | \n", "fractal dimension error | \n", "0.000000e+00 | \n", "
| 18 | \n", "symmetry error | \n", "0.000000e+00 | \n", "
| 17 | \n", "concave points error | \n", "0.000000e+00 | \n", "
| 15 | \n", "compactness error | \n", "0.000000e+00 | \n", "
| 1 | \n", "mean texture | \n", "0.000000e+00 | \n", "
| 14 | \n", "smoothness error | \n", "0.000000e+00 | \n", "
| 13 | \n", "area error | \n", "0.000000e+00 | \n", "
| 11 | \n", "texture error | \n", "0.000000e+00 | \n", "
| 10 | \n", "radius error | \n", "0.000000e+00 | \n", "
| 9 | \n", "mean fractal dimension | \n", "0.000000e+00 | \n", "
| 8 | \n", "mean symmetry | \n", "0.000000e+00 | \n", "
| 7 | \n", "mean concave points | \n", "0.000000e+00 | \n", "
| 6 | \n", "mean concavity | \n", "0.000000e+00 | \n", "
| 5 | \n", "mean compactness | \n", "0.000000e+00 | \n", "
| 4 | \n", "mean smoothness | \n", "0.000000e+00 | \n", "
| 3 | \n", "mean area | \n", "0.000000e+00 | \n", "
| 2 | \n", "mean perimeter | \n", "0.000000e+00 | \n", "
| 29 | \n", "worst fractal dimension | \n", "0.000000e+00 | \n", "