├── 0. datasets link part 4.txt
├── 8_2_Cross_Validation_Python_Implementation.ipynb
├── 8_6_Model_Selection_in_ML_with_Python.ipynb
├── Precision,_Recall,_F1_Score_Python_implementation.ipynb
└── Accuracy_score_and_Confusion_Matrix.ipynb


/0. datasets link part 4.txt:
--------------------------------------------------------------------------------
1 | All Datasets link: https://drive.google.com/drive/folders/12DCaNj6JKl2t6mZPwydCsrB2ho7UpiMu?usp=sharing


--------------------------------------------------------------------------------
/8_2_Cross_Validation_Python_Implementation.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |   "nbformat": 4,
  3 |   "nbformat_minor": 0,
  4 |   "metadata": {
  5 |     "colab": {
  6 |       "provenance": [],
  7 |       "collapsed_sections": []
  8 |     },
  9 |     "kernelspec": {
 10 |       "name": "python3",
 11 |       "display_name": "Python 3"
 12 |     },
 13 |     "language_info": {
 14 |       "name": "python"
 15 |     }
 16 |   },
 17 |   "cells": [
 18 |     {
 19 |       "cell_type": "markdown",
 20 |       "source": [
 21 |         "**Video Link:**\n",
 22 |         "\n",
 23 |         "K-Fold cross validation - concept ideo: https://youtu.be/dkd1eeaXbJA"
 24 |       ],
 25 |       "metadata": {
 26 |         "id": "1qbu9h-el72-"
 27 |       }
 28 |     },
 29 |     {
 30 |       "cell_type": "markdown",
 31 |       "source": [
 32 |         "Importing the Dependencies"
 33 |       ],
 34 |       "metadata": {
 35 |         "id": "bFJFyzowbp1A"
 36 |       }
 37 |     },
 38 |     {
 39 |       "cell_type": "code",
 40 |       "source": [
 41 |         "import numpy as np\n",
 42 |         "import pandas as pd\n",
 43 |         "from sklearn.model_selection import train_test_split\n",
 44 |         "from sklearn.model_selection import cross_val_score\n",
 45 |         "from sklearn.metrics import accuracy_score"
 46 |       ],
 47 |       "metadata": {
 48 |         "id": "cY2Jyn1jbnPb"
 49 |       },
 50 |       "execution_count": null,
 51 |       "outputs": []
 52 |     },
 53 |     {
 54 |       "cell_type": "markdown",
 55 |       "source": [
 56 |         "Importing the models"
 57 |       ],
 58 |       "metadata": {
 59 |         "id": "t_yFbxn0ci3f"
 60 |       }
 61 |     },
 62 |     {
 63 |       "cell_type": "code",
 64 |       "execution_count": null,
 65 |       "metadata": {
 66 |         "id": "eq2pMIzlbbqI"
 67 |       },
 68 |       "outputs": [],
 69 |       "source": [
 70 |         "from sklearn.linear_model import LogisticRegression\n",
 71 |         "from sklearn.svm import SVC\n",
 72 |         "from sklearn.neighbors import KNeighborsClassifier\n",
 73 |         "from sklearn.ensemble import RandomForestClassifier"
 74 |       ]
 75 |     },
 76 |     {
 77 |       "cell_type": "markdown",
 78 |       "metadata": {
 79 |         "id": "egMd5zeurTMR"
 80 |       },
 81 |       "source": [
 82 |         "Data Collection and Processing"
 83 |       ]
 84 |     },
 85 |     {
 86 |       "cell_type": "code",
 87 |       "metadata": {
 88 |         "id": "0q-3-LkQrREV"
 89 |       },
 90 |       "source": [
 91 |         "# loading the csv data to a Pandas DataFrame\n",
 92 |         "heart_data = pd.read_csv('/content/heart.csv')"
 93 |       ],
 94 |       "execution_count": null,
 95 |       "outputs": []
 96 |     },
 97 |     {
 98 |       "cell_type": "code",
 99 |       "metadata": {
100 |         "id": "M8dQxSTqriWD",
101 |         "colab": {
102 |           "base_uri": "https://localhost:8080/",
103 |           "height": 206
104 |         },
105 |         "outputId": "7ab56250-3739-413e-9f62-09491ddadf89"
106 |       },
107 |       "source": [
108 |         "# print first 5 rows of the dataset\n",
109 |         "heart_data.head()"
110 |       ],
111 |       "execution_count": null,
112 |       "outputs": [
113 |         {
114 |           "output_type": "execute_result",
115 |           "data": {
116 |             "text/html": [
117 |               "\n",
118 |               "  <div id=\"df-a1307183-7cef-44eb-a5e7-1a157251b718\">\n",
119 |               "    <div class=\"colab-df-container\">\n",
120 |               "      <div>\n",
121 |               "<style scoped>\n",
122 |               "    .dataframe tbody tr th:only-of-type {\n",
123 |               "        vertical-align: middle;\n",
124 |               "    }\n",
125 |               "\n",
126 |               "    .dataframe tbody tr th {\n",
127 |               "        vertical-align: top;\n",
128 |               "    }\n",
129 |               "\n",
130 |               "    .dataframe thead th {\n",
131 |               "        text-align: right;\n",
132 |               "    }\n",
133 |               "</style>\n",
134 |               "<table border=\"1\" class=\"dataframe\">\n",
135 |               "  <thead>\n",
136 |               "    <tr style=\"text-align: right;\">\n",
137 |               "      <th></th>\n",
138 |               "      <th>age</th>\n",
139 |               "      <th>sex</th>\n",
140 |               "      <th>cp</th>\n",
141 |               "      <th>trestbps</th>\n",
142 |               "      <th>chol</th>\n",
143 |               "      <th>fbs</th>\n",
144 |               "      <th>restecg</th>\n",
145 |               "      <th>thalach</th>\n",
146 |               "      <th>exang</th>\n",
147 |               "      <th>oldpeak</th>\n",
148 |               "      <th>slope</th>\n",
149 |               "      <th>ca</th>\n",
150 |               "      <th>thal</th>\n",
151 |               "      <th>target</th>\n",
152 |               "    </tr>\n",
153 |               "  </thead>\n",
154 |               "  <tbody>\n",
155 |               "    <tr>\n",
156 |               "      <th>0</th>\n",
157 |               "      <td>63</td>\n",
158 |               "      <td>1</td>\n",
159 |               "      <td>3</td>\n",
160 |               "      <td>145</td>\n",
161 |               "      <td>233</td>\n",
162 |               "      <td>1</td>\n",
163 |               "      <td>0</td>\n",
164 |               "      <td>150</td>\n",
165 |               "      <td>0</td>\n",
166 |               "      <td>2.3</td>\n",
167 |               "      <td>0</td>\n",
168 |               "      <td>0</td>\n",
169 |               "      <td>1</td>\n",
170 |               "      <td>1</td>\n",
171 |               "    </tr>\n",
172 |               "    <tr>\n",
173 |               "      <th>1</th>\n",
174 |               "      <td>37</td>\n",
175 |               "      <td>1</td>\n",
176 |               "      <td>2</td>\n",
177 |               "      <td>130</td>\n",
178 |               "      <td>250</td>\n",
179 |               "      <td>0</td>\n",
180 |               "      <td>1</td>\n",
181 |               "      <td>187</td>\n",
182 |               "      <td>0</td>\n",
183 |               "      <td>3.5</td>\n",
184 |               "      <td>0</td>\n",
185 |               "      <td>0</td>\n",
186 |               "      <td>2</td>\n",
187 |               "      <td>1</td>\n",
188 |               "    </tr>\n",
189 |               "    <tr>\n",
190 |               "      <th>2</th>\n",
191 |               "      <td>41</td>\n",
192 |               "      <td>0</td>\n",
193 |               "      <td>1</td>\n",
194 |               "      <td>130</td>\n",
195 |               "      <td>204</td>\n",
196 |               "      <td>0</td>\n",
197 |               "      <td>0</td>\n",
198 |               "      <td>172</td>\n",
199 |               "      <td>0</td>\n",
200 |               "      <td>1.4</td>\n",
201 |               "      <td>2</td>\n",
202 |               "      <td>0</td>\n",
203 |               "      <td>2</td>\n",
204 |               "      <td>1</td>\n",
205 |               "    </tr>\n",
206 |               "    <tr>\n",
207 |               "      <th>3</th>\n",
208 |               "      <td>56</td>\n",
209 |               "      <td>1</td>\n",
210 |               "      <td>1</td>\n",
211 |               "      <td>120</td>\n",
212 |               "      <td>236</td>\n",
213 |               "      <td>0</td>\n",
214 |               "      <td>1</td>\n",
215 |               "      <td>178</td>\n",
216 |               "      <td>0</td>\n",
217 |               "      <td>0.8</td>\n",
218 |               "      <td>2</td>\n",
219 |               "      <td>0</td>\n",
220 |               "      <td>2</td>\n",
221 |               "      <td>1</td>\n",
222 |               "    </tr>\n",
223 |               "    <tr>\n",
224 |               "      <th>4</th>\n",
225 |               "      <td>57</td>\n",
226 |               "      <td>0</td>\n",
227 |               "      <td>0</td>\n",
228 |               "      <td>120</td>\n",
229 |               "      <td>354</td>\n",
230 |               "      <td>0</td>\n",
231 |               "      <td>1</td>\n",
232 |               "      <td>163</td>\n",
233 |               "      <td>1</td>\n",
234 |               "      <td>0.6</td>\n",
235 |               "      <td>2</td>\n",
236 |               "      <td>0</td>\n",
237 |               "      <td>2</td>\n",
238 |               "      <td>1</td>\n",
239 |               "    </tr>\n",
240 |               "  </tbody>\n",
241 |               "</table>\n",
242 |               "</div>\n",
243 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-a1307183-7cef-44eb-a5e7-1a157251b718')\"\n",
244 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
245 |               "              style=\"display:none;\">\n",
246 |               "        \n",
247 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
248 |               "       width=\"24px\">\n",
249 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
250 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
251 |               "  </svg>\n",
252 |               "      </button>\n",
253 |               "      \n",
254 |               "  <style>\n",
255 |               "    .colab-df-container {\n",
256 |               "      display:flex;\n",
257 |               "      flex-wrap:wrap;\n",
258 |               "      gap: 12px;\n",
259 |               "    }\n",
260 |               "\n",
261 |               "    .colab-df-convert {\n",
262 |               "      background-color: #E8F0FE;\n",
263 |               "      border: none;\n",
264 |               "      border-radius: 50%;\n",
265 |               "      cursor: pointer;\n",
266 |               "      display: none;\n",
267 |               "      fill: #1967D2;\n",
268 |               "      height: 32px;\n",
269 |               "      padding: 0 0 0 0;\n",
270 |               "      width: 32px;\n",
271 |               "    }\n",
272 |               "\n",
273 |               "    .colab-df-convert:hover {\n",
274 |               "      background-color: #E2EBFA;\n",
275 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
276 |               "      fill: #174EA6;\n",
277 |               "    }\n",
278 |               "\n",
279 |               "    [theme=dark] .colab-df-convert {\n",
280 |               "      background-color: #3B4455;\n",
281 |               "      fill: #D2E3FC;\n",
282 |               "    }\n",
283 |               "\n",
284 |               "    [theme=dark] .colab-df-convert:hover {\n",
285 |               "      background-color: #434B5C;\n",
286 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
287 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
288 |               "      fill: #FFFFFF;\n",
289 |               "    }\n",
290 |               "  </style>\n",
291 |               "\n",
292 |               "      <script>\n",
293 |               "        const buttonEl =\n",
294 |               "          document.querySelector('#df-a1307183-7cef-44eb-a5e7-1a157251b718 button.colab-df-convert');\n",
295 |               "        buttonEl.style.display =\n",
296 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
297 |               "\n",
298 |               "        async function convertToInteractive(key) {\n",
299 |               "          const element = document.querySelector('#df-a1307183-7cef-44eb-a5e7-1a157251b718');\n",
300 |               "          const dataTable =\n",
301 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
302 |               "                                                     [key], {});\n",
303 |               "          if (!dataTable) return;\n",
304 |               "\n",
305 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
306 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
307 |               "            + ' to learn more about interactive tables.';\n",
308 |               "          element.innerHTML = '';\n",
309 |               "          dataTable['output_type'] = 'display_data';\n",
310 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
311 |               "          const docLink = document.createElement('div');\n",
312 |               "          docLink.innerHTML = docLinkHtml;\n",
313 |               "          element.appendChild(docLink);\n",
314 |               "        }\n",
315 |               "      </script>\n",
316 |               "    </div>\n",
317 |               "  </div>\n",
318 |               "  "
319 |             ],
320 |             "text/plain": [
321 |               "   age  sex  cp  trestbps  chol  fbs  ...  exang  oldpeak  slope  ca  thal  target\n",
322 |               "0   63    1   3       145   233    1  ...      0      2.3      0   0     1       1\n",
323 |               "1   37    1   2       130   250    0  ...      0      3.5      0   0     2       1\n",
324 |               "2   41    0   1       130   204    0  ...      0      1.4      2   0     2       1\n",
325 |               "3   56    1   1       120   236    0  ...      0      0.8      2   0     2       1\n",
326 |               "4   57    0   0       120   354    0  ...      1      0.6      2   0     2       1\n",
327 |               "\n",
328 |               "[5 rows x 14 columns]"
329 |             ]
330 |           },
331 |           "metadata": {},
332 |           "execution_count": 4
333 |         }
334 |       ]
335 |     },
336 |     {
337 |       "cell_type": "code",
338 |       "metadata": {
339 |         "id": "8nX1tIzbrz0u",
340 |         "colab": {
341 |           "base_uri": "https://localhost:8080/"
342 |         },
343 |         "outputId": "f0bfe5c2-e1a7-4694-bba8-f2168ce63928"
344 |       },
345 |       "source": [
346 |         "# number of rows and columns in the dataset\n",
347 |         "heart_data.shape"
348 |       ],
349 |       "execution_count": null,
350 |       "outputs": [
351 |         {
352 |           "output_type": "execute_result",
353 |           "data": {
354 |             "text/plain": [
355 |               "(303, 14)"
356 |             ]
357 |           },
358 |           "metadata": {},
359 |           "execution_count": 5
360 |         }
361 |       ]
362 |     },
363 |     {
364 |       "cell_type": "code",
365 |       "metadata": {
366 |         "id": "GjHtW31rsGlb",
367 |         "colab": {
368 |           "base_uri": "https://localhost:8080/"
369 |         },
370 |         "outputId": "f55c6b6d-3cc4-473c-df00-177229a6ec12"
371 |       },
372 |       "source": [
373 |         "# checking for missing values\n",
374 |         "heart_data.isnull().sum()"
375 |       ],
376 |       "execution_count": null,
377 |       "outputs": [
378 |         {
379 |           "output_type": "execute_result",
380 |           "data": {
381 |             "text/plain": [
382 |               "age         0\n",
383 |               "sex         0\n",
384 |               "cp          0\n",
385 |               "trestbps    0\n",
386 |               "chol        0\n",
387 |               "fbs         0\n",
388 |               "restecg     0\n",
389 |               "thalach     0\n",
390 |               "exang       0\n",
391 |               "oldpeak     0\n",
392 |               "slope       0\n",
393 |               "ca          0\n",
394 |               "thal        0\n",
395 |               "target      0\n",
396 |               "dtype: int64"
397 |             ]
398 |           },
399 |           "metadata": {},
400 |           "execution_count": 6
401 |         }
402 |       ]
403 |     },
404 |     {
405 |       "cell_type": "code",
406 |       "metadata": {
407 |         "id": "4InaOSIUsfWP",
408 |         "colab": {
409 |           "base_uri": "https://localhost:8080/"
410 |         },
411 |         "outputId": "a508875a-712b-4987-c459-57efe941bc14"
412 |       },
413 |       "source": [
414 |         "# checking the distribution of Target Variable\n",
415 |         "heart_data['target'].value_counts()"
416 |       ],
417 |       "execution_count": null,
418 |       "outputs": [
419 |         {
420 |           "output_type": "execute_result",
421 |           "data": {
422 |             "text/plain": [
423 |               "1    165\n",
424 |               "0    138\n",
425 |               "Name: target, dtype: int64"
426 |             ]
427 |           },
428 |           "metadata": {},
429 |           "execution_count": 7
430 |         }
431 |       ]
432 |     },
433 |     {
434 |       "cell_type": "markdown",
435 |       "metadata": {
436 |         "id": "aSOBu4qDtJy5"
437 |       },
438 |       "source": [
439 |         "1 --> Defective Heart\n",
440 |         "\n",
441 |         "0 --> Healthy Heart"
442 |       ]
443 |     },
444 |     {
445 |       "cell_type": "markdown",
446 |       "metadata": {
447 |         "id": "tW8i4igjtPRC"
448 |       },
449 |       "source": [
450 |         "Splitting the Features and Target"
451 |       ]
452 |     },
453 |     {
454 |       "cell_type": "code",
455 |       "metadata": {
456 |         "id": "Q6yfbswrs7m3"
457 |       },
458 |       "source": [
459 |         "X = heart_data.drop(columns='target', axis=1)\n",
460 |         "Y = heart_data['target']"
461 |       ],
462 |       "execution_count": null,
463 |       "outputs": []
464 |     },
465 |     {
466 |       "cell_type": "code",
467 |       "metadata": {
468 |         "id": "XJoCp4ZKtpZy",
469 |         "colab": {
470 |           "base_uri": "https://localhost:8080/"
471 |         },
472 |         "outputId": "f12ada00-3c4f-4372-b334-72d44bd46abc"
473 |       },
474 |       "source": [
475 |         "print(X)"
476 |       ],
477 |       "execution_count": null,
478 |       "outputs": [
479 |         {
480 |           "output_type": "stream",
481 |           "name": "stdout",
482 |           "text": [
483 |             "     age  sex  cp  trestbps  chol  ...  exang  oldpeak  slope  ca  thal\n",
484 |             "0     63    1   3       145   233  ...      0      2.3      0   0     1\n",
485 |             "1     37    1   2       130   250  ...      0      3.5      0   0     2\n",
486 |             "2     41    0   1       130   204  ...      0      1.4      2   0     2\n",
487 |             "3     56    1   1       120   236  ...      0      0.8      2   0     2\n",
488 |             "4     57    0   0       120   354  ...      1      0.6      2   0     2\n",
489 |             "..   ...  ...  ..       ...   ...  ...    ...      ...    ...  ..   ...\n",
490 |             "298   57    0   0       140   241  ...      1      0.2      1   0     3\n",
491 |             "299   45    1   3       110   264  ...      0      1.2      1   0     3\n",
492 |             "300   68    1   0       144   193  ...      0      3.4      1   2     3\n",
493 |             "301   57    1   0       130   131  ...      1      1.2      1   1     3\n",
494 |             "302   57    0   1       130   236  ...      0      0.0      1   1     2\n",
495 |             "\n",
496 |             "[303 rows x 13 columns]\n"
497 |           ]
498 |         }
499 |       ]
500 |     },
501 |     {
502 |       "cell_type": "code",
503 |       "metadata": {
504 |         "id": "nukuj-YItq1w",
505 |         "colab": {
506 |           "base_uri": "https://localhost:8080/"
507 |         },
508 |         "outputId": "6f3ffab4-3273-4cb3-e28f-4a12bdd57695"
509 |       },
510 |       "source": [
511 |         "print(Y)"
512 |       ],
513 |       "execution_count": null,
514 |       "outputs": [
515 |         {
516 |           "output_type": "stream",
517 |           "name": "stdout",
518 |           "text": [
519 |             "0      1\n",
520 |             "1      1\n",
521 |             "2      1\n",
522 |             "3      1\n",
523 |             "4      1\n",
524 |             "      ..\n",
525 |             "298    0\n",
526 |             "299    0\n",
527 |             "300    0\n",
528 |             "301    0\n",
529 |             "302    0\n",
530 |             "Name: target, Length: 303, dtype: int64\n"
531 |           ]
532 |         }
533 |       ]
534 |     },
535 |     {
536 |       "cell_type": "markdown",
537 |       "source": [
538 |         "#**Train Test Split**"
539 |       ],
540 |       "metadata": {
541 |         "id": "aC6gnrWKmLkt"
542 |       }
543 |     },
544 |     {
545 |       "cell_type": "code",
546 |       "source": [
547 |         "X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.2, stratify = Y, random_state=3)"
548 |       ],
549 |       "metadata": {
550 |         "id": "r3YeSH60mNkI"
551 |       },
552 |       "execution_count": null,
553 |       "outputs": []
554 |     },
555 |     {
556 |       "cell_type": "code",
557 |       "source": [
558 |         "print(X.shape, X_train.shape, X_test.shape)"
559 |       ],
560 |       "metadata": {
561 |         "colab": {
562 |           "base_uri": "https://localhost:8080/"
563 |         },
564 |         "id": "Cu0IQu4R5DUi",
565 |         "outputId": "e79e8d4e-d001-49ca-8815-f37881c6d3ba"
566 |       },
567 |       "execution_count": null,
568 |       "outputs": [
569 |         {
570 |           "output_type": "stream",
571 |           "name": "stdout",
572 |           "text": [
573 |             "(303, 13) (242, 13) (61, 13)\n"
574 |           ]
575 |         }
576 |       ]
577 |     },
578 |     {
579 |       "cell_type": "markdown",
580 |       "source": [
581 |         "Comparing the performance of the models"
582 |       ],
583 |       "metadata": {
584 |         "id": "YJGEFKbL6Xgz"
585 |       }
586 |     },
587 |     {
588 |       "cell_type": "code",
589 |       "source": [
590 |         "# list of models\n",
591 |         "models = [LogisticRegression(max_iter=1000), SVC(kernel='linear'), KNeighborsClassifier(), RandomForestClassifier()]"
592 |       ],
593 |       "metadata": {
594 |         "id": "FFYBrujx6He7"
595 |       },
596 |       "execution_count": null,
597 |       "outputs": []
598 |     },
599 |     {
600 |       "cell_type": "code",
601 |       "source": [
602 |         "def compare_models_train_test():\n",
603 |         "\n",
604 |         "  for model in models:\n",
605 |         "\n",
606 |         "    # training the model\n",
607 |         "    model.fit(X_train, Y_train)\n",
608 |         "    \n",
609 |         "    # evaluating the model\n",
610 |         "    test_data_prediction = model.predict(X_test)\n",
611 |         "\n",
612 |         "    accuracy = accuracy_score(Y_test, test_data_prediction)\n",
613 |         "\n",
614 |         "    print('Accuracy score of the ', model, ' = ', accuracy)\n",
615 |         "\n"
616 |       ],
617 |       "metadata": {
618 |         "id": "RBN8lQVj6x0g"
619 |       },
620 |       "execution_count": null,
621 |       "outputs": []
622 |     },
623 |     {
624 |       "cell_type": "code",
625 |       "source": [
626 |         "compare_models_train_test()"
627 |       ],
628 |       "metadata": {
629 |         "colab": {
630 |           "base_uri": "https://localhost:8080/"
631 |         },
632 |         "id": "35fIR_v_7Qt_",
633 |         "outputId": "bff483fc-4fbb-417f-90c0-5b11b75dbfa8"
634 |       },
635 |       "execution_count": null,
636 |       "outputs": [
637 |         {
638 |           "output_type": "stream",
639 |           "name": "stdout",
640 |           "text": [
641 |             "Accuracy score of the  LogisticRegression(max_iter=1000)  =  0.7704918032786885\n",
642 |             "Accuracy score of the  SVC(kernel='linear')  =  0.7704918032786885\n",
643 |             "Accuracy score of the  KNeighborsClassifier()  =  0.6557377049180327\n",
644 |             "Accuracy score of the  RandomForestClassifier()  =  0.8032786885245902\n"
645 |           ]
646 |         }
647 |       ]
648 |     },
649 |     {
650 |       "cell_type": "markdown",
651 |       "source": [
652 |         "#**Cross Validation**"
653 |       ],
654 |       "metadata": {
655 |         "id": "Wf783hX19fwN"
656 |       }
657 |     },
658 |     {
659 |       "cell_type": "markdown",
660 |       "source": [
661 |         "Logistic Regression"
662 |       ],
663 |       "metadata": {
664 |         "id": "cpRlz36P9vfe"
665 |       }
666 |     },
667 |     {
668 |       "cell_type": "code",
669 |       "source": [
670 |         "cv_score_lr = cross_val_score(LogisticRegression(max_iter=1000), X, Y, cv=5)\n",
671 |         "\n",
672 |         "print(cv_score_lr)\n",
673 |         "\n",
674 |         "mean_accuracy_lr = sum(cv_score_lr)/len(cv_score_lr)\n",
675 |         "\n",
676 |         "mean_accuracy_lr = mean_accuracy_lr*100\n",
677 |         "\n",
678 |         "mean_accuracy_lr = round(mean_accuracy_lr, 2)\n",
679 |         "\n",
680 |         "print(mean_accuracy_lr)"
681 |       ],
682 |       "metadata": {
683 |         "colab": {
684 |           "base_uri": "https://localhost:8080/"
685 |         },
686 |         "id": "fIkZCHab746J",
687 |         "outputId": "891b5b92-0339-4a96-8541-322084317ee3"
688 |       },
689 |       "execution_count": null,
690 |       "outputs": [
691 |         {
692 |           "output_type": "stream",
693 |           "name": "stdout",
694 |           "text": [
695 |             "[0.80327869 0.86885246 0.85245902 0.86666667 0.75      ]\n",
696 |             "82.83\n"
697 |           ]
698 |         }
699 |       ]
700 |     },
701 |     {
702 |       "cell_type": "markdown",
703 |       "source": [
704 |         "Support Vector Classifier"
705 |       ],
706 |       "metadata": {
707 |         "id": "RA7W2es0AFD3"
708 |       }
709 |     },
710 |     {
711 |       "cell_type": "code",
712 |       "source": [
713 |         "cv_score_svc = cross_val_score(SVC(kernel='linear'), X, Y, cv=5)\n",
714 |         "\n",
715 |         "print(cv_score_svc)\n",
716 |         "\n",
717 |         "mean_accuracy_svc = sum(cv_score_svc)/len(cv_score_svc)\n",
718 |         "\n",
719 |         "mean_accuracy_svc = mean_accuracy_svc*100\n",
720 |         "\n",
721 |         "mean_accuracy_svc = round(mean_accuracy_svc, 2)\n",
722 |         "\n",
723 |         "print(mean_accuracy_svc)"
724 |       ],
725 |       "metadata": {
726 |         "colab": {
727 |           "base_uri": "https://localhost:8080/"
728 |         },
729 |         "id": "nNCZfeSe-0oZ",
730 |         "outputId": "4e79257f-c77f-4d9c-e967-b3641ef86454"
731 |       },
732 |       "execution_count": null,
733 |       "outputs": [
734 |         {
735 |           "output_type": "stream",
736 |           "name": "stdout",
737 |           "text": [
738 |             "[0.81967213 0.8852459  0.80327869 0.86666667 0.76666667]\n",
739 |             "82.83\n"
740 |           ]
741 |         }
742 |       ]
743 |     },
744 |     {
745 |       "cell_type": "markdown",
746 |       "source": [
747 |         "Creating a Function to compare the models"
748 |       ],
749 |       "metadata": {
750 |         "id": "PlM83YyPApq_"
751 |       }
752 |     },
753 |     {
754 |       "cell_type": "code",
755 |       "source": [
756 |         "# list of models\n",
757 |         "models = [LogisticRegression(max_iter=1000), SVC(kernel='linear'), KNeighborsClassifier(), RandomForestClassifier()]"
758 |       ],
759 |       "metadata": {
760 |         "id": "uyAZczwYAT3f"
761 |       },
762 |       "execution_count": null,
763 |       "outputs": []
764 |     },
765 |     {
766 |       "cell_type": "code",
767 |       "source": [
768 |         "def compare_models_cross_validation():\n",
769 |         "\n",
770 |         "  for model in models:\n",
771 |         "\n",
772 |         "    cv_score = cross_val_score(model, X,Y, cv=5)\n",
773 |         "    \n",
774 |         "    mean_accuracy = sum(cv_score)/len(cv_score)\n",
775 |         "\n",
776 |         "    mean_accuracy = mean_accuracy*100\n",
777 |         "\n",
778 |         "    mean_accuracy = round(mean_accuracy, 2)\n",
779 |         "\n",
780 |         "    print('Cross Validation accuracies for ', model, '=  ', cv_score)\n",
781 |         "    print('Accuracy % of the ', model, mean_accuracy)\n",
782 |         "    print('----------------------------------------------')\n"
783 |       ],
784 |       "metadata": {
785 |         "id": "AWfa55OKAygv"
786 |       },
787 |       "execution_count": null,
788 |       "outputs": []
789 |     },
790 |     {
791 |       "cell_type": "code",
792 |       "source": [
793 |         "compare_models_cross_validation()"
794 |       ],
795 |       "metadata": {
796 |         "colab": {
797 |           "base_uri": "https://localhost:8080/"
798 |         },
799 |         "id": "QaCp6U_cBvVM",
800 |         "outputId": "0591db43-6a2c-4329-840d-04f3ae721d17"
801 |       },
802 |       "execution_count": null,
803 |       "outputs": [
804 |         {
805 |           "output_type": "stream",
806 |           "name": "stdout",
807 |           "text": [
808 |             "Cross Validation accuracies for  LogisticRegression(max_iter=1000) =   [0.80327869 0.86885246 0.85245902 0.86666667 0.75      ]\n",
809 |             "Accuracy % of the  LogisticRegression(max_iter=1000) 82.83\n",
810 |             "----------------------------------------------\n",
811 |             "Cross Validation accuracies for  SVC(kernel='linear') =   [0.81967213 0.8852459  0.80327869 0.86666667 0.76666667]\n",
812 |             "Accuracy % of the  SVC(kernel='linear') 82.83\n",
813 |             "----------------------------------------------\n",
814 |             "Cross Validation accuracies for  KNeighborsClassifier() =   [0.60655738 0.6557377  0.57377049 0.73333333 0.65      ]\n",
815 |             "Accuracy % of the  KNeighborsClassifier() 64.39\n",
816 |             "----------------------------------------------\n",
817 |             "Cross Validation accuracies for  RandomForestClassifier() =   [0.81967213 0.8852459  0.7704918  0.83333333 0.76666667]\n",
818 |             "Accuracy % of the  RandomForestClassifier() 81.51\n",
819 |             "----------------------------------------------\n"
820 |           ]
821 |         }
822 |       ]
823 |     },
824 |     {
825 |       "cell_type": "code",
826 |       "source": [],
827 |       "metadata": {
828 |         "id": "LRVoaEiLBx7V"
829 |       },
830 |       "execution_count": null,
831 |       "outputs": []
832 |     }
833 |   ]
834 | }


--------------------------------------------------------------------------------
/8_6_Model_Selection_in_ML_with_Python.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |   "nbformat": 4,
   3 |   "nbformat_minor": 0,
   4 |   "metadata": {
   5 |     "colab": {
   6 |       "provenance": [],
   7 |       "collapsed_sections": []
   8 |     },
   9 |     "kernelspec": {
  10 |       "name": "python3",
  11 |       "display_name": "Python 3"
  12 |     },
  13 |     "language_info": {
  14 |       "name": "python"
  15 |     }
  16 |   },
  17 |   "cells": [
  18 |     {
  19 |       "cell_type": "markdown",
  20 |       "source": [
  21 |         "Importing the dependencies"
  22 |       ],
  23 |       "metadata": {
  24 |         "id": "n6aUe4VhqwOj"
  25 |       }
  26 |     },
  27 |     {
  28 |       "cell_type": "code",
  29 |       "execution_count": null,
  30 |       "metadata": {
  31 |         "id": "6eFgKfedIpHm"
  32 |       },
  33 |       "outputs": [],
  34 |       "source": [
  35 |         "import numpy as np\n",
  36 |         "import pandas as pd\n",
  37 |         "from sklearn.model_selection import cross_val_score\n",
  38 |         "from sklearn.model_selection import GridSearchCV"
  39 |       ]
  40 |     },
  41 |     {
  42 |       "cell_type": "code",
  43 |       "source": [
  44 |         "# importing the models\n",
  45 |         "from sklearn.linear_model import LogisticRegression\n",
  46 |         "from sklearn.svm import SVC\n",
  47 |         "from sklearn.neighbors import KNeighborsClassifier\n",
  48 |         "from sklearn.ensemble import RandomForestClassifier"
  49 |       ],
  50 |       "metadata": {
  51 |         "id": "sHCGhgcErTI0"
  52 |       },
  53 |       "execution_count": null,
  54 |       "outputs": []
  55 |     },
  56 |     {
  57 |       "cell_type": "markdown",
  58 |       "source": [
  59 |         "We will be working on the Heart Disease dataset"
  60 |       ],
  61 |       "metadata": {
  62 |         "id": "9mJdx-jlKLH4"
  63 |       }
  64 |     },
  65 |     {
  66 |       "cell_type": "code",
  67 |       "source": [
  68 |         "# loading the csv data to a Pandas DataFrame\n",
  69 |         "heart_data = pd.read_csv('/content/heart.csv')"
  70 |       ],
  71 |       "metadata": {
  72 |         "id": "_lmdeZiLJdGm"
  73 |       },
  74 |       "execution_count": null,
  75 |       "outputs": []
  76 |     },
  77 |     {
  78 |       "cell_type": "code",
  79 |       "source": [
  80 |         "# print first 5 rows of the dataset\n",
  81 |         "heart_data.head()"
  82 |       ],
  83 |       "metadata": {
  84 |         "colab": {
  85 |           "base_uri": "https://localhost:8080/",
  86 |           "height": 206
  87 |         },
  88 |         "id": "xeMBIvC_Osi4",
  89 |         "outputId": "114a150f-83ca-4ebd-81c1-5117db28ed38"
  90 |       },
  91 |       "execution_count": null,
  92 |       "outputs": [
  93 |         {
  94 |           "output_type": "execute_result",
  95 |           "data": {
  96 |             "text/plain": [
  97 |               "   age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  slope  \\\n",
  98 |               "0   63    1   3       145   233    1        0      150      0      2.3      0   \n",
  99 |               "1   37    1   2       130   250    0        1      187      0      3.5      0   \n",
 100 |               "2   41    0   1       130   204    0        0      172      0      1.4      2   \n",
 101 |               "3   56    1   1       120   236    0        1      178      0      0.8      2   \n",
 102 |               "4   57    0   0       120   354    0        1      163      1      0.6      2   \n",
 103 |               "\n",
 104 |               "   ca  thal  target  \n",
 105 |               "0   0     1       1  \n",
 106 |               "1   0     2       1  \n",
 107 |               "2   0     2       1  \n",
 108 |               "3   0     2       1  \n",
 109 |               "4   0     2       1  "
 110 |             ],
 111 |             "text/html": [
 112 |               "\n",
 113 |               "  <div id=\"df-36571508-e9af-4067-b822-9dc27bb9c4e9\">\n",
 114 |               "    <div class=\"colab-df-container\">\n",
 115 |               "      <div>\n",
 116 |               "<style scoped>\n",
 117 |               "    .dataframe tbody tr th:only-of-type {\n",
 118 |               "        vertical-align: middle;\n",
 119 |               "    }\n",
 120 |               "\n",
 121 |               "    .dataframe tbody tr th {\n",
 122 |               "        vertical-align: top;\n",
 123 |               "    }\n",
 124 |               "\n",
 125 |               "    .dataframe thead th {\n",
 126 |               "        text-align: right;\n",
 127 |               "    }\n",
 128 |               "</style>\n",
 129 |               "<table border=\"1\" class=\"dataframe\">\n",
 130 |               "  <thead>\n",
 131 |               "    <tr style=\"text-align: right;\">\n",
 132 |               "      <th></th>\n",
 133 |               "      <th>age</th>\n",
 134 |               "      <th>sex</th>\n",
 135 |               "      <th>cp</th>\n",
 136 |               "      <th>trestbps</th>\n",
 137 |               "      <th>chol</th>\n",
 138 |               "      <th>fbs</th>\n",
 139 |               "      <th>restecg</th>\n",
 140 |               "      <th>thalach</th>\n",
 141 |               "      <th>exang</th>\n",
 142 |               "      <th>oldpeak</th>\n",
 143 |               "      <th>slope</th>\n",
 144 |               "      <th>ca</th>\n",
 145 |               "      <th>thal</th>\n",
 146 |               "      <th>target</th>\n",
 147 |               "    </tr>\n",
 148 |               "  </thead>\n",
 149 |               "  <tbody>\n",
 150 |               "    <tr>\n",
 151 |               "      <th>0</th>\n",
 152 |               "      <td>63</td>\n",
 153 |               "      <td>1</td>\n",
 154 |               "      <td>3</td>\n",
 155 |               "      <td>145</td>\n",
 156 |               "      <td>233</td>\n",
 157 |               "      <td>1</td>\n",
 158 |               "      <td>0</td>\n",
 159 |               "      <td>150</td>\n",
 160 |               "      <td>0</td>\n",
 161 |               "      <td>2.3</td>\n",
 162 |               "      <td>0</td>\n",
 163 |               "      <td>0</td>\n",
 164 |               "      <td>1</td>\n",
 165 |               "      <td>1</td>\n",
 166 |               "    </tr>\n",
 167 |               "    <tr>\n",
 168 |               "      <th>1</th>\n",
 169 |               "      <td>37</td>\n",
 170 |               "      <td>1</td>\n",
 171 |               "      <td>2</td>\n",
 172 |               "      <td>130</td>\n",
 173 |               "      <td>250</td>\n",
 174 |               "      <td>0</td>\n",
 175 |               "      <td>1</td>\n",
 176 |               "      <td>187</td>\n",
 177 |               "      <td>0</td>\n",
 178 |               "      <td>3.5</td>\n",
 179 |               "      <td>0</td>\n",
 180 |               "      <td>0</td>\n",
 181 |               "      <td>2</td>\n",
 182 |               "      <td>1</td>\n",
 183 |               "    </tr>\n",
 184 |               "    <tr>\n",
 185 |               "      <th>2</th>\n",
 186 |               "      <td>41</td>\n",
 187 |               "      <td>0</td>\n",
 188 |               "      <td>1</td>\n",
 189 |               "      <td>130</td>\n",
 190 |               "      <td>204</td>\n",
 191 |               "      <td>0</td>\n",
 192 |               "      <td>0</td>\n",
 193 |               "      <td>172</td>\n",
 194 |               "      <td>0</td>\n",
 195 |               "      <td>1.4</td>\n",
 196 |               "      <td>2</td>\n",
 197 |               "      <td>0</td>\n",
 198 |               "      <td>2</td>\n",
 199 |               "      <td>1</td>\n",
 200 |               "    </tr>\n",
 201 |               "    <tr>\n",
 202 |               "      <th>3</th>\n",
 203 |               "      <td>56</td>\n",
 204 |               "      <td>1</td>\n",
 205 |               "      <td>1</td>\n",
 206 |               "      <td>120</td>\n",
 207 |               "      <td>236</td>\n",
 208 |               "      <td>0</td>\n",
 209 |               "      <td>1</td>\n",
 210 |               "      <td>178</td>\n",
 211 |               "      <td>0</td>\n",
 212 |               "      <td>0.8</td>\n",
 213 |               "      <td>2</td>\n",
 214 |               "      <td>0</td>\n",
 215 |               "      <td>2</td>\n",
 216 |               "      <td>1</td>\n",
 217 |               "    </tr>\n",
 218 |               "    <tr>\n",
 219 |               "      <th>4</th>\n",
 220 |               "      <td>57</td>\n",
 221 |               "      <td>0</td>\n",
 222 |               "      <td>0</td>\n",
 223 |               "      <td>120</td>\n",
 224 |               "      <td>354</td>\n",
 225 |               "      <td>0</td>\n",
 226 |               "      <td>1</td>\n",
 227 |               "      <td>163</td>\n",
 228 |               "      <td>1</td>\n",
 229 |               "      <td>0.6</td>\n",
 230 |               "      <td>2</td>\n",
 231 |               "      <td>0</td>\n",
 232 |               "      <td>2</td>\n",
 233 |               "      <td>1</td>\n",
 234 |               "    </tr>\n",
 235 |               "  </tbody>\n",
 236 |               "</table>\n",
 237 |               "</div>\n",
 238 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-36571508-e9af-4067-b822-9dc27bb9c4e9')\"\n",
 239 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
 240 |               "              style=\"display:none;\">\n",
 241 |               "        \n",
 242 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
 243 |               "       width=\"24px\">\n",
 244 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
 245 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
 246 |               "  </svg>\n",
 247 |               "      </button>\n",
 248 |               "      \n",
 249 |               "  <style>\n",
 250 |               "    .colab-df-container {\n",
 251 |               "      display:flex;\n",
 252 |               "      flex-wrap:wrap;\n",
 253 |               "      gap: 12px;\n",
 254 |               "    }\n",
 255 |               "\n",
 256 |               "    .colab-df-convert {\n",
 257 |               "      background-color: #E8F0FE;\n",
 258 |               "      border: none;\n",
 259 |               "      border-radius: 50%;\n",
 260 |               "      cursor: pointer;\n",
 261 |               "      display: none;\n",
 262 |               "      fill: #1967D2;\n",
 263 |               "      height: 32px;\n",
 264 |               "      padding: 0 0 0 0;\n",
 265 |               "      width: 32px;\n",
 266 |               "    }\n",
 267 |               "\n",
 268 |               "    .colab-df-convert:hover {\n",
 269 |               "      background-color: #E2EBFA;\n",
 270 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
 271 |               "      fill: #174EA6;\n",
 272 |               "    }\n",
 273 |               "\n",
 274 |               "    [theme=dark] .colab-df-convert {\n",
 275 |               "      background-color: #3B4455;\n",
 276 |               "      fill: #D2E3FC;\n",
 277 |               "    }\n",
 278 |               "\n",
 279 |               "    [theme=dark] .colab-df-convert:hover {\n",
 280 |               "      background-color: #434B5C;\n",
 281 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
 282 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
 283 |               "      fill: #FFFFFF;\n",
 284 |               "    }\n",
 285 |               "  </style>\n",
 286 |               "\n",
 287 |               "      <script>\n",
 288 |               "        const buttonEl =\n",
 289 |               "          document.querySelector('#df-36571508-e9af-4067-b822-9dc27bb9c4e9 button.colab-df-convert');\n",
 290 |               "        buttonEl.style.display =\n",
 291 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
 292 |               "\n",
 293 |               "        async function convertToInteractive(key) {\n",
 294 |               "          const element = document.querySelector('#df-36571508-e9af-4067-b822-9dc27bb9c4e9');\n",
 295 |               "          const dataTable =\n",
 296 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
 297 |               "                                                     [key], {});\n",
 298 |               "          if (!dataTable) return;\n",
 299 |               "\n",
 300 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
 301 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
 302 |               "            + ' to learn more about interactive tables.';\n",
 303 |               "          element.innerHTML = '';\n",
 304 |               "          dataTable['output_type'] = 'display_data';\n",
 305 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
 306 |               "          const docLink = document.createElement('div');\n",
 307 |               "          docLink.innerHTML = docLinkHtml;\n",
 308 |               "          element.appendChild(docLink);\n",
 309 |               "        }\n",
 310 |               "      </script>\n",
 311 |               "    </div>\n",
 312 |               "  </div>\n",
 313 |               "  "
 314 |             ]
 315 |           },
 316 |           "metadata": {},
 317 |           "execution_count": 4
 318 |         }
 319 |       ]
 320 |     },
 321 |     {
 322 |       "cell_type": "code",
 323 |       "metadata": {
 324 |         "colab": {
 325 |           "base_uri": "https://localhost:8080/"
 326 |         },
 327 |         "id": "8nX1tIzbrz0u",
 328 |         "outputId": "7918a49e-7797-4657-b74b-236dc43b54f3"
 329 |       },
 330 |       "source": [
 331 |         "# number of rows and columns in the dataset\n",
 332 |         "heart_data.shape"
 333 |       ],
 334 |       "execution_count": null,
 335 |       "outputs": [
 336 |         {
 337 |           "output_type": "execute_result",
 338 |           "data": {
 339 |             "text/plain": [
 340 |               "(303, 14)"
 341 |             ]
 342 |           },
 343 |           "metadata": {},
 344 |           "execution_count": 5
 345 |         }
 346 |       ]
 347 |     },
 348 |     {
 349 |       "cell_type": "code",
 350 |       "metadata": {
 351 |         "colab": {
 352 |           "base_uri": "https://localhost:8080/"
 353 |         },
 354 |         "id": "GjHtW31rsGlb",
 355 |         "outputId": "5cd0124d-9f43-4787-8716-44a4bf1541df"
 356 |       },
 357 |       "source": [
 358 |         "# checking for missing values\n",
 359 |         "heart_data.isnull().sum()"
 360 |       ],
 361 |       "execution_count": null,
 362 |       "outputs": [
 363 |         {
 364 |           "output_type": "execute_result",
 365 |           "data": {
 366 |             "text/plain": [
 367 |               "age         0\n",
 368 |               "sex         0\n",
 369 |               "cp          0\n",
 370 |               "trestbps    0\n",
 371 |               "chol        0\n",
 372 |               "fbs         0\n",
 373 |               "restecg     0\n",
 374 |               "thalach     0\n",
 375 |               "exang       0\n",
 376 |               "oldpeak     0\n",
 377 |               "slope       0\n",
 378 |               "ca          0\n",
 379 |               "thal        0\n",
 380 |               "target      0\n",
 381 |               "dtype: int64"
 382 |             ]
 383 |           },
 384 |           "metadata": {},
 385 |           "execution_count": 6
 386 |         }
 387 |       ]
 388 |     },
 389 |     {
 390 |       "cell_type": "code",
 391 |       "metadata": {
 392 |         "colab": {
 393 |           "base_uri": "https://localhost:8080/"
 394 |         },
 395 |         "id": "4InaOSIUsfWP",
 396 |         "outputId": "ea550fb1-ccf0-427c-c467-2b5d36bf7b72"
 397 |       },
 398 |       "source": [
 399 |         "# checking the distribution of Target Variable\n",
 400 |         "heart_data['target'].value_counts()"
 401 |       ],
 402 |       "execution_count": null,
 403 |       "outputs": [
 404 |         {
 405 |           "output_type": "execute_result",
 406 |           "data": {
 407 |             "text/plain": [
 408 |               "1    165\n",
 409 |               "0    138\n",
 410 |               "Name: target, dtype: int64"
 411 |             ]
 412 |           },
 413 |           "metadata": {},
 414 |           "execution_count": 7
 415 |         }
 416 |       ]
 417 |     },
 418 |     {
 419 |       "cell_type": "markdown",
 420 |       "metadata": {
 421 |         "id": "aSOBu4qDtJy5"
 422 |       },
 423 |       "source": [
 424 |         "1 --> Defective Heart\n",
 425 |         "\n",
 426 |         "0 --> Healthy Heart"
 427 |       ]
 428 |     },
 429 |     {
 430 |       "cell_type": "markdown",
 431 |       "metadata": {
 432 |         "id": "tW8i4igjtPRC"
 433 |       },
 434 |       "source": [
 435 |         "Splitting the Features and Target"
 436 |       ]
 437 |     },
 438 |     {
 439 |       "cell_type": "code",
 440 |       "metadata": {
 441 |         "id": "Q6yfbswrs7m3"
 442 |       },
 443 |       "source": [
 444 |         "X = heart_data.drop(columns='target', axis=1)\n",
 445 |         "Y = heart_data['target']"
 446 |       ],
 447 |       "execution_count": null,
 448 |       "outputs": []
 449 |     },
 450 |     {
 451 |       "cell_type": "code",
 452 |       "metadata": {
 453 |         "colab": {
 454 |           "base_uri": "https://localhost:8080/"
 455 |         },
 456 |         "id": "XJoCp4ZKtpZy",
 457 |         "outputId": "8ab1fe07-baa7-4c75-ac83-1c62f27e33f6"
 458 |       },
 459 |       "source": [
 460 |         "print(X)"
 461 |       ],
 462 |       "execution_count": null,
 463 |       "outputs": [
 464 |         {
 465 |           "output_type": "stream",
 466 |           "name": "stdout",
 467 |           "text": [
 468 |             "     age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  \\\n",
 469 |             "0     63    1   3       145   233    1        0      150      0      2.3   \n",
 470 |             "1     37    1   2       130   250    0        1      187      0      3.5   \n",
 471 |             "2     41    0   1       130   204    0        0      172      0      1.4   \n",
 472 |             "3     56    1   1       120   236    0        1      178      0      0.8   \n",
 473 |             "4     57    0   0       120   354    0        1      163      1      0.6   \n",
 474 |             "..   ...  ...  ..       ...   ...  ...      ...      ...    ...      ...   \n",
 475 |             "298   57    0   0       140   241    0        1      123      1      0.2   \n",
 476 |             "299   45    1   3       110   264    0        1      132      0      1.2   \n",
 477 |             "300   68    1   0       144   193    1        1      141      0      3.4   \n",
 478 |             "301   57    1   0       130   131    0        1      115      1      1.2   \n",
 479 |             "302   57    0   1       130   236    0        0      174      0      0.0   \n",
 480 |             "\n",
 481 |             "     slope  ca  thal  \n",
 482 |             "0        0   0     1  \n",
 483 |             "1        0   0     2  \n",
 484 |             "2        2   0     2  \n",
 485 |             "3        2   0     2  \n",
 486 |             "4        2   0     2  \n",
 487 |             "..     ...  ..   ...  \n",
 488 |             "298      1   0     3  \n",
 489 |             "299      1   0     3  \n",
 490 |             "300      1   2     3  \n",
 491 |             "301      1   1     3  \n",
 492 |             "302      1   1     2  \n",
 493 |             "\n",
 494 |             "[303 rows x 13 columns]\n"
 495 |           ]
 496 |         }
 497 |       ]
 498 |     },
 499 |     {
 500 |       "cell_type": "code",
 501 |       "metadata": {
 502 |         "colab": {
 503 |           "base_uri": "https://localhost:8080/"
 504 |         },
 505 |         "id": "nukuj-YItq1w",
 506 |         "outputId": "98f7e5ce-068a-4340-b739-c9b5947b2613"
 507 |       },
 508 |       "source": [
 509 |         "print(Y)"
 510 |       ],
 511 |       "execution_count": null,
 512 |       "outputs": [
 513 |         {
 514 |           "output_type": "stream",
 515 |           "name": "stdout",
 516 |           "text": [
 517 |             "0      1\n",
 518 |             "1      1\n",
 519 |             "2      1\n",
 520 |             "3      1\n",
 521 |             "4      1\n",
 522 |             "      ..\n",
 523 |             "298    0\n",
 524 |             "299    0\n",
 525 |             "300    0\n",
 526 |             "301    0\n",
 527 |             "302    0\n",
 528 |             "Name: target, Length: 303, dtype: int64\n"
 529 |           ]
 530 |         }
 531 |       ]
 532 |     },
 533 |     {
 534 |       "cell_type": "code",
 535 |       "source": [
 536 |         " X = np.asarray(X)\n",
 537 |         " Y = np.asarray(Y)"
 538 |       ],
 539 |       "metadata": {
 540 |         "id": "4OFJBpqfTCjJ"
 541 |       },
 542 |       "execution_count": null,
 543 |       "outputs": []
 544 |     },
 545 |     {
 546 |       "cell_type": "markdown",
 547 |       "source": [
 548 |         "**Model Selection**"
 549 |       ],
 550 |       "metadata": {
 551 |         "id": "BHcyqvzw0c15"
 552 |       }
 553 |     },
 554 |     {
 555 |       "cell_type": "markdown",
 556 |       "source": [
 557 |         "1. Comparing the models with default hyperparameter values using Cross Validation"
 558 |       ],
 559 |       "metadata": {
 560 |         "id": "YE4gR8NbCDfz"
 561 |       }
 562 |     },
 563 |     {
 564 |       "cell_type": "code",
 565 |       "source": [
 566 |         "# list of models\n",
 567 |         "models = [LogisticRegression(max_iter=1000), SVC(kernel='linear'), KNeighborsClassifier(), RandomForestClassifier(random_state=0)]"
 568 |       ],
 569 |       "metadata": {
 570 |         "id": "D71G1BFz0emy"
 571 |       },
 572 |       "execution_count": null,
 573 |       "outputs": []
 574 |     },
 575 |     {
 576 |       "cell_type": "code",
 577 |       "source": [
 578 |         "def compare_models_cross_validation():\n",
 579 |         "\n",
 580 |         "  for model in models:\n",
 581 |         "\n",
 582 |         "    cv_score = cross_val_score(model, X, Y, cv=5)\n",
 583 |         "    mean_accuracy = sum(cv_score)/len(cv_score)\n",
 584 |         "    mean_accuracy = mean_accuracy*100\n",
 585 |         "    mean_accuracy = round(mean_accuracy, 2)\n",
 586 |         "\n",
 587 |         "    print('Cross Validation accuracies for the',model,'=', cv_score)\n",
 588 |         "    print('Acccuracy score of the ',model,'=',mean_accuracy,'%')\n",
 589 |         "    print('---------------------------------------------------------------')"
 590 |       ],
 591 |       "metadata": {
 592 |         "id": "rhY3ikQOC3rZ"
 593 |       },
 594 |       "execution_count": null,
 595 |       "outputs": []
 596 |     },
 597 |     {
 598 |       "cell_type": "code",
 599 |       "source": [
 600 |         "compare_models_cross_validation()"
 601 |       ],
 602 |       "metadata": {
 603 |         "colab": {
 604 |           "base_uri": "https://localhost:8080/"
 605 |         },
 606 |         "id": "17dfatWwEwVW",
 607 |         "outputId": "b54c7253-ce1c-47d7-c5f3-bc1156943ff2"
 608 |       },
 609 |       "execution_count": null,
 610 |       "outputs": [
 611 |         {
 612 |           "output_type": "stream",
 613 |           "name": "stdout",
 614 |           "text": [
 615 |             "Cross Validation accuracies for the LogisticRegression(max_iter=1000) = [0.80327869 0.8852459  0.85245902 0.86666667 0.75      ]\n",
 616 |             "Acccuracy score of the  LogisticRegression(max_iter=1000) = 83.15 %\n",
 617 |             "---------------------------------------------------------------\n",
 618 |             "Cross Validation accuracies for the SVC(kernel='linear') = [0.81967213 0.8852459  0.80327869 0.86666667 0.76666667]\n",
 619 |             "Acccuracy score of the  SVC(kernel='linear') = 82.83 %\n",
 620 |             "---------------------------------------------------------------\n",
 621 |             "Cross Validation accuracies for the KNeighborsClassifier() = [0.60655738 0.6557377  0.57377049 0.73333333 0.65      ]\n",
 622 |             "Acccuracy score of the  KNeighborsClassifier() = 64.39 %\n",
 623 |             "---------------------------------------------------------------\n",
 624 |             "Cross Validation accuracies for the RandomForestClassifier(random_state=0) = [0.85245902 0.90163934 0.81967213 0.81666667 0.8       ]\n",
 625 |             "Acccuracy score of the  RandomForestClassifier(random_state=0) = 83.81 %\n",
 626 |             "---------------------------------------------------------------\n"
 627 |           ]
 628 |         }
 629 |       ]
 630 |     },
 631 |     {
 632 |       "cell_type": "markdown",
 633 |       "source": [
 634 |         "Inference: For the Heart Disease dataset, **Random Forest Classifier** has the Highest accuracy value with default hyperparameter values"
 635 |       ],
 636 |       "metadata": {
 637 |         "id": "O-BZYtX6FtwZ"
 638 |       }
 639 |     },
 640 |     {
 641 |       "cell_type": "markdown",
 642 |       "source": [
 643 |         "2. Comparing the models with different Hyperparameter values using GridSearchCV"
 644 |       ],
 645 |       "metadata": {
 646 |         "id": "loKdk57gGWmR"
 647 |       }
 648 |     },
 649 |     {
 650 |       "cell_type": "code",
 651 |       "source": [
 652 |         "# list of models\n",
 653 |         "models_list = [LogisticRegression(max_iter=10000), SVC(), KNeighborsClassifier(), RandomForestClassifier(random_state=0)]"
 654 |       ],
 655 |       "metadata": {
 656 |         "id": "43Wq9FXWEzHn"
 657 |       },
 658 |       "execution_count": null,
 659 |       "outputs": []
 660 |     },
 661 |     {
 662 |       "cell_type": "code",
 663 |       "source": [
 664 |         "# creating a dictionary that contains hyperparameter values for the above mentioned models\n",
 665 |         "\n",
 666 |         "\n",
 667 |         "model_hyperparameters = {\n",
 668 |         "    \n",
 669 |         "\n",
 670 |         "    'log_reg_hyperparameters': {\n",
 671 |         "        \n",
 672 |         "        'C' : [1,5,10,20]\n",
 673 |         "    },\n",
 674 |         "\n",
 675 |         "    'svc_hyperparameters': {\n",
 676 |         "        \n",
 677 |         "        'kernel' : ['linear','poly','rbf','sigmoid'],\n",
 678 |         "        'C' : [1,5,10,20]\n",
 679 |         "    },\n",
 680 |         "\n",
 681 |         "\n",
 682 |         "    'KNN_hyperparameters' : {\n",
 683 |         "        \n",
 684 |         "        'n_neighbors' : [3,5,10]\n",
 685 |         "    },\n",
 686 |         "\n",
 687 |         "\n",
 688 |         "    'random_forest_hyperparameters' : {\n",
 689 |         "        \n",
 690 |         "        'n_estimators' : [10, 20, 50, 100]\n",
 691 |         "    }\n",
 692 |         "}"
 693 |       ],
 694 |       "metadata": {
 695 |         "id": "zfODd_glGxnd"
 696 |       },
 697 |       "execution_count": null,
 698 |       "outputs": []
 699 |     },
 700 |     {
 701 |       "cell_type": "code",
 702 |       "source": [
 703 |         "type(model_hyperparameters)"
 704 |       ],
 705 |       "metadata": {
 706 |         "colab": {
 707 |           "base_uri": "https://localhost:8080/"
 708 |         },
 709 |         "id": "uj9F-miFJATp",
 710 |         "outputId": "a5ea0055-e2eb-42fb-a237-a2b3e6a9f5d3"
 711 |       },
 712 |       "execution_count": null,
 713 |       "outputs": [
 714 |         {
 715 |           "output_type": "execute_result",
 716 |           "data": {
 717 |             "text/plain": [
 718 |               "dict"
 719 |             ]
 720 |           },
 721 |           "metadata": {},
 722 |           "execution_count": 40
 723 |         }
 724 |       ]
 725 |     },
 726 |     {
 727 |       "cell_type": "code",
 728 |       "source": [
 729 |         "print(model_hyperparameters.keys())"
 730 |       ],
 731 |       "metadata": {
 732 |         "colab": {
 733 |           "base_uri": "https://localhost:8080/"
 734 |         },
 735 |         "id": "ykAidRlaJrBx",
 736 |         "outputId": "c8b77598-91a2-4929-f340-8e27a6716c74"
 737 |       },
 738 |       "execution_count": null,
 739 |       "outputs": [
 740 |         {
 741 |           "output_type": "stream",
 742 |           "name": "stdout",
 743 |           "text": [
 744 |             "dict_keys(['log_reg_hyperparameters', 'svc_hyperparameters', 'KNN_hyperparameters', 'random_forest_hyperparameters'])\n"
 745 |           ]
 746 |         }
 747 |       ]
 748 |     },
 749 |     {
 750 |       "cell_type": "code",
 751 |       "source": [
 752 |         "model_hyperparameters['log_reg_hyperparameters']"
 753 |       ],
 754 |       "metadata": {
 755 |         "colab": {
 756 |           "base_uri": "https://localhost:8080/"
 757 |         },
 758 |         "id": "enerj0PaKDdM",
 759 |         "outputId": "4865421f-75e0-4b04-a7db-25985e77ba01"
 760 |       },
 761 |       "execution_count": null,
 762 |       "outputs": [
 763 |         {
 764 |           "output_type": "execute_result",
 765 |           "data": {
 766 |             "text/plain": [
 767 |               "{'C': [1, 5, 10, 20]}"
 768 |             ]
 769 |           },
 770 |           "metadata": {},
 771 |           "execution_count": 50
 772 |         }
 773 |       ]
 774 |     },
 775 |     {
 776 |       "cell_type": "code",
 777 |       "source": [
 778 |         "model_keys = list(model_hyperparameters.keys())\n",
 779 |         "print(model_keys)"
 780 |       ],
 781 |       "metadata": {
 782 |         "colab": {
 783 |           "base_uri": "https://localhost:8080/"
 784 |         },
 785 |         "id": "zYzP9-RzJ1J8",
 786 |         "outputId": "db1e33bb-a2f4-49e3-836e-91fec83313b9"
 787 |       },
 788 |       "execution_count": null,
 789 |       "outputs": [
 790 |         {
 791 |           "output_type": "stream",
 792 |           "name": "stdout",
 793 |           "text": [
 794 |             "['log_reg_hyperparameters', 'svc_hyperparameters', 'KNN_hyperparameters', 'random_forest_hyperparameters']\n"
 795 |           ]
 796 |         }
 797 |       ]
 798 |     },
 799 |     {
 800 |       "cell_type": "code",
 801 |       "source": [
 802 |         "model_keys[0]"
 803 |       ],
 804 |       "metadata": {
 805 |         "colab": {
 806 |           "base_uri": "https://localhost:8080/",
 807 |           "height": 35
 808 |         },
 809 |         "id": "umt2Y6DXKJrd",
 810 |         "outputId": "860770f2-4a81-466c-ed4f-1723fc9ec6b5"
 811 |       },
 812 |       "execution_count": null,
 813 |       "outputs": [
 814 |         {
 815 |           "output_type": "execute_result",
 816 |           "data": {
 817 |             "text/plain": [
 818 |               "'log_reg_hyperparameters'"
 819 |             ],
 820 |             "application/vnd.google.colaboratory.intrinsic+json": {
 821 |               "type": "string"
 822 |             }
 823 |           },
 824 |           "metadata": {},
 825 |           "execution_count": 44
 826 |         }
 827 |       ]
 828 |     },
 829 |     {
 830 |       "cell_type": "code",
 831 |       "source": [
 832 |         "model_hyperparameters[model_keys[0]]"
 833 |       ],
 834 |       "metadata": {
 835 |         "colab": {
 836 |           "base_uri": "https://localhost:8080/"
 837 |         },
 838 |         "id": "gssFvxkTKYCL",
 839 |         "outputId": "a44879a7-a7b1-47c9-d938-92d8645dff0e"
 840 |       },
 841 |       "execution_count": null,
 842 |       "outputs": [
 843 |         {
 844 |           "output_type": "execute_result",
 845 |           "data": {
 846 |             "text/plain": [
 847 |               "{'C': [1, 5, 10, 20]}"
 848 |             ]
 849 |           },
 850 |           "metadata": {},
 851 |           "execution_count": 45
 852 |         }
 853 |       ]
 854 |     },
 855 |     {
 856 |       "cell_type": "markdown",
 857 |       "source": [
 858 |         "Applying GridSearchCV"
 859 |       ],
 860 |       "metadata": {
 861 |         "id": "F5Kl_MW8K5tr"
 862 |       }
 863 |     },
 864 |     {
 865 |       "cell_type": "code",
 866 |       "source": [
 867 |         "def ModelSelection(list_of_models, hyperparameters_dictionary):\n",
 868 |         "\n",
 869 |         "  result = []\n",
 870 |         "\n",
 871 |         "  i = 0\n",
 872 |         "\n",
 873 |         "  for model in list_of_models:\n",
 874 |         "\n",
 875 |         "    key = model_keys[i]\n",
 876 |         "\n",
 877 |         "    params = hyperparameters_dictionary[key]\n",
 878 |         "\n",
 879 |         "    i += 1\n",
 880 |         "\n",
 881 |         "    print(model)\n",
 882 |         "    print(params)\n",
 883 |         "    print('---------------------------------')\n",
 884 |         "\n",
 885 |         "\n",
 886 |         "    classifier = GridSearchCV(model, params, cv=5)\n",
 887 |         "\n",
 888 |         "    # fitting the data to classifier\n",
 889 |         "    classifier.fit(X,Y)\n",
 890 |         "\n",
 891 |         "    result.append({\n",
 892 |         "        'model used' : model,\n",
 893 |         "        'highest score' : classifier.best_score_,\n",
 894 |         "        'best hyperparameters' : classifier.best_params_\n",
 895 |         "    })\n",
 896 |         "\n",
 897 |         "  result_dataframe = pd.DataFrame(result, columns = ['model used','highest score','best hyperparameters'])\n",
 898 |         "\n",
 899 |         "  return result_dataframe"
 900 |       ],
 901 |       "metadata": {
 902 |         "id": "2x5dWxgaKnmW"
 903 |       },
 904 |       "execution_count": null,
 905 |       "outputs": []
 906 |     },
 907 |     {
 908 |       "cell_type": "code",
 909 |       "source": [
 910 |         "ModelSelection(models_list, model_hyperparameters)"
 911 |       ],
 912 |       "metadata": {
 913 |         "colab": {
 914 |           "base_uri": "https://localhost:8080/",
 915 |           "height": 383
 916 |         },
 917 |         "id": "Mtfv4xkwNBd0",
 918 |         "outputId": "a6bc4fd3-86b2-4ef3-81ff-747944e86f89"
 919 |       },
 920 |       "execution_count": null,
 921 |       "outputs": [
 922 |         {
 923 |           "output_type": "stream",
 924 |           "name": "stdout",
 925 |           "text": [
 926 |             "LogisticRegression(max_iter=10000)\n",
 927 |             "{'C': [1, 5, 10, 20]}\n",
 928 |             "---------------------------------\n",
 929 |             "SVC()\n",
 930 |             "{'kernel': ['linear', 'poly', 'rbf', 'sigmoid'], 'C': [1, 5, 10, 20]}\n",
 931 |             "---------------------------------\n",
 932 |             "KNeighborsClassifier()\n",
 933 |             "{'n_neighbors': [3, 5, 10]}\n",
 934 |             "---------------------------------\n",
 935 |             "RandomForestClassifier(random_state=0)\n",
 936 |             "{'n_estimators': [10, 20, 50, 100]}\n",
 937 |             "---------------------------------\n"
 938 |           ]
 939 |         },
 940 |         {
 941 |           "output_type": "execute_result",
 942 |           "data": {
 943 |             "text/plain": [
 944 |               "                               model used  highest score  \\\n",
 945 |               "0      LogisticRegression(max_iter=10000)       0.831585   \n",
 946 |               "1                                   SVC()       0.828306   \n",
 947 |               "2                  KNeighborsClassifier()       0.643880   \n",
 948 |               "3  RandomForestClassifier(random_state=0)       0.838087   \n",
 949 |               "\n",
 950 |               "           best hyperparameters  \n",
 951 |               "0                      {'C': 5}  \n",
 952 |               "1  {'C': 1, 'kernel': 'linear'}  \n",
 953 |               "2            {'n_neighbors': 5}  \n",
 954 |               "3         {'n_estimators': 100}  "
 955 |             ],
 956 |             "text/html": [
 957 |               "\n",
 958 |               "  <div id=\"df-556c0392-2072-4e22-867c-540e3484927f\">\n",
 959 |               "    <div class=\"colab-df-container\">\n",
 960 |               "      <div>\n",
 961 |               "<style scoped>\n",
 962 |               "    .dataframe tbody tr th:only-of-type {\n",
 963 |               "        vertical-align: middle;\n",
 964 |               "    }\n",
 965 |               "\n",
 966 |               "    .dataframe tbody tr th {\n",
 967 |               "        vertical-align: top;\n",
 968 |               "    }\n",
 969 |               "\n",
 970 |               "    .dataframe thead th {\n",
 971 |               "        text-align: right;\n",
 972 |               "    }\n",
 973 |               "</style>\n",
 974 |               "<table border=\"1\" class=\"dataframe\">\n",
 975 |               "  <thead>\n",
 976 |               "    <tr style=\"text-align: right;\">\n",
 977 |               "      <th></th>\n",
 978 |               "      <th>model used</th>\n",
 979 |               "      <th>highest score</th>\n",
 980 |               "      <th>best hyperparameters</th>\n",
 981 |               "    </tr>\n",
 982 |               "  </thead>\n",
 983 |               "  <tbody>\n",
 984 |               "    <tr>\n",
 985 |               "      <th>0</th>\n",
 986 |               "      <td>LogisticRegression(max_iter=10000)</td>\n",
 987 |               "      <td>0.831585</td>\n",
 988 |               "      <td>{'C': 5}</td>\n",
 989 |               "    </tr>\n",
 990 |               "    <tr>\n",
 991 |               "      <th>1</th>\n",
 992 |               "      <td>SVC()</td>\n",
 993 |               "      <td>0.828306</td>\n",
 994 |               "      <td>{'C': 1, 'kernel': 'linear'}</td>\n",
 995 |               "    </tr>\n",
 996 |               "    <tr>\n",
 997 |               "      <th>2</th>\n",
 998 |               "      <td>KNeighborsClassifier()</td>\n",
 999 |               "      <td>0.643880</td>\n",
1000 |               "      <td>{'n_neighbors': 5}</td>\n",
1001 |               "    </tr>\n",
1002 |               "    <tr>\n",
1003 |               "      <th>3</th>\n",
1004 |               "      <td>RandomForestClassifier(random_state=0)</td>\n",
1005 |               "      <td>0.838087</td>\n",
1006 |               "      <td>{'n_estimators': 100}</td>\n",
1007 |               "    </tr>\n",
1008 |               "  </tbody>\n",
1009 |               "</table>\n",
1010 |               "</div>\n",
1011 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-556c0392-2072-4e22-867c-540e3484927f')\"\n",
1012 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
1013 |               "              style=\"display:none;\">\n",
1014 |               "        \n",
1015 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
1016 |               "       width=\"24px\">\n",
1017 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
1018 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
1019 |               "  </svg>\n",
1020 |               "      </button>\n",
1021 |               "      \n",
1022 |               "  <style>\n",
1023 |               "    .colab-df-container {\n",
1024 |               "      display:flex;\n",
1025 |               "      flex-wrap:wrap;\n",
1026 |               "      gap: 12px;\n",
1027 |               "    }\n",
1028 |               "\n",
1029 |               "    .colab-df-convert {\n",
1030 |               "      background-color: #E8F0FE;\n",
1031 |               "      border: none;\n",
1032 |               "      border-radius: 50%;\n",
1033 |               "      cursor: pointer;\n",
1034 |               "      display: none;\n",
1035 |               "      fill: #1967D2;\n",
1036 |               "      height: 32px;\n",
1037 |               "      padding: 0 0 0 0;\n",
1038 |               "      width: 32px;\n",
1039 |               "    }\n",
1040 |               "\n",
1041 |               "    .colab-df-convert:hover {\n",
1042 |               "      background-color: #E2EBFA;\n",
1043 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
1044 |               "      fill: #174EA6;\n",
1045 |               "    }\n",
1046 |               "\n",
1047 |               "    [theme=dark] .colab-df-convert {\n",
1048 |               "      background-color: #3B4455;\n",
1049 |               "      fill: #D2E3FC;\n",
1050 |               "    }\n",
1051 |               "\n",
1052 |               "    [theme=dark] .colab-df-convert:hover {\n",
1053 |               "      background-color: #434B5C;\n",
1054 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
1055 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
1056 |               "      fill: #FFFFFF;\n",
1057 |               "    }\n",
1058 |               "  </style>\n",
1059 |               "\n",
1060 |               "      <script>\n",
1061 |               "        const buttonEl =\n",
1062 |               "          document.querySelector('#df-556c0392-2072-4e22-867c-540e3484927f button.colab-df-convert');\n",
1063 |               "        buttonEl.style.display =\n",
1064 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
1065 |               "\n",
1066 |               "        async function convertToInteractive(key) {\n",
1067 |               "          const element = document.querySelector('#df-556c0392-2072-4e22-867c-540e3484927f');\n",
1068 |               "          const dataTable =\n",
1069 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
1070 |               "                                                     [key], {});\n",
1071 |               "          if (!dataTable) return;\n",
1072 |               "\n",
1073 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
1074 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
1075 |               "            + ' to learn more about interactive tables.';\n",
1076 |               "          element.innerHTML = '';\n",
1077 |               "          dataTable['output_type'] = 'display_data';\n",
1078 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
1079 |               "          const docLink = document.createElement('div');\n",
1080 |               "          docLink.innerHTML = docLinkHtml;\n",
1081 |               "          element.appendChild(docLink);\n",
1082 |               "        }\n",
1083 |               "      </script>\n",
1084 |               "    </div>\n",
1085 |               "  </div>\n",
1086 |               "  "
1087 |             ]
1088 |           },
1089 |           "metadata": {},
1090 |           "execution_count": 52
1091 |         }
1092 |       ]
1093 |     },
1094 |     {
1095 |       "cell_type": "markdown",
1096 |       "source": [
1097 |         "Random Forest Classifier with n_estimators = 100 has the highest accuracy"
1098 |       ],
1099 |       "metadata": {
1100 |         "id": "7ZOb0iQBPiZ8"
1101 |       }
1102 |     },
1103 |     {
1104 |       "cell_type": "code",
1105 |       "source": [],
1106 |       "metadata": {
1107 |         "id": "0hGHX4uONKgn"
1108 |       },
1109 |       "execution_count": null,
1110 |       "outputs": []
1111 |     }
1112 |   ]
1113 | }


--------------------------------------------------------------------------------
/Precision,_Recall,_F1_Score_Python_implementation.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |   "nbformat": 4,
   3 |   "nbformat_minor": 0,
   4 |   "metadata": {
   5 |     "colab": {
   6 |       "provenance": [],
   7 |       "collapsed_sections": []
   8 |     },
   9 |     "kernelspec": {
  10 |       "name": "python3",
  11 |       "display_name": "Python 3"
  12 |     },
  13 |     "language_info": {
  14 |       "name": "python"
  15 |     }
  16 |   },
  17 |   "cells": [
  18 |     {
  19 |       "cell_type": "markdown",
  20 |       "source": [
  21 |         "Importing the Dependencies"
  22 |       ],
  23 |       "metadata": {
  24 |         "id": "xgd0kvExWcAm"
  25 |       }
  26 |     },
  27 |     {
  28 |       "cell_type": "code",
  29 |       "execution_count": null,
  30 |       "metadata": {
  31 |         "id": "Yg0dYZpxUnnH"
  32 |       },
  33 |       "outputs": [],
  34 |       "source": [
  35 |         "import numpy as np\n",
  36 |         "import pandas as pd\n",
  37 |         "from sklearn.model_selection import train_test_split\n",
  38 |         "from sklearn.linear_model import LogisticRegression"
  39 |       ]
  40 |     },
  41 |     {
  42 |       "cell_type": "markdown",
  43 |       "source": [
  44 |         "Data Collection & Processing"
  45 |       ],
  46 |       "metadata": {
  47 |         "id": "6C-ri2RfZINI"
  48 |       }
  49 |     },
  50 |     {
  51 |       "cell_type": "code",
  52 |       "metadata": {
  53 |         "id": "0q-3-LkQrREV"
  54 |       },
  55 |       "source": [
  56 |         "# loading the csv data to a Pandas DataFrame\n",
  57 |         "heart_data = pd.read_csv('heart.csv')"
  58 |       ],
  59 |       "execution_count": null,
  60 |       "outputs": []
  61 |     },
  62 |     {
  63 |       "cell_type": "code",
  64 |       "metadata": {
  65 |         "colab": {
  66 |           "base_uri": "https://localhost:8080/",
  67 |           "height": 206
  68 |         },
  69 |         "id": "M8dQxSTqriWD",
  70 |         "outputId": "fb5a61f8-1a7e-48b2-8324-dec8280bde10"
  71 |       },
  72 |       "source": [
  73 |         "# print first 5 rows of the dataset\n",
  74 |         "heart_data.head()"
  75 |       ],
  76 |       "execution_count": null,
  77 |       "outputs": [
  78 |         {
  79 |           "output_type": "execute_result",
  80 |           "data": {
  81 |             "text/plain": [
  82 |               "   age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  slope  \\\n",
  83 |               "0   63    1   3       145   233    1        0      150      0      2.3      0   \n",
  84 |               "1   37    1   2       130   250    0        1      187      0      3.5      0   \n",
  85 |               "2   41    0   1       130   204    0        0      172      0      1.4      2   \n",
  86 |               "3   56    1   1       120   236    0        1      178      0      0.8      2   \n",
  87 |               "4   57    0   0       120   354    0        1      163      1      0.6      2   \n",
  88 |               "\n",
  89 |               "   ca  thal  target  \n",
  90 |               "0   0     1       1  \n",
  91 |               "1   0     2       1  \n",
  92 |               "2   0     2       1  \n",
  93 |               "3   0     2       1  \n",
  94 |               "4   0     2       1  "
  95 |             ],
  96 |             "text/html": [
  97 |               "\n",
  98 |               "  <div id=\"df-34720754-a536-40c3-8ad5-433546461268\">\n",
  99 |               "    <div class=\"colab-df-container\">\n",
 100 |               "      <div>\n",
 101 |               "<style scoped>\n",
 102 |               "    .dataframe tbody tr th:only-of-type {\n",
 103 |               "        vertical-align: middle;\n",
 104 |               "    }\n",
 105 |               "\n",
 106 |               "    .dataframe tbody tr th {\n",
 107 |               "        vertical-align: top;\n",
 108 |               "    }\n",
 109 |               "\n",
 110 |               "    .dataframe thead th {\n",
 111 |               "        text-align: right;\n",
 112 |               "    }\n",
 113 |               "</style>\n",
 114 |               "<table border=\"1\" class=\"dataframe\">\n",
 115 |               "  <thead>\n",
 116 |               "    <tr style=\"text-align: right;\">\n",
 117 |               "      <th></th>\n",
 118 |               "      <th>age</th>\n",
 119 |               "      <th>sex</th>\n",
 120 |               "      <th>cp</th>\n",
 121 |               "      <th>trestbps</th>\n",
 122 |               "      <th>chol</th>\n",
 123 |               "      <th>fbs</th>\n",
 124 |               "      <th>restecg</th>\n",
 125 |               "      <th>thalach</th>\n",
 126 |               "      <th>exang</th>\n",
 127 |               "      <th>oldpeak</th>\n",
 128 |               "      <th>slope</th>\n",
 129 |               "      <th>ca</th>\n",
 130 |               "      <th>thal</th>\n",
 131 |               "      <th>target</th>\n",
 132 |               "    </tr>\n",
 133 |               "  </thead>\n",
 134 |               "  <tbody>\n",
 135 |               "    <tr>\n",
 136 |               "      <th>0</th>\n",
 137 |               "      <td>63</td>\n",
 138 |               "      <td>1</td>\n",
 139 |               "      <td>3</td>\n",
 140 |               "      <td>145</td>\n",
 141 |               "      <td>233</td>\n",
 142 |               "      <td>1</td>\n",
 143 |               "      <td>0</td>\n",
 144 |               "      <td>150</td>\n",
 145 |               "      <td>0</td>\n",
 146 |               "      <td>2.3</td>\n",
 147 |               "      <td>0</td>\n",
 148 |               "      <td>0</td>\n",
 149 |               "      <td>1</td>\n",
 150 |               "      <td>1</td>\n",
 151 |               "    </tr>\n",
 152 |               "    <tr>\n",
 153 |               "      <th>1</th>\n",
 154 |               "      <td>37</td>\n",
 155 |               "      <td>1</td>\n",
 156 |               "      <td>2</td>\n",
 157 |               "      <td>130</td>\n",
 158 |               "      <td>250</td>\n",
 159 |               "      <td>0</td>\n",
 160 |               "      <td>1</td>\n",
 161 |               "      <td>187</td>\n",
 162 |               "      <td>0</td>\n",
 163 |               "      <td>3.5</td>\n",
 164 |               "      <td>0</td>\n",
 165 |               "      <td>0</td>\n",
 166 |               "      <td>2</td>\n",
 167 |               "      <td>1</td>\n",
 168 |               "    </tr>\n",
 169 |               "    <tr>\n",
 170 |               "      <th>2</th>\n",
 171 |               "      <td>41</td>\n",
 172 |               "      <td>0</td>\n",
 173 |               "      <td>1</td>\n",
 174 |               "      <td>130</td>\n",
 175 |               "      <td>204</td>\n",
 176 |               "      <td>0</td>\n",
 177 |               "      <td>0</td>\n",
 178 |               "      <td>172</td>\n",
 179 |               "      <td>0</td>\n",
 180 |               "      <td>1.4</td>\n",
 181 |               "      <td>2</td>\n",
 182 |               "      <td>0</td>\n",
 183 |               "      <td>2</td>\n",
 184 |               "      <td>1</td>\n",
 185 |               "    </tr>\n",
 186 |               "    <tr>\n",
 187 |               "      <th>3</th>\n",
 188 |               "      <td>56</td>\n",
 189 |               "      <td>1</td>\n",
 190 |               "      <td>1</td>\n",
 191 |               "      <td>120</td>\n",
 192 |               "      <td>236</td>\n",
 193 |               "      <td>0</td>\n",
 194 |               "      <td>1</td>\n",
 195 |               "      <td>178</td>\n",
 196 |               "      <td>0</td>\n",
 197 |               "      <td>0.8</td>\n",
 198 |               "      <td>2</td>\n",
 199 |               "      <td>0</td>\n",
 200 |               "      <td>2</td>\n",
 201 |               "      <td>1</td>\n",
 202 |               "    </tr>\n",
 203 |               "    <tr>\n",
 204 |               "      <th>4</th>\n",
 205 |               "      <td>57</td>\n",
 206 |               "      <td>0</td>\n",
 207 |               "      <td>0</td>\n",
 208 |               "      <td>120</td>\n",
 209 |               "      <td>354</td>\n",
 210 |               "      <td>0</td>\n",
 211 |               "      <td>1</td>\n",
 212 |               "      <td>163</td>\n",
 213 |               "      <td>1</td>\n",
 214 |               "      <td>0.6</td>\n",
 215 |               "      <td>2</td>\n",
 216 |               "      <td>0</td>\n",
 217 |               "      <td>2</td>\n",
 218 |               "      <td>1</td>\n",
 219 |               "    </tr>\n",
 220 |               "  </tbody>\n",
 221 |               "</table>\n",
 222 |               "</div>\n",
 223 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-34720754-a536-40c3-8ad5-433546461268')\"\n",
 224 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
 225 |               "              style=\"display:none;\">\n",
 226 |               "        \n",
 227 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
 228 |               "       width=\"24px\">\n",
 229 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
 230 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
 231 |               "  </svg>\n",
 232 |               "      </button>\n",
 233 |               "      \n",
 234 |               "  <style>\n",
 235 |               "    .colab-df-container {\n",
 236 |               "      display:flex;\n",
 237 |               "      flex-wrap:wrap;\n",
 238 |               "      gap: 12px;\n",
 239 |               "    }\n",
 240 |               "\n",
 241 |               "    .colab-df-convert {\n",
 242 |               "      background-color: #E8F0FE;\n",
 243 |               "      border: none;\n",
 244 |               "      border-radius: 50%;\n",
 245 |               "      cursor: pointer;\n",
 246 |               "      display: none;\n",
 247 |               "      fill: #1967D2;\n",
 248 |               "      height: 32px;\n",
 249 |               "      padding: 0 0 0 0;\n",
 250 |               "      width: 32px;\n",
 251 |               "    }\n",
 252 |               "\n",
 253 |               "    .colab-df-convert:hover {\n",
 254 |               "      background-color: #E2EBFA;\n",
 255 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
 256 |               "      fill: #174EA6;\n",
 257 |               "    }\n",
 258 |               "\n",
 259 |               "    [theme=dark] .colab-df-convert {\n",
 260 |               "      background-color: #3B4455;\n",
 261 |               "      fill: #D2E3FC;\n",
 262 |               "    }\n",
 263 |               "\n",
 264 |               "    [theme=dark] .colab-df-convert:hover {\n",
 265 |               "      background-color: #434B5C;\n",
 266 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
 267 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
 268 |               "      fill: #FFFFFF;\n",
 269 |               "    }\n",
 270 |               "  </style>\n",
 271 |               "\n",
 272 |               "      <script>\n",
 273 |               "        const buttonEl =\n",
 274 |               "          document.querySelector('#df-34720754-a536-40c3-8ad5-433546461268 button.colab-df-convert');\n",
 275 |               "        buttonEl.style.display =\n",
 276 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
 277 |               "\n",
 278 |               "        async function convertToInteractive(key) {\n",
 279 |               "          const element = document.querySelector('#df-34720754-a536-40c3-8ad5-433546461268');\n",
 280 |               "          const dataTable =\n",
 281 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
 282 |               "                                                     [key], {});\n",
 283 |               "          if (!dataTable) return;\n",
 284 |               "\n",
 285 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
 286 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
 287 |               "            + ' to learn more about interactive tables.';\n",
 288 |               "          element.innerHTML = '';\n",
 289 |               "          dataTable['output_type'] = 'display_data';\n",
 290 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
 291 |               "          const docLink = document.createElement('div');\n",
 292 |               "          docLink.innerHTML = docLinkHtml;\n",
 293 |               "          element.appendChild(docLink);\n",
 294 |               "        }\n",
 295 |               "      </script>\n",
 296 |               "    </div>\n",
 297 |               "  </div>\n",
 298 |               "  "
 299 |             ]
 300 |           },
 301 |           "metadata": {},
 302 |           "execution_count": 3
 303 |         }
 304 |       ]
 305 |     },
 306 |     {
 307 |       "cell_type": "code",
 308 |       "metadata": {
 309 |         "colab": {
 310 |           "base_uri": "https://localhost:8080/",
 311 |           "height": 206
 312 |         },
 313 |         "id": "Fx_aCZDgrqdR",
 314 |         "outputId": "e4a5c735-f1cb-4a24-d522-66e6fe0181d6"
 315 |       },
 316 |       "source": [
 317 |         "# print last 5 rows of the dataset\n",
 318 |         "heart_data.tail()"
 319 |       ],
 320 |       "execution_count": null,
 321 |       "outputs": [
 322 |         {
 323 |           "output_type": "execute_result",
 324 |           "data": {
 325 |             "text/plain": [
 326 |               "     age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  \\\n",
 327 |               "298   57    0   0       140   241    0        1      123      1      0.2   \n",
 328 |               "299   45    1   3       110   264    0        1      132      0      1.2   \n",
 329 |               "300   68    1   0       144   193    1        1      141      0      3.4   \n",
 330 |               "301   57    1   0       130   131    0        1      115      1      1.2   \n",
 331 |               "302   57    0   1       130   236    0        0      174      0      0.0   \n",
 332 |               "\n",
 333 |               "     slope  ca  thal  target  \n",
 334 |               "298      1   0     3       0  \n",
 335 |               "299      1   0     3       0  \n",
 336 |               "300      1   2     3       0  \n",
 337 |               "301      1   1     3       0  \n",
 338 |               "302      1   1     2       0  "
 339 |             ],
 340 |             "text/html": [
 341 |               "\n",
 342 |               "  <div id=\"df-5f706685-1fd1-44f9-ba5a-9783a7751daa\">\n",
 343 |               "    <div class=\"colab-df-container\">\n",
 344 |               "      <div>\n",
 345 |               "<style scoped>\n",
 346 |               "    .dataframe tbody tr th:only-of-type {\n",
 347 |               "        vertical-align: middle;\n",
 348 |               "    }\n",
 349 |               "\n",
 350 |               "    .dataframe tbody tr th {\n",
 351 |               "        vertical-align: top;\n",
 352 |               "    }\n",
 353 |               "\n",
 354 |               "    .dataframe thead th {\n",
 355 |               "        text-align: right;\n",
 356 |               "    }\n",
 357 |               "</style>\n",
 358 |               "<table border=\"1\" class=\"dataframe\">\n",
 359 |               "  <thead>\n",
 360 |               "    <tr style=\"text-align: right;\">\n",
 361 |               "      <th></th>\n",
 362 |               "      <th>age</th>\n",
 363 |               "      <th>sex</th>\n",
 364 |               "      <th>cp</th>\n",
 365 |               "      <th>trestbps</th>\n",
 366 |               "      <th>chol</th>\n",
 367 |               "      <th>fbs</th>\n",
 368 |               "      <th>restecg</th>\n",
 369 |               "      <th>thalach</th>\n",
 370 |               "      <th>exang</th>\n",
 371 |               "      <th>oldpeak</th>\n",
 372 |               "      <th>slope</th>\n",
 373 |               "      <th>ca</th>\n",
 374 |               "      <th>thal</th>\n",
 375 |               "      <th>target</th>\n",
 376 |               "    </tr>\n",
 377 |               "  </thead>\n",
 378 |               "  <tbody>\n",
 379 |               "    <tr>\n",
 380 |               "      <th>298</th>\n",
 381 |               "      <td>57</td>\n",
 382 |               "      <td>0</td>\n",
 383 |               "      <td>0</td>\n",
 384 |               "      <td>140</td>\n",
 385 |               "      <td>241</td>\n",
 386 |               "      <td>0</td>\n",
 387 |               "      <td>1</td>\n",
 388 |               "      <td>123</td>\n",
 389 |               "      <td>1</td>\n",
 390 |               "      <td>0.2</td>\n",
 391 |               "      <td>1</td>\n",
 392 |               "      <td>0</td>\n",
 393 |               "      <td>3</td>\n",
 394 |               "      <td>0</td>\n",
 395 |               "    </tr>\n",
 396 |               "    <tr>\n",
 397 |               "      <th>299</th>\n",
 398 |               "      <td>45</td>\n",
 399 |               "      <td>1</td>\n",
 400 |               "      <td>3</td>\n",
 401 |               "      <td>110</td>\n",
 402 |               "      <td>264</td>\n",
 403 |               "      <td>0</td>\n",
 404 |               "      <td>1</td>\n",
 405 |               "      <td>132</td>\n",
 406 |               "      <td>0</td>\n",
 407 |               "      <td>1.2</td>\n",
 408 |               "      <td>1</td>\n",
 409 |               "      <td>0</td>\n",
 410 |               "      <td>3</td>\n",
 411 |               "      <td>0</td>\n",
 412 |               "    </tr>\n",
 413 |               "    <tr>\n",
 414 |               "      <th>300</th>\n",
 415 |               "      <td>68</td>\n",
 416 |               "      <td>1</td>\n",
 417 |               "      <td>0</td>\n",
 418 |               "      <td>144</td>\n",
 419 |               "      <td>193</td>\n",
 420 |               "      <td>1</td>\n",
 421 |               "      <td>1</td>\n",
 422 |               "      <td>141</td>\n",
 423 |               "      <td>0</td>\n",
 424 |               "      <td>3.4</td>\n",
 425 |               "      <td>1</td>\n",
 426 |               "      <td>2</td>\n",
 427 |               "      <td>3</td>\n",
 428 |               "      <td>0</td>\n",
 429 |               "    </tr>\n",
 430 |               "    <tr>\n",
 431 |               "      <th>301</th>\n",
 432 |               "      <td>57</td>\n",
 433 |               "      <td>1</td>\n",
 434 |               "      <td>0</td>\n",
 435 |               "      <td>130</td>\n",
 436 |               "      <td>131</td>\n",
 437 |               "      <td>0</td>\n",
 438 |               "      <td>1</td>\n",
 439 |               "      <td>115</td>\n",
 440 |               "      <td>1</td>\n",
 441 |               "      <td>1.2</td>\n",
 442 |               "      <td>1</td>\n",
 443 |               "      <td>1</td>\n",
 444 |               "      <td>3</td>\n",
 445 |               "      <td>0</td>\n",
 446 |               "    </tr>\n",
 447 |               "    <tr>\n",
 448 |               "      <th>302</th>\n",
 449 |               "      <td>57</td>\n",
 450 |               "      <td>0</td>\n",
 451 |               "      <td>1</td>\n",
 452 |               "      <td>130</td>\n",
 453 |               "      <td>236</td>\n",
 454 |               "      <td>0</td>\n",
 455 |               "      <td>0</td>\n",
 456 |               "      <td>174</td>\n",
 457 |               "      <td>0</td>\n",
 458 |               "      <td>0.0</td>\n",
 459 |               "      <td>1</td>\n",
 460 |               "      <td>1</td>\n",
 461 |               "      <td>2</td>\n",
 462 |               "      <td>0</td>\n",
 463 |               "    </tr>\n",
 464 |               "  </tbody>\n",
 465 |               "</table>\n",
 466 |               "</div>\n",
 467 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-5f706685-1fd1-44f9-ba5a-9783a7751daa')\"\n",
 468 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
 469 |               "              style=\"display:none;\">\n",
 470 |               "        \n",
 471 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
 472 |               "       width=\"24px\">\n",
 473 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
 474 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
 475 |               "  </svg>\n",
 476 |               "      </button>\n",
 477 |               "      \n",
 478 |               "  <style>\n",
 479 |               "    .colab-df-container {\n",
 480 |               "      display:flex;\n",
 481 |               "      flex-wrap:wrap;\n",
 482 |               "      gap: 12px;\n",
 483 |               "    }\n",
 484 |               "\n",
 485 |               "    .colab-df-convert {\n",
 486 |               "      background-color: #E8F0FE;\n",
 487 |               "      border: none;\n",
 488 |               "      border-radius: 50%;\n",
 489 |               "      cursor: pointer;\n",
 490 |               "      display: none;\n",
 491 |               "      fill: #1967D2;\n",
 492 |               "      height: 32px;\n",
 493 |               "      padding: 0 0 0 0;\n",
 494 |               "      width: 32px;\n",
 495 |               "    }\n",
 496 |               "\n",
 497 |               "    .colab-df-convert:hover {\n",
 498 |               "      background-color: #E2EBFA;\n",
 499 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
 500 |               "      fill: #174EA6;\n",
 501 |               "    }\n",
 502 |               "\n",
 503 |               "    [theme=dark] .colab-df-convert {\n",
 504 |               "      background-color: #3B4455;\n",
 505 |               "      fill: #D2E3FC;\n",
 506 |               "    }\n",
 507 |               "\n",
 508 |               "    [theme=dark] .colab-df-convert:hover {\n",
 509 |               "      background-color: #434B5C;\n",
 510 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
 511 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
 512 |               "      fill: #FFFFFF;\n",
 513 |               "    }\n",
 514 |               "  </style>\n",
 515 |               "\n",
 516 |               "      <script>\n",
 517 |               "        const buttonEl =\n",
 518 |               "          document.querySelector('#df-5f706685-1fd1-44f9-ba5a-9783a7751daa button.colab-df-convert');\n",
 519 |               "        buttonEl.style.display =\n",
 520 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
 521 |               "\n",
 522 |               "        async function convertToInteractive(key) {\n",
 523 |               "          const element = document.querySelector('#df-5f706685-1fd1-44f9-ba5a-9783a7751daa');\n",
 524 |               "          const dataTable =\n",
 525 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
 526 |               "                                                     [key], {});\n",
 527 |               "          if (!dataTable) return;\n",
 528 |               "\n",
 529 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
 530 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
 531 |               "            + ' to learn more about interactive tables.';\n",
 532 |               "          element.innerHTML = '';\n",
 533 |               "          dataTable['output_type'] = 'display_data';\n",
 534 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
 535 |               "          const docLink = document.createElement('div');\n",
 536 |               "          docLink.innerHTML = docLinkHtml;\n",
 537 |               "          element.appendChild(docLink);\n",
 538 |               "        }\n",
 539 |               "      </script>\n",
 540 |               "    </div>\n",
 541 |               "  </div>\n",
 542 |               "  "
 543 |             ]
 544 |           },
 545 |           "metadata": {},
 546 |           "execution_count": 4
 547 |         }
 548 |       ]
 549 |     },
 550 |     {
 551 |       "cell_type": "code",
 552 |       "metadata": {
 553 |         "colab": {
 554 |           "base_uri": "https://localhost:8080/"
 555 |         },
 556 |         "id": "8nX1tIzbrz0u",
 557 |         "outputId": "9833ad88-1626-477c-d363-045b919a5589"
 558 |       },
 559 |       "source": [
 560 |         "# number of rows and columns in the dataset\n",
 561 |         "heart_data.shape"
 562 |       ],
 563 |       "execution_count": null,
 564 |       "outputs": [
 565 |         {
 566 |           "output_type": "execute_result",
 567 |           "data": {
 568 |             "text/plain": [
 569 |               "(303, 14)"
 570 |             ]
 571 |           },
 572 |           "metadata": {},
 573 |           "execution_count": 5
 574 |         }
 575 |       ]
 576 |     },
 577 |     {
 578 |       "cell_type": "code",
 579 |       "metadata": {
 580 |         "colab": {
 581 |           "base_uri": "https://localhost:8080/"
 582 |         },
 583 |         "id": "7_xTcw1Sr6aJ",
 584 |         "outputId": "10d605fe-bbdd-4084-924f-d228f0b15221"
 585 |       },
 586 |       "source": [
 587 |         "# getting some info about the data\n",
 588 |         "heart_data.info()"
 589 |       ],
 590 |       "execution_count": null,
 591 |       "outputs": [
 592 |         {
 593 |           "output_type": "stream",
 594 |           "name": "stdout",
 595 |           "text": [
 596 |             "<class 'pandas.core.frame.DataFrame'>\n",
 597 |             "RangeIndex: 303 entries, 0 to 302\n",
 598 |             "Data columns (total 14 columns):\n",
 599 |             " #   Column    Non-Null Count  Dtype  \n",
 600 |             "---  ------    --------------  -----  \n",
 601 |             " 0   age       303 non-null    int64  \n",
 602 |             " 1   sex       303 non-null    int64  \n",
 603 |             " 2   cp        303 non-null    int64  \n",
 604 |             " 3   trestbps  303 non-null    int64  \n",
 605 |             " 4   chol      303 non-null    int64  \n",
 606 |             " 5   fbs       303 non-null    int64  \n",
 607 |             " 6   restecg   303 non-null    int64  \n",
 608 |             " 7   thalach   303 non-null    int64  \n",
 609 |             " 8   exang     303 non-null    int64  \n",
 610 |             " 9   oldpeak   303 non-null    float64\n",
 611 |             " 10  slope     303 non-null    int64  \n",
 612 |             " 11  ca        303 non-null    int64  \n",
 613 |             " 12  thal      303 non-null    int64  \n",
 614 |             " 13  target    303 non-null    int64  \n",
 615 |             "dtypes: float64(1), int64(13)\n",
 616 |             "memory usage: 33.3 KB\n"
 617 |           ]
 618 |         }
 619 |       ]
 620 |     },
 621 |     {
 622 |       "cell_type": "code",
 623 |       "metadata": {
 624 |         "colab": {
 625 |           "base_uri": "https://localhost:8080/"
 626 |         },
 627 |         "id": "GjHtW31rsGlb",
 628 |         "outputId": "ce7ae9fd-669e-4ff0-b0a4-59e44865ea16"
 629 |       },
 630 |       "source": [
 631 |         "# checking for missing values\n",
 632 |         "heart_data.isnull().sum()"
 633 |       ],
 634 |       "execution_count": null,
 635 |       "outputs": [
 636 |         {
 637 |           "output_type": "execute_result",
 638 |           "data": {
 639 |             "text/plain": [
 640 |               "age         0\n",
 641 |               "sex         0\n",
 642 |               "cp          0\n",
 643 |               "trestbps    0\n",
 644 |               "chol        0\n",
 645 |               "fbs         0\n",
 646 |               "restecg     0\n",
 647 |               "thalach     0\n",
 648 |               "exang       0\n",
 649 |               "oldpeak     0\n",
 650 |               "slope       0\n",
 651 |               "ca          0\n",
 652 |               "thal        0\n",
 653 |               "target      0\n",
 654 |               "dtype: int64"
 655 |             ]
 656 |           },
 657 |           "metadata": {},
 658 |           "execution_count": 7
 659 |         }
 660 |       ]
 661 |     },
 662 |     {
 663 |       "cell_type": "code",
 664 |       "metadata": {
 665 |         "colab": {
 666 |           "base_uri": "https://localhost:8080/",
 667 |           "height": 364
 668 |         },
 669 |         "id": "OHmcP7DJsSEP",
 670 |         "outputId": "6d87c7ab-216f-4abf-a304-84a4ae6a2661"
 671 |       },
 672 |       "source": [
 673 |         "# statistical measures about the data\n",
 674 |         "heart_data.describe()"
 675 |       ],
 676 |       "execution_count": null,
 677 |       "outputs": [
 678 |         {
 679 |           "output_type": "execute_result",
 680 |           "data": {
 681 |             "text/plain": [
 682 |               "              age         sex          cp    trestbps        chol         fbs  \\\n",
 683 |               "count  303.000000  303.000000  303.000000  303.000000  303.000000  303.000000   \n",
 684 |               "mean    54.366337    0.683168    0.966997  131.623762  246.264026    0.148515   \n",
 685 |               "std      9.082101    0.466011    1.032052   17.538143   51.830751    0.356198   \n",
 686 |               "min     29.000000    0.000000    0.000000   94.000000  126.000000    0.000000   \n",
 687 |               "25%     47.500000    0.000000    0.000000  120.000000  211.000000    0.000000   \n",
 688 |               "50%     55.000000    1.000000    1.000000  130.000000  240.000000    0.000000   \n",
 689 |               "75%     61.000000    1.000000    2.000000  140.000000  274.500000    0.000000   \n",
 690 |               "max     77.000000    1.000000    3.000000  200.000000  564.000000    1.000000   \n",
 691 |               "\n",
 692 |               "          restecg     thalach       exang     oldpeak       slope          ca  \\\n",
 693 |               "count  303.000000  303.000000  303.000000  303.000000  303.000000  303.000000   \n",
 694 |               "mean     0.528053  149.646865    0.326733    1.039604    1.399340    0.729373   \n",
 695 |               "std      0.525860   22.905161    0.469794    1.161075    0.616226    1.022606   \n",
 696 |               "min      0.000000   71.000000    0.000000    0.000000    0.000000    0.000000   \n",
 697 |               "25%      0.000000  133.500000    0.000000    0.000000    1.000000    0.000000   \n",
 698 |               "50%      1.000000  153.000000    0.000000    0.800000    1.000000    0.000000   \n",
 699 |               "75%      1.000000  166.000000    1.000000    1.600000    2.000000    1.000000   \n",
 700 |               "max      2.000000  202.000000    1.000000    6.200000    2.000000    4.000000   \n",
 701 |               "\n",
 702 |               "             thal      target  \n",
 703 |               "count  303.000000  303.000000  \n",
 704 |               "mean     2.313531    0.544554  \n",
 705 |               "std      0.612277    0.498835  \n",
 706 |               "min      0.000000    0.000000  \n",
 707 |               "25%      2.000000    0.000000  \n",
 708 |               "50%      2.000000    1.000000  \n",
 709 |               "75%      3.000000    1.000000  \n",
 710 |               "max      3.000000    1.000000  "
 711 |             ],
 712 |             "text/html": [
 713 |               "\n",
 714 |               "  <div id=\"df-189f2581-9c73-4140-8aaa-51ff34091889\">\n",
 715 |               "    <div class=\"colab-df-container\">\n",
 716 |               "      <div>\n",
 717 |               "<style scoped>\n",
 718 |               "    .dataframe tbody tr th:only-of-type {\n",
 719 |               "        vertical-align: middle;\n",
 720 |               "    }\n",
 721 |               "\n",
 722 |               "    .dataframe tbody tr th {\n",
 723 |               "        vertical-align: top;\n",
 724 |               "    }\n",
 725 |               "\n",
 726 |               "    .dataframe thead th {\n",
 727 |               "        text-align: right;\n",
 728 |               "    }\n",
 729 |               "</style>\n",
 730 |               "<table border=\"1\" class=\"dataframe\">\n",
 731 |               "  <thead>\n",
 732 |               "    <tr style=\"text-align: right;\">\n",
 733 |               "      <th></th>\n",
 734 |               "      <th>age</th>\n",
 735 |               "      <th>sex</th>\n",
 736 |               "      <th>cp</th>\n",
 737 |               "      <th>trestbps</th>\n",
 738 |               "      <th>chol</th>\n",
 739 |               "      <th>fbs</th>\n",
 740 |               "      <th>restecg</th>\n",
 741 |               "      <th>thalach</th>\n",
 742 |               "      <th>exang</th>\n",
 743 |               "      <th>oldpeak</th>\n",
 744 |               "      <th>slope</th>\n",
 745 |               "      <th>ca</th>\n",
 746 |               "      <th>thal</th>\n",
 747 |               "      <th>target</th>\n",
 748 |               "    </tr>\n",
 749 |               "  </thead>\n",
 750 |               "  <tbody>\n",
 751 |               "    <tr>\n",
 752 |               "      <th>count</th>\n",
 753 |               "      <td>303.000000</td>\n",
 754 |               "      <td>303.000000</td>\n",
 755 |               "      <td>303.000000</td>\n",
 756 |               "      <td>303.000000</td>\n",
 757 |               "      <td>303.000000</td>\n",
 758 |               "      <td>303.000000</td>\n",
 759 |               "      <td>303.000000</td>\n",
 760 |               "      <td>303.000000</td>\n",
 761 |               "      <td>303.000000</td>\n",
 762 |               "      <td>303.000000</td>\n",
 763 |               "      <td>303.000000</td>\n",
 764 |               "      <td>303.000000</td>\n",
 765 |               "      <td>303.000000</td>\n",
 766 |               "      <td>303.000000</td>\n",
 767 |               "    </tr>\n",
 768 |               "    <tr>\n",
 769 |               "      <th>mean</th>\n",
 770 |               "      <td>54.366337</td>\n",
 771 |               "      <td>0.683168</td>\n",
 772 |               "      <td>0.966997</td>\n",
 773 |               "      <td>131.623762</td>\n",
 774 |               "      <td>246.264026</td>\n",
 775 |               "      <td>0.148515</td>\n",
 776 |               "      <td>0.528053</td>\n",
 777 |               "      <td>149.646865</td>\n",
 778 |               "      <td>0.326733</td>\n",
 779 |               "      <td>1.039604</td>\n",
 780 |               "      <td>1.399340</td>\n",
 781 |               "      <td>0.729373</td>\n",
 782 |               "      <td>2.313531</td>\n",
 783 |               "      <td>0.544554</td>\n",
 784 |               "    </tr>\n",
 785 |               "    <tr>\n",
 786 |               "      <th>std</th>\n",
 787 |               "      <td>9.082101</td>\n",
 788 |               "      <td>0.466011</td>\n",
 789 |               "      <td>1.032052</td>\n",
 790 |               "      <td>17.538143</td>\n",
 791 |               "      <td>51.830751</td>\n",
 792 |               "      <td>0.356198</td>\n",
 793 |               "      <td>0.525860</td>\n",
 794 |               "      <td>22.905161</td>\n",
 795 |               "      <td>0.469794</td>\n",
 796 |               "      <td>1.161075</td>\n",
 797 |               "      <td>0.616226</td>\n",
 798 |               "      <td>1.022606</td>\n",
 799 |               "      <td>0.612277</td>\n",
 800 |               "      <td>0.498835</td>\n",
 801 |               "    </tr>\n",
 802 |               "    <tr>\n",
 803 |               "      <th>min</th>\n",
 804 |               "      <td>29.000000</td>\n",
 805 |               "      <td>0.000000</td>\n",
 806 |               "      <td>0.000000</td>\n",
 807 |               "      <td>94.000000</td>\n",
 808 |               "      <td>126.000000</td>\n",
 809 |               "      <td>0.000000</td>\n",
 810 |               "      <td>0.000000</td>\n",
 811 |               "      <td>71.000000</td>\n",
 812 |               "      <td>0.000000</td>\n",
 813 |               "      <td>0.000000</td>\n",
 814 |               "      <td>0.000000</td>\n",
 815 |               "      <td>0.000000</td>\n",
 816 |               "      <td>0.000000</td>\n",
 817 |               "      <td>0.000000</td>\n",
 818 |               "    </tr>\n",
 819 |               "    <tr>\n",
 820 |               "      <th>25%</th>\n",
 821 |               "      <td>47.500000</td>\n",
 822 |               "      <td>0.000000</td>\n",
 823 |               "      <td>0.000000</td>\n",
 824 |               "      <td>120.000000</td>\n",
 825 |               "      <td>211.000000</td>\n",
 826 |               "      <td>0.000000</td>\n",
 827 |               "      <td>0.000000</td>\n",
 828 |               "      <td>133.500000</td>\n",
 829 |               "      <td>0.000000</td>\n",
 830 |               "      <td>0.000000</td>\n",
 831 |               "      <td>1.000000</td>\n",
 832 |               "      <td>0.000000</td>\n",
 833 |               "      <td>2.000000</td>\n",
 834 |               "      <td>0.000000</td>\n",
 835 |               "    </tr>\n",
 836 |               "    <tr>\n",
 837 |               "      <th>50%</th>\n",
 838 |               "      <td>55.000000</td>\n",
 839 |               "      <td>1.000000</td>\n",
 840 |               "      <td>1.000000</td>\n",
 841 |               "      <td>130.000000</td>\n",
 842 |               "      <td>240.000000</td>\n",
 843 |               "      <td>0.000000</td>\n",
 844 |               "      <td>1.000000</td>\n",
 845 |               "      <td>153.000000</td>\n",
 846 |               "      <td>0.000000</td>\n",
 847 |               "      <td>0.800000</td>\n",
 848 |               "      <td>1.000000</td>\n",
 849 |               "      <td>0.000000</td>\n",
 850 |               "      <td>2.000000</td>\n",
 851 |               "      <td>1.000000</td>\n",
 852 |               "    </tr>\n",
 853 |               "    <tr>\n",
 854 |               "      <th>75%</th>\n",
 855 |               "      <td>61.000000</td>\n",
 856 |               "      <td>1.000000</td>\n",
 857 |               "      <td>2.000000</td>\n",
 858 |               "      <td>140.000000</td>\n",
 859 |               "      <td>274.500000</td>\n",
 860 |               "      <td>0.000000</td>\n",
 861 |               "      <td>1.000000</td>\n",
 862 |               "      <td>166.000000</td>\n",
 863 |               "      <td>1.000000</td>\n",
 864 |               "      <td>1.600000</td>\n",
 865 |               "      <td>2.000000</td>\n",
 866 |               "      <td>1.000000</td>\n",
 867 |               "      <td>3.000000</td>\n",
 868 |               "      <td>1.000000</td>\n",
 869 |               "    </tr>\n",
 870 |               "    <tr>\n",
 871 |               "      <th>max</th>\n",
 872 |               "      <td>77.000000</td>\n",
 873 |               "      <td>1.000000</td>\n",
 874 |               "      <td>3.000000</td>\n",
 875 |               "      <td>200.000000</td>\n",
 876 |               "      <td>564.000000</td>\n",
 877 |               "      <td>1.000000</td>\n",
 878 |               "      <td>2.000000</td>\n",
 879 |               "      <td>202.000000</td>\n",
 880 |               "      <td>1.000000</td>\n",
 881 |               "      <td>6.200000</td>\n",
 882 |               "      <td>2.000000</td>\n",
 883 |               "      <td>4.000000</td>\n",
 884 |               "      <td>3.000000</td>\n",
 885 |               "      <td>1.000000</td>\n",
 886 |               "    </tr>\n",
 887 |               "  </tbody>\n",
 888 |               "</table>\n",
 889 |               "</div>\n",
 890 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-189f2581-9c73-4140-8aaa-51ff34091889')\"\n",
 891 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
 892 |               "              style=\"display:none;\">\n",
 893 |               "        \n",
 894 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
 895 |               "       width=\"24px\">\n",
 896 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
 897 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
 898 |               "  </svg>\n",
 899 |               "      </button>\n",
 900 |               "      \n",
 901 |               "  <style>\n",
 902 |               "    .colab-df-container {\n",
 903 |               "      display:flex;\n",
 904 |               "      flex-wrap:wrap;\n",
 905 |               "      gap: 12px;\n",
 906 |               "    }\n",
 907 |               "\n",
 908 |               "    .colab-df-convert {\n",
 909 |               "      background-color: #E8F0FE;\n",
 910 |               "      border: none;\n",
 911 |               "      border-radius: 50%;\n",
 912 |               "      cursor: pointer;\n",
 913 |               "      display: none;\n",
 914 |               "      fill: #1967D2;\n",
 915 |               "      height: 32px;\n",
 916 |               "      padding: 0 0 0 0;\n",
 917 |               "      width: 32px;\n",
 918 |               "    }\n",
 919 |               "\n",
 920 |               "    .colab-df-convert:hover {\n",
 921 |               "      background-color: #E2EBFA;\n",
 922 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
 923 |               "      fill: #174EA6;\n",
 924 |               "    }\n",
 925 |               "\n",
 926 |               "    [theme=dark] .colab-df-convert {\n",
 927 |               "      background-color: #3B4455;\n",
 928 |               "      fill: #D2E3FC;\n",
 929 |               "    }\n",
 930 |               "\n",
 931 |               "    [theme=dark] .colab-df-convert:hover {\n",
 932 |               "      background-color: #434B5C;\n",
 933 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
 934 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
 935 |               "      fill: #FFFFFF;\n",
 936 |               "    }\n",
 937 |               "  </style>\n",
 938 |               "\n",
 939 |               "      <script>\n",
 940 |               "        const buttonEl =\n",
 941 |               "          document.querySelector('#df-189f2581-9c73-4140-8aaa-51ff34091889 button.colab-df-convert');\n",
 942 |               "        buttonEl.style.display =\n",
 943 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
 944 |               "\n",
 945 |               "        async function convertToInteractive(key) {\n",
 946 |               "          const element = document.querySelector('#df-189f2581-9c73-4140-8aaa-51ff34091889');\n",
 947 |               "          const dataTable =\n",
 948 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
 949 |               "                                                     [key], {});\n",
 950 |               "          if (!dataTable) return;\n",
 951 |               "\n",
 952 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
 953 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
 954 |               "            + ' to learn more about interactive tables.';\n",
 955 |               "          element.innerHTML = '';\n",
 956 |               "          dataTable['output_type'] = 'display_data';\n",
 957 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
 958 |               "          const docLink = document.createElement('div');\n",
 959 |               "          docLink.innerHTML = docLinkHtml;\n",
 960 |               "          element.appendChild(docLink);\n",
 961 |               "        }\n",
 962 |               "      </script>\n",
 963 |               "    </div>\n",
 964 |               "  </div>\n",
 965 |               "  "
 966 |             ]
 967 |           },
 968 |           "metadata": {},
 969 |           "execution_count": 8
 970 |         }
 971 |       ]
 972 |     },
 973 |     {
 974 |       "cell_type": "code",
 975 |       "metadata": {
 976 |         "colab": {
 977 |           "base_uri": "https://localhost:8080/"
 978 |         },
 979 |         "id": "4InaOSIUsfWP",
 980 |         "outputId": "ad9d637a-8a1a-4435-881d-994f4f788d38"
 981 |       },
 982 |       "source": [
 983 |         "# checking the distribution of Target Variable\n",
 984 |         "heart_data['target'].value_counts()"
 985 |       ],
 986 |       "execution_count": null,
 987 |       "outputs": [
 988 |         {
 989 |           "output_type": "execute_result",
 990 |           "data": {
 991 |             "text/plain": [
 992 |               "1    165\n",
 993 |               "0    138\n",
 994 |               "Name: target, dtype: int64"
 995 |             ]
 996 |           },
 997 |           "metadata": {},
 998 |           "execution_count": 9
 999 |         }
1000 |       ]
1001 |     },
1002 |     {
1003 |       "cell_type": "markdown",
1004 |       "metadata": {
1005 |         "id": "aSOBu4qDtJy5"
1006 |       },
1007 |       "source": [
1008 |         "1 --> Defective Heart\n",
1009 |         "\n",
1010 |         "0 --> Healthy Heart"
1011 |       ]
1012 |     },
1013 |     {
1014 |       "cell_type": "markdown",
1015 |       "metadata": {
1016 |         "id": "tW8i4igjtPRC"
1017 |       },
1018 |       "source": [
1019 |         "Splitting the Features and Target"
1020 |       ]
1021 |     },
1022 |     {
1023 |       "cell_type": "code",
1024 |       "metadata": {
1025 |         "id": "Q6yfbswrs7m3"
1026 |       },
1027 |       "source": [
1028 |         "X = heart_data.drop(columns='target', axis=1)\n",
1029 |         "Y = heart_data['target']"
1030 |       ],
1031 |       "execution_count": null,
1032 |       "outputs": []
1033 |     },
1034 |     {
1035 |       "cell_type": "code",
1036 |       "metadata": {
1037 |         "colab": {
1038 |           "base_uri": "https://localhost:8080/"
1039 |         },
1040 |         "id": "XJoCp4ZKtpZy",
1041 |         "outputId": "516ecd1a-46a2-416f-9edc-3a05bd425ab9"
1042 |       },
1043 |       "source": [
1044 |         "print(X)"
1045 |       ],
1046 |       "execution_count": null,
1047 |       "outputs": [
1048 |         {
1049 |           "output_type": "stream",
1050 |           "name": "stdout",
1051 |           "text": [
1052 |             "     age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  \\\n",
1053 |             "0     63    1   3       145   233    1        0      150      0      2.3   \n",
1054 |             "1     37    1   2       130   250    0        1      187      0      3.5   \n",
1055 |             "2     41    0   1       130   204    0        0      172      0      1.4   \n",
1056 |             "3     56    1   1       120   236    0        1      178      0      0.8   \n",
1057 |             "4     57    0   0       120   354    0        1      163      1      0.6   \n",
1058 |             "..   ...  ...  ..       ...   ...  ...      ...      ...    ...      ...   \n",
1059 |             "298   57    0   0       140   241    0        1      123      1      0.2   \n",
1060 |             "299   45    1   3       110   264    0        1      132      0      1.2   \n",
1061 |             "300   68    1   0       144   193    1        1      141      0      3.4   \n",
1062 |             "301   57    1   0       130   131    0        1      115      1      1.2   \n",
1063 |             "302   57    0   1       130   236    0        0      174      0      0.0   \n",
1064 |             "\n",
1065 |             "     slope  ca  thal  \n",
1066 |             "0        0   0     1  \n",
1067 |             "1        0   0     2  \n",
1068 |             "2        2   0     2  \n",
1069 |             "3        2   0     2  \n",
1070 |             "4        2   0     2  \n",
1071 |             "..     ...  ..   ...  \n",
1072 |             "298      1   0     3  \n",
1073 |             "299      1   0     3  \n",
1074 |             "300      1   2     3  \n",
1075 |             "301      1   1     3  \n",
1076 |             "302      1   1     2  \n",
1077 |             "\n",
1078 |             "[303 rows x 13 columns]\n"
1079 |           ]
1080 |         }
1081 |       ]
1082 |     },
1083 |     {
1084 |       "cell_type": "code",
1085 |       "metadata": {
1086 |         "colab": {
1087 |           "base_uri": "https://localhost:8080/"
1088 |         },
1089 |         "id": "nukuj-YItq1w",
1090 |         "outputId": "3c412e56-1867-42f7-e1d6-ea573b1ef4af"
1091 |       },
1092 |       "source": [
1093 |         "print(Y)"
1094 |       ],
1095 |       "execution_count": null,
1096 |       "outputs": [
1097 |         {
1098 |           "output_type": "stream",
1099 |           "name": "stdout",
1100 |           "text": [
1101 |             "0      1\n",
1102 |             "1      1\n",
1103 |             "2      1\n",
1104 |             "3      1\n",
1105 |             "4      1\n",
1106 |             "      ..\n",
1107 |             "298    0\n",
1108 |             "299    0\n",
1109 |             "300    0\n",
1110 |             "301    0\n",
1111 |             "302    0\n",
1112 |             "Name: target, Length: 303, dtype: int64\n"
1113 |           ]
1114 |         }
1115 |       ]
1116 |     },
1117 |     {
1118 |       "cell_type": "markdown",
1119 |       "metadata": {
1120 |         "id": "_EcjSE3Et18n"
1121 |       },
1122 |       "source": [
1123 |         "Splitting the Data into Training data & Test Data"
1124 |       ]
1125 |     },
1126 |     {
1127 |       "cell_type": "code",
1128 |       "metadata": {
1129 |         "id": "a-UUfRUxtuga"
1130 |       },
1131 |       "source": [
1132 |         "X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.2, stratify=Y, random_state=2)"
1133 |       ],
1134 |       "execution_count": null,
1135 |       "outputs": []
1136 |     },
1137 |     {
1138 |       "cell_type": "code",
1139 |       "metadata": {
1140 |         "colab": {
1141 |           "base_uri": "https://localhost:8080/"
1142 |         },
1143 |         "id": "x7PrjC6zuf6X",
1144 |         "outputId": "ebc6e966-5cfd-4b84-dd99-eee68f318454"
1145 |       },
1146 |       "source": [
1147 |         "print(X.shape, X_train.shape, X_test.shape)"
1148 |       ],
1149 |       "execution_count": null,
1150 |       "outputs": [
1151 |         {
1152 |           "output_type": "stream",
1153 |           "name": "stdout",
1154 |           "text": [
1155 |             "(303, 13) (242, 13) (61, 13)\n"
1156 |           ]
1157 |         }
1158 |       ]
1159 |     },
1160 |     {
1161 |       "cell_type": "markdown",
1162 |       "metadata": {
1163 |         "id": "beSkZmpVuvn9"
1164 |       },
1165 |       "source": [
1166 |         "Model Training"
1167 |       ]
1168 |     },
1169 |     {
1170 |       "cell_type": "code",
1171 |       "metadata": {
1172 |         "id": "4-Md74FYuqNL"
1173 |       },
1174 |       "source": [
1175 |         "model = LogisticRegression(max_iter=1000)"
1176 |       ],
1177 |       "execution_count": null,
1178 |       "outputs": []
1179 |     },
1180 |     {
1181 |       "cell_type": "code",
1182 |       "metadata": {
1183 |         "colab": {
1184 |           "base_uri": "https://localhost:8080/"
1185 |         },
1186 |         "id": "kCdHYxGUu7XD",
1187 |         "outputId": "88a60b92-f47a-4df2-f6cc-cebe41f33ef8"
1188 |       },
1189 |       "source": [
1190 |         "# training the LogisticRegression model with Training data\n",
1191 |         "model.fit(X_train, Y_train)"
1192 |       ],
1193 |       "execution_count": null,
1194 |       "outputs": [
1195 |         {
1196 |           "output_type": "execute_result",
1197 |           "data": {
1198 |             "text/plain": [
1199 |               "LogisticRegression(max_iter=1000)"
1200 |             ]
1201 |           },
1202 |           "metadata": {},
1203 |           "execution_count": 16
1204 |         }
1205 |       ]
1206 |     },
1207 |     {
1208 |       "cell_type": "markdown",
1209 |       "metadata": {
1210 |         "id": "ZYIw8Gi9vXfU"
1211 |       },
1212 |       "source": [
1213 |         "Model Evaluation"
1214 |       ]
1215 |     },
1216 |     {
1217 |       "cell_type": "markdown",
1218 |       "metadata": {
1219 |         "id": "wmxAekfZvZa9"
1220 |       },
1221 |       "source": [
1222 |         "**Accuracy Score**"
1223 |       ]
1224 |     },
1225 |     {
1226 |       "cell_type": "code",
1227 |       "source": [
1228 |         "from sklearn.metrics import accuracy_score"
1229 |       ],
1230 |       "metadata": {
1231 |         "id": "aMMAnoWYFQY5"
1232 |       },
1233 |       "execution_count": null,
1234 |       "outputs": []
1235 |     },
1236 |     {
1237 |       "cell_type": "code",
1238 |       "metadata": {
1239 |         "id": "g19JaUTMvPKy",
1240 |         "colab": {
1241 |           "base_uri": "https://localhost:8080/"
1242 |         },
1243 |         "outputId": "bc2da15b-efbe-449e-c1c7-733b11deb097"
1244 |       },
1245 |       "source": [
1246 |         "# accuracy on training data\n",
1247 |         "X_train_prediction = model.predict(X_train)\n",
1248 |         "training_data_accuracy = accuracy_score(Y_train, X_train_prediction)\n",
1249 |         "print(training_data_accuracy)"
1250 |       ],
1251 |       "execution_count": null,
1252 |       "outputs": [
1253 |         {
1254 |           "output_type": "stream",
1255 |           "name": "stdout",
1256 |           "text": [
1257 |             "0.8553719008264463\n"
1258 |           ]
1259 |         }
1260 |       ]
1261 |     },
1262 |     {
1263 |       "cell_type": "code",
1264 |       "metadata": {
1265 |         "colab": {
1266 |           "base_uri": "https://localhost:8080/"
1267 |         },
1268 |         "id": "uQBZvBh8v7R_",
1269 |         "outputId": "fec6bfaf-83cf-4a6c-e75d-6c91cc256409"
1270 |       },
1271 |       "source": [
1272 |         "print('Accuracy on Training data : ', round(training_data_accuracy*100, 2), '%')"
1273 |       ],
1274 |       "execution_count": null,
1275 |       "outputs": [
1276 |         {
1277 |           "output_type": "stream",
1278 |           "name": "stdout",
1279 |           "text": [
1280 |             "Accuracy on Training data :  85.54 %\n"
1281 |           ]
1282 |         }
1283 |       ]
1284 |     },
1285 |     {
1286 |       "cell_type": "code",
1287 |       "metadata": {
1288 |         "id": "mDONDJdlwBIO",
1289 |         "colab": {
1290 |           "base_uri": "https://localhost:8080/"
1291 |         },
1292 |         "outputId": "4326f2ea-4f90-4b72-85dd-2d66ad9ff430"
1293 |       },
1294 |       "source": [
1295 |         "# accuracy on test data\n",
1296 |         "X_test_prediction = model.predict(X_test)\n",
1297 |         "test_data_accuracy = accuracy_score(Y_test, X_test_prediction)\n",
1298 |         "print(test_data_accuracy)"
1299 |       ],
1300 |       "execution_count": null,
1301 |       "outputs": [
1302 |         {
1303 |           "output_type": "stream",
1304 |           "name": "stdout",
1305 |           "text": [
1306 |             "0.8032786885245902\n"
1307 |           ]
1308 |         }
1309 |       ]
1310 |     },
1311 |     {
1312 |       "cell_type": "code",
1313 |       "metadata": {
1314 |         "colab": {
1315 |           "base_uri": "https://localhost:8080/"
1316 |         },
1317 |         "id": "_MBS-OqdwYpf",
1318 |         "outputId": "d001ccf6-78ae-4163-b228-e4447ca18f23"
1319 |       },
1320 |       "source": [
1321 |         "print('Accuracy on Test data : ', round(test_data_accuracy*100, 2), '%')"
1322 |       ],
1323 |       "execution_count": null,
1324 |       "outputs": [
1325 |         {
1326 |           "output_type": "stream",
1327 |           "name": "stdout",
1328 |           "text": [
1329 |             "Accuracy on Test data :  80.33 %\n"
1330 |           ]
1331 |         }
1332 |       ]
1333 |     },
1334 |     {
1335 |       "cell_type": "markdown",
1336 |       "source": [
1337 |         "**Precision**"
1338 |       ],
1339 |       "metadata": {
1340 |         "id": "FSTrUVcRZwCw"
1341 |       }
1342 |     },
1343 |     {
1344 |       "cell_type": "markdown",
1345 |       "source": [
1346 |         "Precision is the ratio of number of True Positive to the total number of Predicted Positive. It measures, out of the total predicted positive, how many are actually positive."
1347 |       ],
1348 |       "metadata": {
1349 |         "id": "UHh_Fs8FbaaD"
1350 |       }
1351 |     },
1352 |     {
1353 |       "cell_type": "code",
1354 |       "source": [
1355 |         "from sklearn.metrics import precision_score"
1356 |       ],
1357 |       "metadata": {
1358 |         "id": "ewiHzUzMTjSy"
1359 |       },
1360 |       "execution_count": null,
1361 |       "outputs": []
1362 |     },
1363 |     {
1364 |       "cell_type": "code",
1365 |       "source": [
1366 |         "# precision for training data predictions\n",
1367 |         "precision_train = precision_score(Y_train, X_train_prediction)\n",
1368 |         "print('Training data Precision =', precision_train)"
1369 |       ],
1370 |       "metadata": {
1371 |         "colab": {
1372 |           "base_uri": "https://localhost:8080/"
1373 |         },
1374 |         "id": "IgRFBRkqX3HA",
1375 |         "outputId": "9805e399-f18b-4c16-b39d-85ef4cbb4c28"
1376 |       },
1377 |       "execution_count": null,
1378 |       "outputs": [
1379 |         {
1380 |           "output_type": "stream",
1381 |           "name": "stdout",
1382 |           "text": [
1383 |             "Training data Precision = 0.8299319727891157\n"
1384 |           ]
1385 |         }
1386 |       ]
1387 |     },
1388 |     {
1389 |       "cell_type": "code",
1390 |       "source": [
1391 |         "# precision for test data predictions\n",
1392 |         "precision_test = precision_score(Y_test, X_test_prediction)\n",
1393 |         "print('Test data Precision =', precision_test)"
1394 |       ],
1395 |       "metadata": {
1396 |         "colab": {
1397 |           "base_uri": "https://localhost:8080/"
1398 |         },
1399 |         "id": "ZwHkEDrvZLVO",
1400 |         "outputId": "a31614ba-eba1-4cb1-ccee-c07f01f6b0af"
1401 |       },
1402 |       "execution_count": null,
1403 |       "outputs": [
1404 |         {
1405 |           "output_type": "stream",
1406 |           "name": "stdout",
1407 |           "text": [
1408 |             "Test data Precision = 0.8181818181818182\n"
1409 |           ]
1410 |         }
1411 |       ]
1412 |     },
1413 |     {
1414 |       "cell_type": "markdown",
1415 |       "source": [
1416 |         "**Recall**"
1417 |       ],
1418 |       "metadata": {
1419 |         "id": "w2ciOBvubQCO"
1420 |       }
1421 |     },
1422 |     {
1423 |       "cell_type": "markdown",
1424 |       "source": [
1425 |         "Recall is the ratio of number of True Positive to the total number of Actual Positive. It measures, out of the total actual positive, how many are predicted as True Positive."
1426 |       ],
1427 |       "metadata": {
1428 |         "id": "MmnuwGfibtYV"
1429 |       }
1430 |     },
1431 |     {
1432 |       "cell_type": "code",
1433 |       "source": [
1434 |         "from sklearn.metrics import recall_score"
1435 |       ],
1436 |       "metadata": {
1437 |         "id": "T5bYBiioTkwI"
1438 |       },
1439 |       "execution_count": null,
1440 |       "outputs": []
1441 |     },
1442 |     {
1443 |       "cell_type": "code",
1444 |       "source": [
1445 |         "# recall for training data predictions\n",
1446 |         "recall_train = recall_score(Y_train, X_train_prediction)\n",
1447 |         "print('Training data Recall =', recall_train)"
1448 |       ],
1449 |       "metadata": {
1450 |         "colab": {
1451 |           "base_uri": "https://localhost:8080/"
1452 |         },
1453 |         "id": "70bDi6xmZn14",
1454 |         "outputId": "f1968195-cd44-4248-c060-e9565b91185e"
1455 |       },
1456 |       "execution_count": null,
1457 |       "outputs": [
1458 |         {
1459 |           "output_type": "stream",
1460 |           "name": "stdout",
1461 |           "text": [
1462 |             "Training data Recall = 0.9242424242424242\n"
1463 |           ]
1464 |         }
1465 |       ]
1466 |     },
1467 |     {
1468 |       "cell_type": "code",
1469 |       "source": [
1470 |         "# recall for test data predictions\n",
1471 |         "recall_test = recall_score(Y_test, X_test_prediction)\n",
1472 |         "print('Test data Recall =', recall_test)"
1473 |       ],
1474 |       "metadata": {
1475 |         "colab": {
1476 |           "base_uri": "https://localhost:8080/"
1477 |         },
1478 |         "id": "ci9n7r01ZqE5",
1479 |         "outputId": "ecea1b81-89a8-402b-a2d7-9ce16bb631d3"
1480 |       },
1481 |       "execution_count": null,
1482 |       "outputs": [
1483 |         {
1484 |           "output_type": "stream",
1485 |           "name": "stdout",
1486 |           "text": [
1487 |             "Test data Recall = 0.8181818181818182\n"
1488 |           ]
1489 |         }
1490 |       ]
1491 |     },
1492 |     {
1493 |       "cell_type": "markdown",
1494 |       "source": [
1495 |         "**F1 Score**"
1496 |       ],
1497 |       "metadata": {
1498 |         "id": "MBYUgKOLck-_"
1499 |       }
1500 |     },
1501 |     {
1502 |       "cell_type": "markdown",
1503 |       "source": [
1504 |         "F1 Score is an important evaluation metric for binary classification that combines Precision & Recall. F1 Score is the harmonic mean of Precision & Recall."
1505 |       ],
1506 |       "metadata": {
1507 |         "id": "YIudfNwmgCjs"
1508 |       }
1509 |     },
1510 |     {
1511 |       "cell_type": "code",
1512 |       "source": [
1513 |         "from sklearn.metrics import f1_score"
1514 |       ],
1515 |       "metadata": {
1516 |         "id": "pP9PIZscaFm0"
1517 |       },
1518 |       "execution_count": null,
1519 |       "outputs": []
1520 |     },
1521 |     {
1522 |       "cell_type": "code",
1523 |       "source": [
1524 |         "# F1 score for training data predictions\n",
1525 |         "f1_score_train = f1_score(Y_train, X_train_prediction)\n",
1526 |         "print('Training data F1 Score =', f1_score_train)"
1527 |       ],
1528 |       "metadata": {
1529 |         "colab": {
1530 |           "base_uri": "https://localhost:8080/"
1531 |         },
1532 |         "outputId": "04695f71-0f67-425c-cca9-2a618ecc43f5",
1533 |         "id": "oHwExAAtaFm8"
1534 |       },
1535 |       "execution_count": null,
1536 |       "outputs": [
1537 |         {
1538 |           "output_type": "stream",
1539 |           "name": "stdout",
1540 |           "text": [
1541 |             "Training data F1 Score = 0.8745519713261649\n"
1542 |           ]
1543 |         }
1544 |       ]
1545 |     },
1546 |     {
1547 |       "cell_type": "code",
1548 |       "source": [
1549 |         "# F1 Score for test data predictions\n",
1550 |         "f1_score_test = recall_score(Y_test, X_test_prediction)\n",
1551 |         "print('Test data F1 Score =', f1_score_test)"
1552 |       ],
1553 |       "metadata": {
1554 |         "colab": {
1555 |           "base_uri": "https://localhost:8080/"
1556 |         },
1557 |         "outputId": "13266b05-9f52-41d2-ee43-ba7b3b138809",
1558 |         "id": "n628BUyvaFm9"
1559 |       },
1560 |       "execution_count": null,
1561 |       "outputs": [
1562 |         {
1563 |           "output_type": "stream",
1564 |           "name": "stdout",
1565 |           "text": [
1566 |             "Test data F1 Score = 0.8181818181818182\n"
1567 |           ]
1568 |         }
1569 |       ]
1570 |     },
1571 |     {
1572 |       "cell_type": "markdown",
1573 |       "source": [
1574 |         "**Precision, Recall, & F1 Score - function**"
1575 |       ],
1576 |       "metadata": {
1577 |         "id": "5tH0z-JUa76n"
1578 |       }
1579 |     },
1580 |     {
1581 |       "cell_type": "code",
1582 |       "source": [
1583 |         "def precision_recall_f1_score(true_labels, pred_labels):\n",
1584 |         "\n",
1585 |         "  precision_value = precision_score(true_labels, pred_labels)\n",
1586 |         "  recall_value = recall_score(true_labels, pred_labels)\n",
1587 |         "  f1_score_value = f1_score(true_labels, pred_labels)\n",
1588 |         "\n",
1589 |         "  print('Precision =',precision_value)\n",
1590 |         "  print('Recall =',recall_value)\n",
1591 |         "  print('F1 Score =',f1_score_value)"
1592 |       ],
1593 |       "metadata": {
1594 |         "id": "xGPnMqsdfMay"
1595 |       },
1596 |       "execution_count": null,
1597 |       "outputs": []
1598 |     },
1599 |     {
1600 |       "cell_type": "code",
1601 |       "source": [
1602 |         "# classification metrics for training data\n",
1603 |         "precision_recall_f1_score(Y_train, X_train_prediction)"
1604 |       ],
1605 |       "metadata": {
1606 |         "colab": {
1607 |           "base_uri": "https://localhost:8080/"
1608 |         },
1609 |         "id": "hTOAPCDEb5FB",
1610 |         "outputId": "dc71c805-de04-4e54-ea1d-3a642853c35f"
1611 |       },
1612 |       "execution_count": null,
1613 |       "outputs": [
1614 |         {
1615 |           "output_type": "stream",
1616 |           "name": "stdout",
1617 |           "text": [
1618 |             "Precision = 0.8299319727891157\n",
1619 |             "Recall = 0.9242424242424242\n",
1620 |             "F1 Score = 0.8745519713261649\n"
1621 |           ]
1622 |         }
1623 |       ]
1624 |     },
1625 |     {
1626 |       "cell_type": "code",
1627 |       "source": [
1628 |         "# classification metrics for test data\n",
1629 |         "precision_recall_f1_score(Y_test, X_test_prediction)"
1630 |       ],
1631 |       "metadata": {
1632 |         "colab": {
1633 |           "base_uri": "https://localhost:8080/"
1634 |         },
1635 |         "id": "kr20IWwicIdq",
1636 |         "outputId": "e400f2fc-9b8f-4728-f2db-2a22deb9e650"
1637 |       },
1638 |       "execution_count": null,
1639 |       "outputs": [
1640 |         {
1641 |           "output_type": "stream",
1642 |           "name": "stdout",
1643 |           "text": [
1644 |             "Precision = 0.8181818181818182\n",
1645 |             "Recall = 0.8181818181818182\n",
1646 |             "F1 Score = 0.8181818181818182\n"
1647 |           ]
1648 |         }
1649 |       ]
1650 |     },
1651 |     {
1652 |       "cell_type": "code",
1653 |       "source": [],
1654 |       "metadata": {
1655 |         "id": "W6gtqxPkcR01"
1656 |       },
1657 |       "execution_count": null,
1658 |       "outputs": []
1659 |     }
1660 |   ]
1661 | }


--------------------------------------------------------------------------------
/Accuracy_score_and_Confusion_Matrix.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |   "nbformat": 4,
   3 |   "nbformat_minor": 0,
   4 |   "metadata": {
   5 |     "colab": {
   6 |       "provenance": [],
   7 |       "collapsed_sections": []
   8 |     },
   9 |     "kernelspec": {
  10 |       "name": "python3",
  11 |       "display_name": "Python 3"
  12 |     },
  13 |     "language_info": {
  14 |       "name": "python"
  15 |     }
  16 |   },
  17 |   "cells": [
  18 |     {
  19 |       "cell_type": "markdown",
  20 |       "metadata": {
  21 |         "id": "aTb-9TFFqprC"
  22 |       },
  23 |       "source": [
  24 |         "Importing the Dependencies"
  25 |       ]
  26 |     },
  27 |     {
  28 |       "cell_type": "code",
  29 |       "metadata": {
  30 |         "id": "3q9U3S_whh3-"
  31 |       },
  32 |       "source": [
  33 |         "import numpy as np\n",
  34 |         "import pandas as pd\n",
  35 |         "from sklearn.model_selection import train_test_split\n",
  36 |         "from sklearn.linear_model import LogisticRegression"
  37 |       ],
  38 |       "execution_count": null,
  39 |       "outputs": []
  40 |     },
  41 |     {
  42 |       "cell_type": "markdown",
  43 |       "metadata": {
  44 |         "id": "egMd5zeurTMR"
  45 |       },
  46 |       "source": [
  47 |         "Data Collection and Processing"
  48 |       ]
  49 |     },
  50 |     {
  51 |       "cell_type": "code",
  52 |       "metadata": {
  53 |         "id": "0q-3-LkQrREV"
  54 |       },
  55 |       "source": [
  56 |         "# loading the csv data to a Pandas DataFrame\n",
  57 |         "heart_data = pd.read_csv('heart.csv')"
  58 |       ],
  59 |       "execution_count": null,
  60 |       "outputs": []
  61 |     },
  62 |     {
  63 |       "cell_type": "code",
  64 |       "metadata": {
  65 |         "colab": {
  66 |           "base_uri": "https://localhost:8080/",
  67 |           "height": 206
  68 |         },
  69 |         "id": "M8dQxSTqriWD",
  70 |         "outputId": "d603ff60-b730-4e5f-dc02-834978b234d9"
  71 |       },
  72 |       "source": [
  73 |         "# print first 5 rows of the dataset\n",
  74 |         "heart_data.head()"
  75 |       ],
  76 |       "execution_count": null,
  77 |       "outputs": [
  78 |         {
  79 |           "output_type": "execute_result",
  80 |           "data": {
  81 |             "text/plain": [
  82 |               "   age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  slope  \\\n",
  83 |               "0   63    1   3       145   233    1        0      150      0      2.3      0   \n",
  84 |               "1   37    1   2       130   250    0        1      187      0      3.5      0   \n",
  85 |               "2   41    0   1       130   204    0        0      172      0      1.4      2   \n",
  86 |               "3   56    1   1       120   236    0        1      178      0      0.8      2   \n",
  87 |               "4   57    0   0       120   354    0        1      163      1      0.6      2   \n",
  88 |               "\n",
  89 |               "   ca  thal  target  \n",
  90 |               "0   0     1       1  \n",
  91 |               "1   0     2       1  \n",
  92 |               "2   0     2       1  \n",
  93 |               "3   0     2       1  \n",
  94 |               "4   0     2       1  "
  95 |             ],
  96 |             "text/html": [
  97 |               "\n",
  98 |               "  <div id=\"df-67f741c9-b9e0-491b-9ec0-56197b51236d\">\n",
  99 |               "    <div class=\"colab-df-container\">\n",
 100 |               "      <div>\n",
 101 |               "<style scoped>\n",
 102 |               "    .dataframe tbody tr th:only-of-type {\n",
 103 |               "        vertical-align: middle;\n",
 104 |               "    }\n",
 105 |               "\n",
 106 |               "    .dataframe tbody tr th {\n",
 107 |               "        vertical-align: top;\n",
 108 |               "    }\n",
 109 |               "\n",
 110 |               "    .dataframe thead th {\n",
 111 |               "        text-align: right;\n",
 112 |               "    }\n",
 113 |               "</style>\n",
 114 |               "<table border=\"1\" class=\"dataframe\">\n",
 115 |               "  <thead>\n",
 116 |               "    <tr style=\"text-align: right;\">\n",
 117 |               "      <th></th>\n",
 118 |               "      <th>age</th>\n",
 119 |               "      <th>sex</th>\n",
 120 |               "      <th>cp</th>\n",
 121 |               "      <th>trestbps</th>\n",
 122 |               "      <th>chol</th>\n",
 123 |               "      <th>fbs</th>\n",
 124 |               "      <th>restecg</th>\n",
 125 |               "      <th>thalach</th>\n",
 126 |               "      <th>exang</th>\n",
 127 |               "      <th>oldpeak</th>\n",
 128 |               "      <th>slope</th>\n",
 129 |               "      <th>ca</th>\n",
 130 |               "      <th>thal</th>\n",
 131 |               "      <th>target</th>\n",
 132 |               "    </tr>\n",
 133 |               "  </thead>\n",
 134 |               "  <tbody>\n",
 135 |               "    <tr>\n",
 136 |               "      <th>0</th>\n",
 137 |               "      <td>63</td>\n",
 138 |               "      <td>1</td>\n",
 139 |               "      <td>3</td>\n",
 140 |               "      <td>145</td>\n",
 141 |               "      <td>233</td>\n",
 142 |               "      <td>1</td>\n",
 143 |               "      <td>0</td>\n",
 144 |               "      <td>150</td>\n",
 145 |               "      <td>0</td>\n",
 146 |               "      <td>2.3</td>\n",
 147 |               "      <td>0</td>\n",
 148 |               "      <td>0</td>\n",
 149 |               "      <td>1</td>\n",
 150 |               "      <td>1</td>\n",
 151 |               "    </tr>\n",
 152 |               "    <tr>\n",
 153 |               "      <th>1</th>\n",
 154 |               "      <td>37</td>\n",
 155 |               "      <td>1</td>\n",
 156 |               "      <td>2</td>\n",
 157 |               "      <td>130</td>\n",
 158 |               "      <td>250</td>\n",
 159 |               "      <td>0</td>\n",
 160 |               "      <td>1</td>\n",
 161 |               "      <td>187</td>\n",
 162 |               "      <td>0</td>\n",
 163 |               "      <td>3.5</td>\n",
 164 |               "      <td>0</td>\n",
 165 |               "      <td>0</td>\n",
 166 |               "      <td>2</td>\n",
 167 |               "      <td>1</td>\n",
 168 |               "    </tr>\n",
 169 |               "    <tr>\n",
 170 |               "      <th>2</th>\n",
 171 |               "      <td>41</td>\n",
 172 |               "      <td>0</td>\n",
 173 |               "      <td>1</td>\n",
 174 |               "      <td>130</td>\n",
 175 |               "      <td>204</td>\n",
 176 |               "      <td>0</td>\n",
 177 |               "      <td>0</td>\n",
 178 |               "      <td>172</td>\n",
 179 |               "      <td>0</td>\n",
 180 |               "      <td>1.4</td>\n",
 181 |               "      <td>2</td>\n",
 182 |               "      <td>0</td>\n",
 183 |               "      <td>2</td>\n",
 184 |               "      <td>1</td>\n",
 185 |               "    </tr>\n",
 186 |               "    <tr>\n",
 187 |               "      <th>3</th>\n",
 188 |               "      <td>56</td>\n",
 189 |               "      <td>1</td>\n",
 190 |               "      <td>1</td>\n",
 191 |               "      <td>120</td>\n",
 192 |               "      <td>236</td>\n",
 193 |               "      <td>0</td>\n",
 194 |               "      <td>1</td>\n",
 195 |               "      <td>178</td>\n",
 196 |               "      <td>0</td>\n",
 197 |               "      <td>0.8</td>\n",
 198 |               "      <td>2</td>\n",
 199 |               "      <td>0</td>\n",
 200 |               "      <td>2</td>\n",
 201 |               "      <td>1</td>\n",
 202 |               "    </tr>\n",
 203 |               "    <tr>\n",
 204 |               "      <th>4</th>\n",
 205 |               "      <td>57</td>\n",
 206 |               "      <td>0</td>\n",
 207 |               "      <td>0</td>\n",
 208 |               "      <td>120</td>\n",
 209 |               "      <td>354</td>\n",
 210 |               "      <td>0</td>\n",
 211 |               "      <td>1</td>\n",
 212 |               "      <td>163</td>\n",
 213 |               "      <td>1</td>\n",
 214 |               "      <td>0.6</td>\n",
 215 |               "      <td>2</td>\n",
 216 |               "      <td>0</td>\n",
 217 |               "      <td>2</td>\n",
 218 |               "      <td>1</td>\n",
 219 |               "    </tr>\n",
 220 |               "  </tbody>\n",
 221 |               "</table>\n",
 222 |               "</div>\n",
 223 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-67f741c9-b9e0-491b-9ec0-56197b51236d')\"\n",
 224 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
 225 |               "              style=\"display:none;\">\n",
 226 |               "        \n",
 227 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
 228 |               "       width=\"24px\">\n",
 229 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
 230 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
 231 |               "  </svg>\n",
 232 |               "      </button>\n",
 233 |               "      \n",
 234 |               "  <style>\n",
 235 |               "    .colab-df-container {\n",
 236 |               "      display:flex;\n",
 237 |               "      flex-wrap:wrap;\n",
 238 |               "      gap: 12px;\n",
 239 |               "    }\n",
 240 |               "\n",
 241 |               "    .colab-df-convert {\n",
 242 |               "      background-color: #E8F0FE;\n",
 243 |               "      border: none;\n",
 244 |               "      border-radius: 50%;\n",
 245 |               "      cursor: pointer;\n",
 246 |               "      display: none;\n",
 247 |               "      fill: #1967D2;\n",
 248 |               "      height: 32px;\n",
 249 |               "      padding: 0 0 0 0;\n",
 250 |               "      width: 32px;\n",
 251 |               "    }\n",
 252 |               "\n",
 253 |               "    .colab-df-convert:hover {\n",
 254 |               "      background-color: #E2EBFA;\n",
 255 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
 256 |               "      fill: #174EA6;\n",
 257 |               "    }\n",
 258 |               "\n",
 259 |               "    [theme=dark] .colab-df-convert {\n",
 260 |               "      background-color: #3B4455;\n",
 261 |               "      fill: #D2E3FC;\n",
 262 |               "    }\n",
 263 |               "\n",
 264 |               "    [theme=dark] .colab-df-convert:hover {\n",
 265 |               "      background-color: #434B5C;\n",
 266 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
 267 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
 268 |               "      fill: #FFFFFF;\n",
 269 |               "    }\n",
 270 |               "  </style>\n",
 271 |               "\n",
 272 |               "      <script>\n",
 273 |               "        const buttonEl =\n",
 274 |               "          document.querySelector('#df-67f741c9-b9e0-491b-9ec0-56197b51236d button.colab-df-convert');\n",
 275 |               "        buttonEl.style.display =\n",
 276 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
 277 |               "\n",
 278 |               "        async function convertToInteractive(key) {\n",
 279 |               "          const element = document.querySelector('#df-67f741c9-b9e0-491b-9ec0-56197b51236d');\n",
 280 |               "          const dataTable =\n",
 281 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
 282 |               "                                                     [key], {});\n",
 283 |               "          if (!dataTable) return;\n",
 284 |               "\n",
 285 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
 286 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
 287 |               "            + ' to learn more about interactive tables.';\n",
 288 |               "          element.innerHTML = '';\n",
 289 |               "          dataTable['output_type'] = 'display_data';\n",
 290 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
 291 |               "          const docLink = document.createElement('div');\n",
 292 |               "          docLink.innerHTML = docLinkHtml;\n",
 293 |               "          element.appendChild(docLink);\n",
 294 |               "        }\n",
 295 |               "      </script>\n",
 296 |               "    </div>\n",
 297 |               "  </div>\n",
 298 |               "  "
 299 |             ]
 300 |           },
 301 |           "metadata": {},
 302 |           "execution_count": 3
 303 |         }
 304 |       ]
 305 |     },
 306 |     {
 307 |       "cell_type": "code",
 308 |       "metadata": {
 309 |         "colab": {
 310 |           "base_uri": "https://localhost:8080/",
 311 |           "height": 206
 312 |         },
 313 |         "id": "Fx_aCZDgrqdR",
 314 |         "outputId": "cf89729f-96e1-4087-b473-d164e0583a3b"
 315 |       },
 316 |       "source": [
 317 |         "# print last 5 rows of the dataset\n",
 318 |         "heart_data.tail()"
 319 |       ],
 320 |       "execution_count": null,
 321 |       "outputs": [
 322 |         {
 323 |           "output_type": "execute_result",
 324 |           "data": {
 325 |             "text/plain": [
 326 |               "     age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  \\\n",
 327 |               "298   57    0   0       140   241    0        1      123      1      0.2   \n",
 328 |               "299   45    1   3       110   264    0        1      132      0      1.2   \n",
 329 |               "300   68    1   0       144   193    1        1      141      0      3.4   \n",
 330 |               "301   57    1   0       130   131    0        1      115      1      1.2   \n",
 331 |               "302   57    0   1       130   236    0        0      174      0      0.0   \n",
 332 |               "\n",
 333 |               "     slope  ca  thal  target  \n",
 334 |               "298      1   0     3       0  \n",
 335 |               "299      1   0     3       0  \n",
 336 |               "300      1   2     3       0  \n",
 337 |               "301      1   1     3       0  \n",
 338 |               "302      1   1     2       0  "
 339 |             ],
 340 |             "text/html": [
 341 |               "\n",
 342 |               "  <div id=\"df-59b6fe1f-52ca-45c1-abbc-21d16e825dd9\">\n",
 343 |               "    <div class=\"colab-df-container\">\n",
 344 |               "      <div>\n",
 345 |               "<style scoped>\n",
 346 |               "    .dataframe tbody tr th:only-of-type {\n",
 347 |               "        vertical-align: middle;\n",
 348 |               "    }\n",
 349 |               "\n",
 350 |               "    .dataframe tbody tr th {\n",
 351 |               "        vertical-align: top;\n",
 352 |               "    }\n",
 353 |               "\n",
 354 |               "    .dataframe thead th {\n",
 355 |               "        text-align: right;\n",
 356 |               "    }\n",
 357 |               "</style>\n",
 358 |               "<table border=\"1\" class=\"dataframe\">\n",
 359 |               "  <thead>\n",
 360 |               "    <tr style=\"text-align: right;\">\n",
 361 |               "      <th></th>\n",
 362 |               "      <th>age</th>\n",
 363 |               "      <th>sex</th>\n",
 364 |               "      <th>cp</th>\n",
 365 |               "      <th>trestbps</th>\n",
 366 |               "      <th>chol</th>\n",
 367 |               "      <th>fbs</th>\n",
 368 |               "      <th>restecg</th>\n",
 369 |               "      <th>thalach</th>\n",
 370 |               "      <th>exang</th>\n",
 371 |               "      <th>oldpeak</th>\n",
 372 |               "      <th>slope</th>\n",
 373 |               "      <th>ca</th>\n",
 374 |               "      <th>thal</th>\n",
 375 |               "      <th>target</th>\n",
 376 |               "    </tr>\n",
 377 |               "  </thead>\n",
 378 |               "  <tbody>\n",
 379 |               "    <tr>\n",
 380 |               "      <th>298</th>\n",
 381 |               "      <td>57</td>\n",
 382 |               "      <td>0</td>\n",
 383 |               "      <td>0</td>\n",
 384 |               "      <td>140</td>\n",
 385 |               "      <td>241</td>\n",
 386 |               "      <td>0</td>\n",
 387 |               "      <td>1</td>\n",
 388 |               "      <td>123</td>\n",
 389 |               "      <td>1</td>\n",
 390 |               "      <td>0.2</td>\n",
 391 |               "      <td>1</td>\n",
 392 |               "      <td>0</td>\n",
 393 |               "      <td>3</td>\n",
 394 |               "      <td>0</td>\n",
 395 |               "    </tr>\n",
 396 |               "    <tr>\n",
 397 |               "      <th>299</th>\n",
 398 |               "      <td>45</td>\n",
 399 |               "      <td>1</td>\n",
 400 |               "      <td>3</td>\n",
 401 |               "      <td>110</td>\n",
 402 |               "      <td>264</td>\n",
 403 |               "      <td>0</td>\n",
 404 |               "      <td>1</td>\n",
 405 |               "      <td>132</td>\n",
 406 |               "      <td>0</td>\n",
 407 |               "      <td>1.2</td>\n",
 408 |               "      <td>1</td>\n",
 409 |               "      <td>0</td>\n",
 410 |               "      <td>3</td>\n",
 411 |               "      <td>0</td>\n",
 412 |               "    </tr>\n",
 413 |               "    <tr>\n",
 414 |               "      <th>300</th>\n",
 415 |               "      <td>68</td>\n",
 416 |               "      <td>1</td>\n",
 417 |               "      <td>0</td>\n",
 418 |               "      <td>144</td>\n",
 419 |               "      <td>193</td>\n",
 420 |               "      <td>1</td>\n",
 421 |               "      <td>1</td>\n",
 422 |               "      <td>141</td>\n",
 423 |               "      <td>0</td>\n",
 424 |               "      <td>3.4</td>\n",
 425 |               "      <td>1</td>\n",
 426 |               "      <td>2</td>\n",
 427 |               "      <td>3</td>\n",
 428 |               "      <td>0</td>\n",
 429 |               "    </tr>\n",
 430 |               "    <tr>\n",
 431 |               "      <th>301</th>\n",
 432 |               "      <td>57</td>\n",
 433 |               "      <td>1</td>\n",
 434 |               "      <td>0</td>\n",
 435 |               "      <td>130</td>\n",
 436 |               "      <td>131</td>\n",
 437 |               "      <td>0</td>\n",
 438 |               "      <td>1</td>\n",
 439 |               "      <td>115</td>\n",
 440 |               "      <td>1</td>\n",
 441 |               "      <td>1.2</td>\n",
 442 |               "      <td>1</td>\n",
 443 |               "      <td>1</td>\n",
 444 |               "      <td>3</td>\n",
 445 |               "      <td>0</td>\n",
 446 |               "    </tr>\n",
 447 |               "    <tr>\n",
 448 |               "      <th>302</th>\n",
 449 |               "      <td>57</td>\n",
 450 |               "      <td>0</td>\n",
 451 |               "      <td>1</td>\n",
 452 |               "      <td>130</td>\n",
 453 |               "      <td>236</td>\n",
 454 |               "      <td>0</td>\n",
 455 |               "      <td>0</td>\n",
 456 |               "      <td>174</td>\n",
 457 |               "      <td>0</td>\n",
 458 |               "      <td>0.0</td>\n",
 459 |               "      <td>1</td>\n",
 460 |               "      <td>1</td>\n",
 461 |               "      <td>2</td>\n",
 462 |               "      <td>0</td>\n",
 463 |               "    </tr>\n",
 464 |               "  </tbody>\n",
 465 |               "</table>\n",
 466 |               "</div>\n",
 467 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-59b6fe1f-52ca-45c1-abbc-21d16e825dd9')\"\n",
 468 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
 469 |               "              style=\"display:none;\">\n",
 470 |               "        \n",
 471 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
 472 |               "       width=\"24px\">\n",
 473 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
 474 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
 475 |               "  </svg>\n",
 476 |               "      </button>\n",
 477 |               "      \n",
 478 |               "  <style>\n",
 479 |               "    .colab-df-container {\n",
 480 |               "      display:flex;\n",
 481 |               "      flex-wrap:wrap;\n",
 482 |               "      gap: 12px;\n",
 483 |               "    }\n",
 484 |               "\n",
 485 |               "    .colab-df-convert {\n",
 486 |               "      background-color: #E8F0FE;\n",
 487 |               "      border: none;\n",
 488 |               "      border-radius: 50%;\n",
 489 |               "      cursor: pointer;\n",
 490 |               "      display: none;\n",
 491 |               "      fill: #1967D2;\n",
 492 |               "      height: 32px;\n",
 493 |               "      padding: 0 0 0 0;\n",
 494 |               "      width: 32px;\n",
 495 |               "    }\n",
 496 |               "\n",
 497 |               "    .colab-df-convert:hover {\n",
 498 |               "      background-color: #E2EBFA;\n",
 499 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
 500 |               "      fill: #174EA6;\n",
 501 |               "    }\n",
 502 |               "\n",
 503 |               "    [theme=dark] .colab-df-convert {\n",
 504 |               "      background-color: #3B4455;\n",
 505 |               "      fill: #D2E3FC;\n",
 506 |               "    }\n",
 507 |               "\n",
 508 |               "    [theme=dark] .colab-df-convert:hover {\n",
 509 |               "      background-color: #434B5C;\n",
 510 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
 511 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
 512 |               "      fill: #FFFFFF;\n",
 513 |               "    }\n",
 514 |               "  </style>\n",
 515 |               "\n",
 516 |               "      <script>\n",
 517 |               "        const buttonEl =\n",
 518 |               "          document.querySelector('#df-59b6fe1f-52ca-45c1-abbc-21d16e825dd9 button.colab-df-convert');\n",
 519 |               "        buttonEl.style.display =\n",
 520 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
 521 |               "\n",
 522 |               "        async function convertToInteractive(key) {\n",
 523 |               "          const element = document.querySelector('#df-59b6fe1f-52ca-45c1-abbc-21d16e825dd9');\n",
 524 |               "          const dataTable =\n",
 525 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
 526 |               "                                                     [key], {});\n",
 527 |               "          if (!dataTable) return;\n",
 528 |               "\n",
 529 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
 530 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
 531 |               "            + ' to learn more about interactive tables.';\n",
 532 |               "          element.innerHTML = '';\n",
 533 |               "          dataTable['output_type'] = 'display_data';\n",
 534 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
 535 |               "          const docLink = document.createElement('div');\n",
 536 |               "          docLink.innerHTML = docLinkHtml;\n",
 537 |               "          element.appendChild(docLink);\n",
 538 |               "        }\n",
 539 |               "      </script>\n",
 540 |               "    </div>\n",
 541 |               "  </div>\n",
 542 |               "  "
 543 |             ]
 544 |           },
 545 |           "metadata": {},
 546 |           "execution_count": 4
 547 |         }
 548 |       ]
 549 |     },
 550 |     {
 551 |       "cell_type": "code",
 552 |       "metadata": {
 553 |         "colab": {
 554 |           "base_uri": "https://localhost:8080/"
 555 |         },
 556 |         "id": "8nX1tIzbrz0u",
 557 |         "outputId": "56f1381e-f062-447b-8507-7aaad7be906f"
 558 |       },
 559 |       "source": [
 560 |         "# number of rows and columns in the dataset\n",
 561 |         "heart_data.shape"
 562 |       ],
 563 |       "execution_count": null,
 564 |       "outputs": [
 565 |         {
 566 |           "output_type": "execute_result",
 567 |           "data": {
 568 |             "text/plain": [
 569 |               "(303, 14)"
 570 |             ]
 571 |           },
 572 |           "metadata": {},
 573 |           "execution_count": 5
 574 |         }
 575 |       ]
 576 |     },
 577 |     {
 578 |       "cell_type": "code",
 579 |       "metadata": {
 580 |         "colab": {
 581 |           "base_uri": "https://localhost:8080/"
 582 |         },
 583 |         "id": "7_xTcw1Sr6aJ",
 584 |         "outputId": "02954844-fd60-407f-8bae-1f1fe73ffa16"
 585 |       },
 586 |       "source": [
 587 |         "# getting some info about the data\n",
 588 |         "heart_data.info()"
 589 |       ],
 590 |       "execution_count": null,
 591 |       "outputs": [
 592 |         {
 593 |           "output_type": "stream",
 594 |           "name": "stdout",
 595 |           "text": [
 596 |             "<class 'pandas.core.frame.DataFrame'>\n",
 597 |             "RangeIndex: 303 entries, 0 to 302\n",
 598 |             "Data columns (total 14 columns):\n",
 599 |             " #   Column    Non-Null Count  Dtype  \n",
 600 |             "---  ------    --------------  -----  \n",
 601 |             " 0   age       303 non-null    int64  \n",
 602 |             " 1   sex       303 non-null    int64  \n",
 603 |             " 2   cp        303 non-null    int64  \n",
 604 |             " 3   trestbps  303 non-null    int64  \n",
 605 |             " 4   chol      303 non-null    int64  \n",
 606 |             " 5   fbs       303 non-null    int64  \n",
 607 |             " 6   restecg   303 non-null    int64  \n",
 608 |             " 7   thalach   303 non-null    int64  \n",
 609 |             " 8   exang     303 non-null    int64  \n",
 610 |             " 9   oldpeak   303 non-null    float64\n",
 611 |             " 10  slope     303 non-null    int64  \n",
 612 |             " 11  ca        303 non-null    int64  \n",
 613 |             " 12  thal      303 non-null    int64  \n",
 614 |             " 13  target    303 non-null    int64  \n",
 615 |             "dtypes: float64(1), int64(13)\n",
 616 |             "memory usage: 33.3 KB\n"
 617 |           ]
 618 |         }
 619 |       ]
 620 |     },
 621 |     {
 622 |       "cell_type": "code",
 623 |       "metadata": {
 624 |         "colab": {
 625 |           "base_uri": "https://localhost:8080/"
 626 |         },
 627 |         "id": "GjHtW31rsGlb",
 628 |         "outputId": "d1edce51-05e9-44aa-8d5f-b266fee0b634"
 629 |       },
 630 |       "source": [
 631 |         "# checking for missing values\n",
 632 |         "heart_data.isnull().sum()"
 633 |       ],
 634 |       "execution_count": null,
 635 |       "outputs": [
 636 |         {
 637 |           "output_type": "execute_result",
 638 |           "data": {
 639 |             "text/plain": [
 640 |               "age         0\n",
 641 |               "sex         0\n",
 642 |               "cp          0\n",
 643 |               "trestbps    0\n",
 644 |               "chol        0\n",
 645 |               "fbs         0\n",
 646 |               "restecg     0\n",
 647 |               "thalach     0\n",
 648 |               "exang       0\n",
 649 |               "oldpeak     0\n",
 650 |               "slope       0\n",
 651 |               "ca          0\n",
 652 |               "thal        0\n",
 653 |               "target      0\n",
 654 |               "dtype: int64"
 655 |             ]
 656 |           },
 657 |           "metadata": {},
 658 |           "execution_count": 7
 659 |         }
 660 |       ]
 661 |     },
 662 |     {
 663 |       "cell_type": "code",
 664 |       "metadata": {
 665 |         "colab": {
 666 |           "base_uri": "https://localhost:8080/",
 667 |           "height": 364
 668 |         },
 669 |         "id": "OHmcP7DJsSEP",
 670 |         "outputId": "04cf61ff-fd64-4211-b575-6d49d5e566ff"
 671 |       },
 672 |       "source": [
 673 |         "# statistical measures about the data\n",
 674 |         "heart_data.describe()"
 675 |       ],
 676 |       "execution_count": null,
 677 |       "outputs": [
 678 |         {
 679 |           "output_type": "execute_result",
 680 |           "data": {
 681 |             "text/plain": [
 682 |               "              age         sex          cp    trestbps        chol         fbs  \\\n",
 683 |               "count  303.000000  303.000000  303.000000  303.000000  303.000000  303.000000   \n",
 684 |               "mean    54.366337    0.683168    0.966997  131.623762  246.264026    0.148515   \n",
 685 |               "std      9.082101    0.466011    1.032052   17.538143   51.830751    0.356198   \n",
 686 |               "min     29.000000    0.000000    0.000000   94.000000  126.000000    0.000000   \n",
 687 |               "25%     47.500000    0.000000    0.000000  120.000000  211.000000    0.000000   \n",
 688 |               "50%     55.000000    1.000000    1.000000  130.000000  240.000000    0.000000   \n",
 689 |               "75%     61.000000    1.000000    2.000000  140.000000  274.500000    0.000000   \n",
 690 |               "max     77.000000    1.000000    3.000000  200.000000  564.000000    1.000000   \n",
 691 |               "\n",
 692 |               "          restecg     thalach       exang     oldpeak       slope          ca  \\\n",
 693 |               "count  303.000000  303.000000  303.000000  303.000000  303.000000  303.000000   \n",
 694 |               "mean     0.528053  149.646865    0.326733    1.039604    1.399340    0.729373   \n",
 695 |               "std      0.525860   22.905161    0.469794    1.161075    0.616226    1.022606   \n",
 696 |               "min      0.000000   71.000000    0.000000    0.000000    0.000000    0.000000   \n",
 697 |               "25%      0.000000  133.500000    0.000000    0.000000    1.000000    0.000000   \n",
 698 |               "50%      1.000000  153.000000    0.000000    0.800000    1.000000    0.000000   \n",
 699 |               "75%      1.000000  166.000000    1.000000    1.600000    2.000000    1.000000   \n",
 700 |               "max      2.000000  202.000000    1.000000    6.200000    2.000000    4.000000   \n",
 701 |               "\n",
 702 |               "             thal      target  \n",
 703 |               "count  303.000000  303.000000  \n",
 704 |               "mean     2.313531    0.544554  \n",
 705 |               "std      0.612277    0.498835  \n",
 706 |               "min      0.000000    0.000000  \n",
 707 |               "25%      2.000000    0.000000  \n",
 708 |               "50%      2.000000    1.000000  \n",
 709 |               "75%      3.000000    1.000000  \n",
 710 |               "max      3.000000    1.000000  "
 711 |             ],
 712 |             "text/html": [
 713 |               "\n",
 714 |               "  <div id=\"df-cfc372bc-b811-4f6f-8396-95a5eae48508\">\n",
 715 |               "    <div class=\"colab-df-container\">\n",
 716 |               "      <div>\n",
 717 |               "<style scoped>\n",
 718 |               "    .dataframe tbody tr th:only-of-type {\n",
 719 |               "        vertical-align: middle;\n",
 720 |               "    }\n",
 721 |               "\n",
 722 |               "    .dataframe tbody tr th {\n",
 723 |               "        vertical-align: top;\n",
 724 |               "    }\n",
 725 |               "\n",
 726 |               "    .dataframe thead th {\n",
 727 |               "        text-align: right;\n",
 728 |               "    }\n",
 729 |               "</style>\n",
 730 |               "<table border=\"1\" class=\"dataframe\">\n",
 731 |               "  <thead>\n",
 732 |               "    <tr style=\"text-align: right;\">\n",
 733 |               "      <th></th>\n",
 734 |               "      <th>age</th>\n",
 735 |               "      <th>sex</th>\n",
 736 |               "      <th>cp</th>\n",
 737 |               "      <th>trestbps</th>\n",
 738 |               "      <th>chol</th>\n",
 739 |               "      <th>fbs</th>\n",
 740 |               "      <th>restecg</th>\n",
 741 |               "      <th>thalach</th>\n",
 742 |               "      <th>exang</th>\n",
 743 |               "      <th>oldpeak</th>\n",
 744 |               "      <th>slope</th>\n",
 745 |               "      <th>ca</th>\n",
 746 |               "      <th>thal</th>\n",
 747 |               "      <th>target</th>\n",
 748 |               "    </tr>\n",
 749 |               "  </thead>\n",
 750 |               "  <tbody>\n",
 751 |               "    <tr>\n",
 752 |               "      <th>count</th>\n",
 753 |               "      <td>303.000000</td>\n",
 754 |               "      <td>303.000000</td>\n",
 755 |               "      <td>303.000000</td>\n",
 756 |               "      <td>303.000000</td>\n",
 757 |               "      <td>303.000000</td>\n",
 758 |               "      <td>303.000000</td>\n",
 759 |               "      <td>303.000000</td>\n",
 760 |               "      <td>303.000000</td>\n",
 761 |               "      <td>303.000000</td>\n",
 762 |               "      <td>303.000000</td>\n",
 763 |               "      <td>303.000000</td>\n",
 764 |               "      <td>303.000000</td>\n",
 765 |               "      <td>303.000000</td>\n",
 766 |               "      <td>303.000000</td>\n",
 767 |               "    </tr>\n",
 768 |               "    <tr>\n",
 769 |               "      <th>mean</th>\n",
 770 |               "      <td>54.366337</td>\n",
 771 |               "      <td>0.683168</td>\n",
 772 |               "      <td>0.966997</td>\n",
 773 |               "      <td>131.623762</td>\n",
 774 |               "      <td>246.264026</td>\n",
 775 |               "      <td>0.148515</td>\n",
 776 |               "      <td>0.528053</td>\n",
 777 |               "      <td>149.646865</td>\n",
 778 |               "      <td>0.326733</td>\n",
 779 |               "      <td>1.039604</td>\n",
 780 |               "      <td>1.399340</td>\n",
 781 |               "      <td>0.729373</td>\n",
 782 |               "      <td>2.313531</td>\n",
 783 |               "      <td>0.544554</td>\n",
 784 |               "    </tr>\n",
 785 |               "    <tr>\n",
 786 |               "      <th>std</th>\n",
 787 |               "      <td>9.082101</td>\n",
 788 |               "      <td>0.466011</td>\n",
 789 |               "      <td>1.032052</td>\n",
 790 |               "      <td>17.538143</td>\n",
 791 |               "      <td>51.830751</td>\n",
 792 |               "      <td>0.356198</td>\n",
 793 |               "      <td>0.525860</td>\n",
 794 |               "      <td>22.905161</td>\n",
 795 |               "      <td>0.469794</td>\n",
 796 |               "      <td>1.161075</td>\n",
 797 |               "      <td>0.616226</td>\n",
 798 |               "      <td>1.022606</td>\n",
 799 |               "      <td>0.612277</td>\n",
 800 |               "      <td>0.498835</td>\n",
 801 |               "    </tr>\n",
 802 |               "    <tr>\n",
 803 |               "      <th>min</th>\n",
 804 |               "      <td>29.000000</td>\n",
 805 |               "      <td>0.000000</td>\n",
 806 |               "      <td>0.000000</td>\n",
 807 |               "      <td>94.000000</td>\n",
 808 |               "      <td>126.000000</td>\n",
 809 |               "      <td>0.000000</td>\n",
 810 |               "      <td>0.000000</td>\n",
 811 |               "      <td>71.000000</td>\n",
 812 |               "      <td>0.000000</td>\n",
 813 |               "      <td>0.000000</td>\n",
 814 |               "      <td>0.000000</td>\n",
 815 |               "      <td>0.000000</td>\n",
 816 |               "      <td>0.000000</td>\n",
 817 |               "      <td>0.000000</td>\n",
 818 |               "    </tr>\n",
 819 |               "    <tr>\n",
 820 |               "      <th>25%</th>\n",
 821 |               "      <td>47.500000</td>\n",
 822 |               "      <td>0.000000</td>\n",
 823 |               "      <td>0.000000</td>\n",
 824 |               "      <td>120.000000</td>\n",
 825 |               "      <td>211.000000</td>\n",
 826 |               "      <td>0.000000</td>\n",
 827 |               "      <td>0.000000</td>\n",
 828 |               "      <td>133.500000</td>\n",
 829 |               "      <td>0.000000</td>\n",
 830 |               "      <td>0.000000</td>\n",
 831 |               "      <td>1.000000</td>\n",
 832 |               "      <td>0.000000</td>\n",
 833 |               "      <td>2.000000</td>\n",
 834 |               "      <td>0.000000</td>\n",
 835 |               "    </tr>\n",
 836 |               "    <tr>\n",
 837 |               "      <th>50%</th>\n",
 838 |               "      <td>55.000000</td>\n",
 839 |               "      <td>1.000000</td>\n",
 840 |               "      <td>1.000000</td>\n",
 841 |               "      <td>130.000000</td>\n",
 842 |               "      <td>240.000000</td>\n",
 843 |               "      <td>0.000000</td>\n",
 844 |               "      <td>1.000000</td>\n",
 845 |               "      <td>153.000000</td>\n",
 846 |               "      <td>0.000000</td>\n",
 847 |               "      <td>0.800000</td>\n",
 848 |               "      <td>1.000000</td>\n",
 849 |               "      <td>0.000000</td>\n",
 850 |               "      <td>2.000000</td>\n",
 851 |               "      <td>1.000000</td>\n",
 852 |               "    </tr>\n",
 853 |               "    <tr>\n",
 854 |               "      <th>75%</th>\n",
 855 |               "      <td>61.000000</td>\n",
 856 |               "      <td>1.000000</td>\n",
 857 |               "      <td>2.000000</td>\n",
 858 |               "      <td>140.000000</td>\n",
 859 |               "      <td>274.500000</td>\n",
 860 |               "      <td>0.000000</td>\n",
 861 |               "      <td>1.000000</td>\n",
 862 |               "      <td>166.000000</td>\n",
 863 |               "      <td>1.000000</td>\n",
 864 |               "      <td>1.600000</td>\n",
 865 |               "      <td>2.000000</td>\n",
 866 |               "      <td>1.000000</td>\n",
 867 |               "      <td>3.000000</td>\n",
 868 |               "      <td>1.000000</td>\n",
 869 |               "    </tr>\n",
 870 |               "    <tr>\n",
 871 |               "      <th>max</th>\n",
 872 |               "      <td>77.000000</td>\n",
 873 |               "      <td>1.000000</td>\n",
 874 |               "      <td>3.000000</td>\n",
 875 |               "      <td>200.000000</td>\n",
 876 |               "      <td>564.000000</td>\n",
 877 |               "      <td>1.000000</td>\n",
 878 |               "      <td>2.000000</td>\n",
 879 |               "      <td>202.000000</td>\n",
 880 |               "      <td>1.000000</td>\n",
 881 |               "      <td>6.200000</td>\n",
 882 |               "      <td>2.000000</td>\n",
 883 |               "      <td>4.000000</td>\n",
 884 |               "      <td>3.000000</td>\n",
 885 |               "      <td>1.000000</td>\n",
 886 |               "    </tr>\n",
 887 |               "  </tbody>\n",
 888 |               "</table>\n",
 889 |               "</div>\n",
 890 |               "      <button class=\"colab-df-convert\" onclick=\"convertToInteractive('df-cfc372bc-b811-4f6f-8396-95a5eae48508')\"\n",
 891 |               "              title=\"Convert this dataframe to an interactive table.\"\n",
 892 |               "              style=\"display:none;\">\n",
 893 |               "        \n",
 894 |               "  <svg xmlns=\"http://www.w3.org/2000/svg\" height=\"24px\"viewBox=\"0 0 24 24\"\n",
 895 |               "       width=\"24px\">\n",
 896 |               "    <path d=\"M0 0h24v24H0V0z\" fill=\"none\"/>\n",
 897 |               "    <path d=\"M18.56 5.44l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94zm-11 1L8.5 8.5l.94-2.06 2.06-.94-2.06-.94L8.5 2.5l-.94 2.06-2.06.94zm10 10l.94 2.06.94-2.06 2.06-.94-2.06-.94-.94-2.06-.94 2.06-2.06.94z\"/><path d=\"M17.41 7.96l-1.37-1.37c-.4-.4-.92-.59-1.43-.59-.52 0-1.04.2-1.43.59L10.3 9.45l-7.72 7.72c-.78.78-.78 2.05 0 2.83L4 21.41c.39.39.9.59 1.41.59.51 0 1.02-.2 1.41-.59l7.78-7.78 2.81-2.81c.8-.78.8-2.07 0-2.86zM5.41 20L4 18.59l7.72-7.72 1.47 1.35L5.41 20z\"/>\n",
 898 |               "  </svg>\n",
 899 |               "      </button>\n",
 900 |               "      \n",
 901 |               "  <style>\n",
 902 |               "    .colab-df-container {\n",
 903 |               "      display:flex;\n",
 904 |               "      flex-wrap:wrap;\n",
 905 |               "      gap: 12px;\n",
 906 |               "    }\n",
 907 |               "\n",
 908 |               "    .colab-df-convert {\n",
 909 |               "      background-color: #E8F0FE;\n",
 910 |               "      border: none;\n",
 911 |               "      border-radius: 50%;\n",
 912 |               "      cursor: pointer;\n",
 913 |               "      display: none;\n",
 914 |               "      fill: #1967D2;\n",
 915 |               "      height: 32px;\n",
 916 |               "      padding: 0 0 0 0;\n",
 917 |               "      width: 32px;\n",
 918 |               "    }\n",
 919 |               "\n",
 920 |               "    .colab-df-convert:hover {\n",
 921 |               "      background-color: #E2EBFA;\n",
 922 |               "      box-shadow: 0px 1px 2px rgba(60, 64, 67, 0.3), 0px 1px 3px 1px rgba(60, 64, 67, 0.15);\n",
 923 |               "      fill: #174EA6;\n",
 924 |               "    }\n",
 925 |               "\n",
 926 |               "    [theme=dark] .colab-df-convert {\n",
 927 |               "      background-color: #3B4455;\n",
 928 |               "      fill: #D2E3FC;\n",
 929 |               "    }\n",
 930 |               "\n",
 931 |               "    [theme=dark] .colab-df-convert:hover {\n",
 932 |               "      background-color: #434B5C;\n",
 933 |               "      box-shadow: 0px 1px 3px 1px rgba(0, 0, 0, 0.15);\n",
 934 |               "      filter: drop-shadow(0px 1px 2px rgba(0, 0, 0, 0.3));\n",
 935 |               "      fill: #FFFFFF;\n",
 936 |               "    }\n",
 937 |               "  </style>\n",
 938 |               "\n",
 939 |               "      <script>\n",
 940 |               "        const buttonEl =\n",
 941 |               "          document.querySelector('#df-cfc372bc-b811-4f6f-8396-95a5eae48508 button.colab-df-convert');\n",
 942 |               "        buttonEl.style.display =\n",
 943 |               "          google.colab.kernel.accessAllowed ? 'block' : 'none';\n",
 944 |               "\n",
 945 |               "        async function convertToInteractive(key) {\n",
 946 |               "          const element = document.querySelector('#df-cfc372bc-b811-4f6f-8396-95a5eae48508');\n",
 947 |               "          const dataTable =\n",
 948 |               "            await google.colab.kernel.invokeFunction('convertToInteractive',\n",
 949 |               "                                                     [key], {});\n",
 950 |               "          if (!dataTable) return;\n",
 951 |               "\n",
 952 |               "          const docLinkHtml = 'Like what you see? Visit the ' +\n",
 953 |               "            '<a target=\"_blank\" href=https://colab.research.google.com/notebooks/data_table.ipynb>data table notebook</a>'\n",
 954 |               "            + ' to learn more about interactive tables.';\n",
 955 |               "          element.innerHTML = '';\n",
 956 |               "          dataTable['output_type'] = 'display_data';\n",
 957 |               "          await google.colab.output.renderOutput(dataTable, element);\n",
 958 |               "          const docLink = document.createElement('div');\n",
 959 |               "          docLink.innerHTML = docLinkHtml;\n",
 960 |               "          element.appendChild(docLink);\n",
 961 |               "        }\n",
 962 |               "      </script>\n",
 963 |               "    </div>\n",
 964 |               "  </div>\n",
 965 |               "  "
 966 |             ]
 967 |           },
 968 |           "metadata": {},
 969 |           "execution_count": 8
 970 |         }
 971 |       ]
 972 |     },
 973 |     {
 974 |       "cell_type": "code",
 975 |       "metadata": {
 976 |         "colab": {
 977 |           "base_uri": "https://localhost:8080/"
 978 |         },
 979 |         "id": "4InaOSIUsfWP",
 980 |         "outputId": "acf2ef21-c6ef-4d3a-a14c-0399e02bcb6a"
 981 |       },
 982 |       "source": [
 983 |         "# checking the distribution of Target Variable\n",
 984 |         "heart_data['target'].value_counts()"
 985 |       ],
 986 |       "execution_count": null,
 987 |       "outputs": [
 988 |         {
 989 |           "output_type": "execute_result",
 990 |           "data": {
 991 |             "text/plain": [
 992 |               "1    165\n",
 993 |               "0    138\n",
 994 |               "Name: target, dtype: int64"
 995 |             ]
 996 |           },
 997 |           "metadata": {},
 998 |           "execution_count": 9
 999 |         }
1000 |       ]
1001 |     },
1002 |     {
1003 |       "cell_type": "markdown",
1004 |       "metadata": {
1005 |         "id": "aSOBu4qDtJy5"
1006 |       },
1007 |       "source": [
1008 |         "1 --> Defective Heart\n",
1009 |         "\n",
1010 |         "0 --> Healthy Heart"
1011 |       ]
1012 |     },
1013 |     {
1014 |       "cell_type": "markdown",
1015 |       "metadata": {
1016 |         "id": "tW8i4igjtPRC"
1017 |       },
1018 |       "source": [
1019 |         "Splitting the Features and Target"
1020 |       ]
1021 |     },
1022 |     {
1023 |       "cell_type": "code",
1024 |       "metadata": {
1025 |         "id": "Q6yfbswrs7m3"
1026 |       },
1027 |       "source": [
1028 |         "X = heart_data.drop(columns='target', axis=1)\n",
1029 |         "Y = heart_data['target']"
1030 |       ],
1031 |       "execution_count": null,
1032 |       "outputs": []
1033 |     },
1034 |     {
1035 |       "cell_type": "code",
1036 |       "metadata": {
1037 |         "colab": {
1038 |           "base_uri": "https://localhost:8080/"
1039 |         },
1040 |         "id": "XJoCp4ZKtpZy",
1041 |         "outputId": "aa2ea3a8-6917-4780-bc6f-ccaaf3df6dca"
1042 |       },
1043 |       "source": [
1044 |         "print(X)"
1045 |       ],
1046 |       "execution_count": null,
1047 |       "outputs": [
1048 |         {
1049 |           "output_type": "stream",
1050 |           "name": "stdout",
1051 |           "text": [
1052 |             "     age  sex  cp  trestbps  chol  fbs  restecg  thalach  exang  oldpeak  \\\n",
1053 |             "0     63    1   3       145   233    1        0      150      0      2.3   \n",
1054 |             "1     37    1   2       130   250    0        1      187      0      3.5   \n",
1055 |             "2     41    0   1       130   204    0        0      172      0      1.4   \n",
1056 |             "3     56    1   1       120   236    0        1      178      0      0.8   \n",
1057 |             "4     57    0   0       120   354    0        1      163      1      0.6   \n",
1058 |             "..   ...  ...  ..       ...   ...  ...      ...      ...    ...      ...   \n",
1059 |             "298   57    0   0       140   241    0        1      123      1      0.2   \n",
1060 |             "299   45    1   3       110   264    0        1      132      0      1.2   \n",
1061 |             "300   68    1   0       144   193    1        1      141      0      3.4   \n",
1062 |             "301   57    1   0       130   131    0        1      115      1      1.2   \n",
1063 |             "302   57    0   1       130   236    0        0      174      0      0.0   \n",
1064 |             "\n",
1065 |             "     slope  ca  thal  \n",
1066 |             "0        0   0     1  \n",
1067 |             "1        0   0     2  \n",
1068 |             "2        2   0     2  \n",
1069 |             "3        2   0     2  \n",
1070 |             "4        2   0     2  \n",
1071 |             "..     ...  ..   ...  \n",
1072 |             "298      1   0     3  \n",
1073 |             "299      1   0     3  \n",
1074 |             "300      1   2     3  \n",
1075 |             "301      1   1     3  \n",
1076 |             "302      1   1     2  \n",
1077 |             "\n",
1078 |             "[303 rows x 13 columns]\n"
1079 |           ]
1080 |         }
1081 |       ]
1082 |     },
1083 |     {
1084 |       "cell_type": "code",
1085 |       "metadata": {
1086 |         "colab": {
1087 |           "base_uri": "https://localhost:8080/"
1088 |         },
1089 |         "id": "nukuj-YItq1w",
1090 |         "outputId": "9329a137-443a-490c-bcf9-20daee07a300"
1091 |       },
1092 |       "source": [
1093 |         "print(Y)"
1094 |       ],
1095 |       "execution_count": null,
1096 |       "outputs": [
1097 |         {
1098 |           "output_type": "stream",
1099 |           "name": "stdout",
1100 |           "text": [
1101 |             "0      1\n",
1102 |             "1      1\n",
1103 |             "2      1\n",
1104 |             "3      1\n",
1105 |             "4      1\n",
1106 |             "      ..\n",
1107 |             "298    0\n",
1108 |             "299    0\n",
1109 |             "300    0\n",
1110 |             "301    0\n",
1111 |             "302    0\n",
1112 |             "Name: target, Length: 303, dtype: int64\n"
1113 |           ]
1114 |         }
1115 |       ]
1116 |     },
1117 |     {
1118 |       "cell_type": "markdown",
1119 |       "metadata": {
1120 |         "id": "_EcjSE3Et18n"
1121 |       },
1122 |       "source": [
1123 |         "Splitting the Data into Training data & Test Data"
1124 |       ]
1125 |     },
1126 |     {
1127 |       "cell_type": "code",
1128 |       "metadata": {
1129 |         "id": "a-UUfRUxtuga"
1130 |       },
1131 |       "source": [
1132 |         "X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.2, stratify=Y, random_state=2)"
1133 |       ],
1134 |       "execution_count": null,
1135 |       "outputs": []
1136 |     },
1137 |     {
1138 |       "cell_type": "code",
1139 |       "metadata": {
1140 |         "colab": {
1141 |           "base_uri": "https://localhost:8080/"
1142 |         },
1143 |         "id": "x7PrjC6zuf6X",
1144 |         "outputId": "985f083d-068e-49ec-e05d-73ec42da6535"
1145 |       },
1146 |       "source": [
1147 |         "print(X.shape, X_train.shape, X_test.shape)"
1148 |       ],
1149 |       "execution_count": null,
1150 |       "outputs": [
1151 |         {
1152 |           "output_type": "stream",
1153 |           "name": "stdout",
1154 |           "text": [
1155 |             "(303, 13) (242, 13) (61, 13)\n"
1156 |           ]
1157 |         }
1158 |       ]
1159 |     },
1160 |     {
1161 |       "cell_type": "markdown",
1162 |       "metadata": {
1163 |         "id": "beSkZmpVuvn9"
1164 |       },
1165 |       "source": [
1166 |         "Model Training"
1167 |       ]
1168 |     },
1169 |     {
1170 |       "cell_type": "code",
1171 |       "metadata": {
1172 |         "id": "4-Md74FYuqNL"
1173 |       },
1174 |       "source": [
1175 |         "model = LogisticRegression(max_iter=1000)"
1176 |       ],
1177 |       "execution_count": null,
1178 |       "outputs": []
1179 |     },
1180 |     {
1181 |       "cell_type": "code",
1182 |       "metadata": {
1183 |         "colab": {
1184 |           "base_uri": "https://localhost:8080/"
1185 |         },
1186 |         "id": "kCdHYxGUu7XD",
1187 |         "outputId": "9c90961d-3dd0-41ab-e2ff-9d6d58b10d86"
1188 |       },
1189 |       "source": [
1190 |         "# training the LogisticRegression model with Training data\n",
1191 |         "model.fit(X_train, Y_train)"
1192 |       ],
1193 |       "execution_count": null,
1194 |       "outputs": [
1195 |         {
1196 |           "output_type": "execute_result",
1197 |           "data": {
1198 |             "text/plain": [
1199 |               "LogisticRegression(max_iter=1000)"
1200 |             ]
1201 |           },
1202 |           "metadata": {},
1203 |           "execution_count": 16
1204 |         }
1205 |       ]
1206 |     },
1207 |     {
1208 |       "cell_type": "markdown",
1209 |       "metadata": {
1210 |         "id": "ZYIw8Gi9vXfU"
1211 |       },
1212 |       "source": [
1213 |         "Model Evaluation"
1214 |       ]
1215 |     },
1216 |     {
1217 |       "cell_type": "markdown",
1218 |       "metadata": {
1219 |         "id": "wmxAekfZvZa9"
1220 |       },
1221 |       "source": [
1222 |         "**Accuracy Score**"
1223 |       ]
1224 |     },
1225 |     {
1226 |       "cell_type": "code",
1227 |       "source": [
1228 |         "from sklearn.metrics import accuracy_score"
1229 |       ],
1230 |       "metadata": {
1231 |         "id": "aMMAnoWYFQY5"
1232 |       },
1233 |       "execution_count": null,
1234 |       "outputs": []
1235 |     },
1236 |     {
1237 |       "cell_type": "code",
1238 |       "metadata": {
1239 |         "id": "g19JaUTMvPKy",
1240 |         "colab": {
1241 |           "base_uri": "https://localhost:8080/"
1242 |         },
1243 |         "outputId": "b0767826-8d91-471f-fcbf-a12dce724760"
1244 |       },
1245 |       "source": [
1246 |         "# accuracy on training data\n",
1247 |         "X_train_prediction = model.predict(X_train)\n",
1248 |         "training_data_accuracy = accuracy_score(Y_train, X_train_prediction)\n",
1249 |         "print(training_data_accuracy)"
1250 |       ],
1251 |       "execution_count": null,
1252 |       "outputs": [
1253 |         {
1254 |           "output_type": "stream",
1255 |           "name": "stdout",
1256 |           "text": [
1257 |             "0.8553719008264463\n"
1258 |           ]
1259 |         }
1260 |       ]
1261 |     },
1262 |     {
1263 |       "cell_type": "code",
1264 |       "metadata": {
1265 |         "colab": {
1266 |           "base_uri": "https://localhost:8080/"
1267 |         },
1268 |         "id": "uQBZvBh8v7R_",
1269 |         "outputId": "1d5402ac-000f-4ba1-dd95-b66c2a9b6994"
1270 |       },
1271 |       "source": [
1272 |         "print('Accuracy on Training data : ', round(training_data_accuracy*100, 2), '%')"
1273 |       ],
1274 |       "execution_count": null,
1275 |       "outputs": [
1276 |         {
1277 |           "output_type": "stream",
1278 |           "name": "stdout",
1279 |           "text": [
1280 |             "Accuracy on Training data :  85.54 %\n"
1281 |           ]
1282 |         }
1283 |       ]
1284 |     },
1285 |     {
1286 |       "cell_type": "code",
1287 |       "metadata": {
1288 |         "id": "mDONDJdlwBIO",
1289 |         "colab": {
1290 |           "base_uri": "https://localhost:8080/"
1291 |         },
1292 |         "outputId": "458c59fe-e403-4528-e904-6666177cfc9a"
1293 |       },
1294 |       "source": [
1295 |         "# accuracy on test data\n",
1296 |         "X_test_prediction = model.predict(X_test)\n",
1297 |         "test_data_accuracy = accuracy_score(Y_test, X_test_prediction)\n",
1298 |         "print(test_data_accuracy)"
1299 |       ],
1300 |       "execution_count": null,
1301 |       "outputs": [
1302 |         {
1303 |           "output_type": "stream",
1304 |           "name": "stdout",
1305 |           "text": [
1306 |             "0.8032786885245902\n"
1307 |           ]
1308 |         }
1309 |       ]
1310 |     },
1311 |     {
1312 |       "cell_type": "code",
1313 |       "metadata": {
1314 |         "colab": {
1315 |           "base_uri": "https://localhost:8080/"
1316 |         },
1317 |         "id": "_MBS-OqdwYpf",
1318 |         "outputId": "0b7f8490-91e8-466a-dc5d-b4227452f1c3"
1319 |       },
1320 |       "source": [
1321 |         "print('Accuracy on Test data : ', round(test_data_accuracy*100, 2), '%')"
1322 |       ],
1323 |       "execution_count": null,
1324 |       "outputs": [
1325 |         {
1326 |           "output_type": "stream",
1327 |           "name": "stdout",
1328 |           "text": [
1329 |             "Accuracy on Test data :  80.33 %\n"
1330 |           ]
1331 |         }
1332 |       ]
1333 |     },
1334 |     {
1335 |       "cell_type": "markdown",
1336 |       "source": [
1337 |         "**Confuaion Matrix**"
1338 |       ],
1339 |       "metadata": {
1340 |         "id": "hOqOj3xEEqvW"
1341 |       }
1342 |     },
1343 |     {
1344 |       "cell_type": "code",
1345 |       "source": [
1346 |         "from sklearn.metrics import confusion_matrix"
1347 |       ],
1348 |       "metadata": {
1349 |         "id": "pZSEUHp7Eqcr"
1350 |       },
1351 |       "execution_count": null,
1352 |       "outputs": []
1353 |     },
1354 |     {
1355 |       "cell_type": "code",
1356 |       "source": [
1357 |         "cf_matrix = confusion_matrix(Y_test, X_test_prediction)\n",
1358 |         "\n",
1359 |         "print(cf_matrix)"
1360 |       ],
1361 |       "metadata": {
1362 |         "colab": {
1363 |           "base_uri": "https://localhost:8080/"
1364 |         },
1365 |         "id": "cXkoIIujFeQn",
1366 |         "outputId": "ef1f91f5-7f29-4500-a649-a119f34fc04f"
1367 |       },
1368 |       "execution_count": null,
1369 |       "outputs": [
1370 |         {
1371 |           "output_type": "stream",
1372 |           "name": "stdout",
1373 |           "text": [
1374 |             "[[22  6]\n",
1375 |             " [ 6 27]]\n"
1376 |           ]
1377 |         }
1378 |       ]
1379 |     },
1380 |     {
1381 |       "cell_type": "code",
1382 |       "source": [
1383 |         "tn, fp, fn, tp = cf_matrix.ravel()\n",
1384 |         "\n",
1385 |         "print(tn, fp, fn, tp)"
1386 |       ],
1387 |       "metadata": {
1388 |         "colab": {
1389 |           "base_uri": "https://localhost:8080/"
1390 |         },
1391 |         "id": "tpmo_nY8FyZl",
1392 |         "outputId": "34ab13d8-be83-4381-f1f7-17c168e389b3"
1393 |       },
1394 |       "execution_count": null,
1395 |       "outputs": [
1396 |         {
1397 |           "output_type": "stream",
1398 |           "name": "stdout",
1399 |           "text": [
1400 |             "22 6 6 27\n"
1401 |           ]
1402 |         }
1403 |       ]
1404 |     },
1405 |     {
1406 |       "cell_type": "code",
1407 |       "source": [
1408 |         "import seaborn as sns\n",
1409 |         "sns.heatmap(cf_matrix, annot=True)"
1410 |       ],
1411 |       "metadata": {
1412 |         "colab": {
1413 |           "base_uri": "https://localhost:8080/",
1414 |           "height": 282
1415 |         },
1416 |         "id": "i4ffPhNZGBR_",
1417 |         "outputId": "f1a0fc3e-8f55-4b19-d6bc-a62518a3c48b"
1418 |       },
1419 |       "execution_count": null,
1420 |       "outputs": [
1421 |         {
1422 |           "output_type": "execute_result",
1423 |           "data": {
1424 |             "text/plain": [
1425 |               "<matplotlib.axes._subplots.AxesSubplot at 0x7f2e02c0fcd0>"
1426 |             ]
1427 |           },
1428 |           "metadata": {},
1429 |           "execution_count": 25
1430 |         },
1431 |         {
1432 |           "output_type": "display_data",
1433 |           "data": {
1434 |             "text/plain": [
1435 |               "<Figure size 432x288 with 2 Axes>"
1436 |             ],
1437 |             "image/png": "iVBORw0KGgoAAAANSUhEUgAAAWQAAAD4CAYAAADbyJysAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4yLjIsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+WH4yJAAAVZElEQVR4nO3deZBdZZnH8e+PTgclCwYRhBDZyVSimNRAUAGHNYQeFBdKE5WKGmi0ZGQrAaUAB6zSKiDMjFJKC2GpweDMEEZGAiFm0MDIkrAHwhq27rQJEEwgQZLu+8wffRIu4W7duen73sPvY73V97xne8pKPT6+5z3vUURgZmaNt02jAzAzsz5OyGZmiXBCNjNLhBOymVkinJDNzBIxZGvfYN3Mkz2Nw95j5LlzGx2CJahnfZe29BobXl1Wc85p3XGvLb5fPblCNjNLxFavkM3MBlWht9ERDJgTspnlS29PoyMYMCdkM8uViEKjQxgwJ2Qzy5eCE7KZWRpcIZuZJcIP9czMEuEK2cwsDeFZFmZmifBDPTOzRHjIwswsEX6oZ2aWCFfIZmaJ8EM9M7NE+KGemVkaIjyGbGaWhiYeQ/YC9WaWL4VC7a0CSWMk3SnpCUmPSzot6/+xpC5JD2etrcz5UyQ9JelZSefWErorZDPLl/pVyD3AWRHxoKQRwAOS5mf7Lo+IS8udKKkFuAI4GugEFkm6JSKeqHRDJ2Qzy5feDXW5TER0A93Z7zckLQVG13j6JODZiFgGIOlG4HigYkL2kIWZ5Us/hiwktUtaXNTaS11S0h7AROC+rOtUSY9KmiVpVIlTRgMvF213UkMyd0I2s3yJQs0tIjoi4oCi1rH55SQNB24CTo+INcAvgb2BCfRV0JfVK3QPWZhZvtRxHrKkVvqS8Q0RMQcgIlYU7f818PsSp3YBY4q2d8v6KnKFbGb5Ur9ZFgKuBpZGxMyi/l2KDvsisKTE6YuAfSXtKWkoMBW4pVrorpDNLFeiTg/1gIOBE4HHJD2c9f0ImCZpAhDAC8ApAJJ2Ba6KiLaI6JF0KjAPaAFmRcTj1W7ohGxm+VKnaW8RcTegErvmljl+OdBWtD233LHlOCGbWb54LQszs0Q08avTTshmli+ukM3MEuEK2cwsET1eoN7MLA2ukM3MEuExZDOzRLhCNjNLhCtkM7NEuEI2M0uEZ1mYmSUiotERDJgTspnli8eQzcwS4YRsZpYIP9QzM0tEb2+jIxgwJ2QzyxcPWZiZJaJOCVnSGOB6YGf6PtfUERH/KukS4HPAeuA54FsR8dcS578AvAH0Aj0RcUC1e/ojp2aWL1GovVXWA5wVEeOATwHfkzQOmA98PCL2B54GfljhGodHxIRakjG4QjaznIlCfeYhR0Q30J39fkPSUmB0RNxRdNi9wAl1uSGukM0sbwqFmpukdkmLi1p7qUtK2gOYCNy32a5vA7eViSSAOyQ9UO66m3OFbGb50o9ZFhHRAXRUOkbScOAm4PSIWFPUfx59wxo3lDn1kIjokrQTMF/SkxGxsNK9XCGbWb70o0KuRlIrfcn4hoiYU9T/TeA44OsRpd/Vjoiu7O9K4GZgUrX7OSGbWb7UKSFLEnA1sDQiZhb1TwHOBj4fEevKnDtM0oiNv4HJwJJqoXvIYivR8FEMPfbbaLuRENDz2EJ6HlpA62dPoGWv/aG3l8LqV1g/7xp4+61Gh2sNsv32I+m48lLGjx9LRHDyyWdx730PNDqs5la/xYUOBk4EHpP0cNb3I+DfgG3pG4YAuDciviNpV+CqiGijb6rczdn+IcBvIuL2ajd0Qt5KIgqs/9N/EitfgtZt+cA3zqf3xSfoffEJNtw1B6JA66FfpnVSGxvuuqnR4VqDXD7zIubNu5OvTm2ntbWV7bb7YKNDan51moccEXcDKrFrbpnjlwNt2e9lwCf7e08PWWwta1f3JWOADW9TeK0bDf8QhRef2DT/sdC9DA0f1cAgrZFGjhzBoYccxKxrZgOwYcMGVq9eU+Usq6oQtbfEVK2QJf0dcDwwOuvqAm6JiKVbM7A80cgPs81OYyj85fl39Q8ZfzA9Ty9qUFTWaHvu+TFeffU1rr7qcvbffxwPPvgoZ5x5AevWeQhrizTxWhYVK2RJ5wA30le23581AbMlnVvhvE1z+2bd82Q9420+rduy7ee+y4Y//hbW/21T95BJbUQU6F26+bRGe78Y0tLCxImf4Morr+fAScewdu06zjn71EaH1fSiUKi5paZahTwDGB8RG4o7Jc0EHgd+Vuqk4rl962aenN7/Lxgs27Sw7ee+S8/S++h99qFN3S3jPkPLXvvz9n/NrHCy5V1nVzednd3cv6jv38acObdy9g+ckLdYgkMRtao2hlwAdi3Rv0u2zyoYOnk6hVXd9Dw4f1PfNnuMp/XAY3j7d7+AnvUNjM4abcWKV+jsXM5+++0NwBFHHMLSpU83OKocqN9aFoOuWoV8OrBA0jPAy1nfx4B9AP9PeQXb7LoPQ8Z9msIrnbR84wIA1v/fHIYePg1ahvCBL58JQG/3MjYs+PdGhmoNdNoZ53P9dT9n6NBWnn/+JWacdGajQ2p+TVwhV0zIEXG7pP3oe8Ok+KHeooho3pHzQVBY/izrZp78nv6/PX9eA6KxVD3yyON86tNtjQ4jX3qaNzVVnWUREQX6VjQyM0tfgkMRtfKLIWaWL3kdsjAzazYpTmerlROymeWLK2Qzs0Q4IZuZJaKJX512QjazXKnXN/UawQnZzPLFCdnMLBGeZWFmlogmrpC9QL2Z5UudFqiXNEbSnZKekPS4pNOy/h0kzZf0TPa35FcmJE3PjnlG0vRaQndCNrNcid5Cza2KHuCsiBgHfAr4nqRxwLnAgojYF1iQbb+LpB2AC4GD6FsL6MJyibuYE7KZ5UudKuSI6I6IB7PfbwBL6Vtk7Xjguuyw64AvlDj9GGB+RKyKiNeB+cCUaqF7DNnMcqU/094ktQPtRV0d2Qc2Nj9uD2AicB+wc0R0Z7v+Qt8Xpjc3mneWLAbo5J0VM8tyQjazfOlHQi7+ulE5koYDNwGnR8Qa6Z0PUUdESKrbU0QPWZhZvhT60aqQ1EpfMr4hIuZk3Ssk7ZLt3wVYWeLULmBM0fZuWV9FTshmlivRU6i5VaK+UvhqYGlEFH8A8xZg46yJ6cDvSpw+D5gsaVT2MG9y1leRE7KZ5Uv9KuSDgROBIyQ9nLU2+j7ufHT2abujsm0kHSDpKoCIWAVcDCzK2kVZX0UeQzazXKnXWhYRcTegMruPLHH8YuCkou1ZwKz+3NMJ2czypXnfnHZCNrN88WpvZmapcIVsZpaG6Gl0BAPnhGxmuRKukM3MEuGEbGaWBlfIZmaJcEI2M0tE9JZ7lyN9TshmliuukM3MEhEFV8hmZklwhWxmlogIV8hmZklwhWxmloiCZ1mYmaXBD/XMzBLhhGxmloio43LIkmYBxwErI+LjWd9vgbHZIR8C/hoRE0qc+wLwBtAL9ETEAdXu54RsZrlS5wr5WuAXwPWbrh/x1Y2/JV0GrK5w/uER8WqtN3NCNrNcqee0t4hYKGmPUvuyr1J/BTiiXvfzV6fNLFd6e1Vzk9QuaXFRa+/HrQ4FVkTEM2X2B3CHpAdqva4rZDPLlf5UyBHRAXQM8FbTgNkV9h8SEV2SdgLmS3oyIhZWuqATspnlymDMspA0BPgS8Pdl44joyv6ulHQzMAmomJA9ZGFmuRJRe9sCRwFPRkRnqZ2ShkkasfE3MBlYUu2iTshmlitRUM2tGkmzgXuAsZI6Jc3Idk1ls+EKSbtKmptt7gzcLekR4H7g1oi4vdr9PGRhZrnSW6hfnRkR08r0f7NE33KgLfu9DPhkf+/nhGxmuVLPF0MGmxOymeVKwctvmpmlweshm5klwkMWFYw8d271g+x9563ldzU6BMspD1mYmSWinrMsBpsTspnlShOPWDghm1m+eMjCzCwRnmVhZpaIJv7otBOymeVL4ArZzCwJPR6yMDNLgytkM7NEeAzZzCwRrpDNzBLRzBVy875jaGZWQi+quVUjaZaklZKWFPX9WFKXpIez1lbm3CmSnpL0rKRza4ndCdnMcqWg2lsNrgWmlOi/PCImZO09K6hJagGuAI4FxgHTJI2rdjMnZDPLlQKquVUTEQuBVQMIYxLwbEQsi4j1wI3A8dVOckI2s1yJfrQtcKqkR7MhjVEl9o8GXi7a7sz6KnJCNrNcKfSjSWqXtLiotddwi18CewMTgG7gsnrF7lkWZpYrBdU+7S0iOoCO/lw/IlZs/C3p18DvSxzWBYwp2t4t66vIFbKZ5UpvP9pASNqlaPOLwJIShy0C9pW0p6ShwFTglmrXdoVsZrlS4+yJmkiaDRwG7CipE7gQOEzSBPqGoV8ATsmO3RW4KiLaIqJH0qnAPKAFmBURj1e7nxOymeVKLbMnahUR00p0X13m2OVAW9H2XKBfHxV1QjazXPEnnMzMElHPIYvB5oRsZrnSzGtZOCGbWa70ukI2M0uDK2Qzs0Q4IZuZJaKJP6nnhGxm+eIK2cwsEQN9JToFTshmliueh2xmlggPWZiZJcIJ2cwsEV7LwswsER5DNjNLhGdZmJklotDEgxZOyGaWK838UM/f1DOzXIl+tGokzZK0UtKSor5LJD0p6VFJN0v6UJlzX5D0mKSHJS2uJXYnZDPLlUI/Wg2uBaZs1jcf+HhE7A88DfywwvmHR8SEiDiglps5IZtZrvQoam7VRMRCYNVmfXdERE+2eS+wW71id0I2s1zpz5CFpHZJi4taez9v923gtgqh3CHpgVqv64d6ZpYr/XmoFxEdQMdA7iPpPKAHuKHMIYdERJeknYD5kp7MKu6yXCGbWa4UiJrbQEn6JnAc8PWIKHmhiOjK/q4EbgYmVbuuE7KZ5Uo9Z1mUImkKcDbw+YhYV+aYYZJGbPwNTAaWlDq2mBOymeVKPWdZSJoN3AOMldQpaQbwC2AEfcMQD0v6VXbsrpLmZqfuDNwt6RHgfuDWiLi92v08hmxmudJbxzf1ImJaie6ryxy7HGjLfi8DPtnf+zkhm1muNPObek7IZpYr4bUszMzS4ArZqtp++5F0XHkp48ePJSI4+eSzuPe+Bxodlg2i7hWv8KOLL+W1119HiBOOP5YTv/IFzjr/p7zwUicAb7z5JiOGD+em665ocLTNy6u9WVWXz7yIefPu5KtT22ltbWW77T7Y6JBskA1paeEH/3Qy48buw9q16/jKjO/zmQMnctnF7yyFcMnPf83wYds1MMrm17zp2NPeBsXIkSM49JCDmHXNbAA2bNjA6tVrGhyVDbaP7LgD48buA8CwYdux1+5jWPHKa5v2RwS3/+9C2o4+rEER5kMPUXNLjRPyINhzz4/x6quvcfVVl7Po/nlc+atLXCG/z3V1r2DpM8+x//ixm/oeeGQJHx41it3HjG5gZM0v+vGf1Aw4IUv6VoV9mxbsKBTWDvQWuTGkpYWJEz/BlVdez4GTjmHt2nWcc/apjQ7LGmTdurc447yfcM73T2H4sGGb+ufO/yNtR/9DAyPLhzovvzmotqRC/udyOyKiIyIOiIgDttlmWLnD3jc6u7rp7Ozm/kUPATBnzq1MnPCJBkdljbChp4fTz/sJ/zj5cI4+7OBN/T09vfzhT39mypGfbWB0+dDMFXLFh3qSHi23i75XA60GK1a8Qmfncvbbb2+efvo5jjjiEJYufbrRYdkgiwgu+Om/sNfuY5g+9Uvv2nfv4ofYa/fd+OhOH2lQdPmRYuVbq2qzLHYGjgFe36xfwJ+3SkQ5ddoZ53P9dT9n6NBWnn/+JWacdGajQ7JB9tCjj/M/ty9g37334MvTvwfAaadM57OfmcRtf/gTxx51WGMDzIne0ouvNQWVWTmub6d0NXBNRNxdYt9vIuJr1W4wZOjo5v1vx7aat5bf1egQLEGtO+6lLb3G13b/Ys055zcv3rzF96unihVyRMyosK9qMjYzG2wpjg3Xyi+GmFmu5HkM2cysqfjVaTOzRHjIwswsEc08y8KvTptZrtTzI6eSZklaKWlJUd8OkuZLeib7O6rMudOzY56RNL2W2J2QzSxX6vzq9LXAlM36zgUWRMS+wIJs+10k7QBcCBxE39emLyyXuIs5IZtZrtTz1emIWAis2qz7eOC67Pd1wBdKnHoMMD8iVkXE68B83pvY38MJ2cxypT9DFsULoWWtvYZb7BwR3dnvv1B6GYnRwMtF251ZX0V+qGdmuVLp7eMSx3YAHVtwr5BUt6eIrpDNLFd6iZrbAK2QtAtA9ndliWO6gDFF27tlfRU5IZtZrtRzlkUZtwAbZ01MB35X4ph5wGRJo7KHeZOzvoqckM0sVyKi5laNpNnAPcBYSZ2SZgA/A46W9AxwVLaNpAMkXZXFsAq4GFiUtYuyvoo8hmxmuVLPV6cjYlqZXUeWOHYxcFLR9ixgVn/u54RsZrniV6fNzBLRzK9OOyGbWa54tTczs0Q4IZuZJaI/L4akxgnZzHLFFbKZWSI8y8LMLBG90bxf1XNCNrNc8RiymVkiPIZsZpYIjyGbmSWi4CELM7M0uEI2M0uEZ1mYmSXCQxZmZonwkIWZWSKauUL2J5zMLFeiH/+pRNJYSQ8XtTWSTt/smMMkrS465oItid0VspnlSm/01uU6EfEUMAFAUgt9X42+ucShd0XEcfW4pxOymeXKVnp1+kjguYh4cWtcfCMPWZhZrhSImpukdkmLi1p7mctOBWaX2fdpSY9Iuk3S+C2J3RWymeVKfyrkiOgAOiodI2ko8HnghyV2PwjsHhFvSmoD/hvYt/Zo380VspnlSiGi5lajY4EHI2LF5jsiYk1EvJn9ngu0StpxoLE7IZtZrtRrlkWRaZQZrpD0UUnKfk+iL6e+NtDYPWRhZrlSz1enJQ0DjgZOKer7DkBE/Ao4AfiupB7gLWBqbMFTRW3txZyHDB3dvLO0bat5a/ldjQ7BEtS6417a0mvsOHK/mnPOq2ue3uL71ZMrZDPLlWZ+U88J2cxyxZ9wMjNLhD/hZGaWCFfIZmaJ8AL1ZmaJ8EM9M7NEeMjCzCwR/mKImVkiXCGbmSWimceQt/qr0/YOSe3Zcn9mm/jfhW3k1d4GV7nFr+39zf8uDHBCNjNLhhOymVkinJAHl8cJrRT/uzDAD/XMzJLhCtnMLBFOyGZmiXBCHiSSpkh6StKzks5tdDzWeJJmSVopaUmjY7E0OCEPAkktwBX0fU58HDBN0rjGRmUJuBaY0uggLB1OyINjEvBsRCyLiPXAjcDxDY7JGiwiFgKrGh2HpcMJeXCMBl4u2u7M+szMNnFCNjNLhBPy4OgCxhRt75b1mZlt4oQ8OBYB+0raU9JQYCpwS4NjMrPEOCEPgojoAU4F5gFLgf+IiMcbG5U1mqTZwD3AWEmdkmY0OiZrLL86bWaWCFfIZmaJcEI2M0uEE7KZWSKckM3MEuGEbGaWCCdkM7NEOCGbmSXi/wFdHVEE8LeS2QAAAABJRU5ErkJggg==\n"
1438 |           },
1439 |           "metadata": {
1440 |             "needs_background": "light"
1441 |           }
1442 |         }
1443 |       ]
1444 |     },
1445 |     {
1446 |       "cell_type": "markdown",
1447 |       "source": [
1448 |         "confusion matrix for multi class classification: https://colab.research.google.com/drive/17FViiMJbJXQ5s9GOW94emoHcCKUcYr3l?usp=sharing"
1449 |       ],
1450 |       "metadata": {
1451 |         "id": "yFibQac0G4fh"
1452 |       }
1453 |     },
1454 |     {
1455 |       "cell_type": "code",
1456 |       "source": [],
1457 |       "metadata": {
1458 |         "id": "fr6QfOeqGr_3"
1459 |       },
1460 |       "execution_count": null,
1461 |       "outputs": []
1462 |     }
1463 |   ]
1464 | }


--------------------------------------------------------------------------------